File tree: 1 file changed, +13 -0 lines changed
addons/hf-llm-models/templates
1 file changed, +13 -0 lines changed
Columns: original file line number | diff line number | diff line change
@@ -69,12 +69,19 @@ spec:
69
69
- --tensor-parallel-size={{ .Values.tensorParallelSize }}
70
70
{{- if .Values.maxModelLen }}
71
71
- --max-model-len={{ .Values.maxModelLen }}
72
+ {{- end }}
73
+ {{- if .Values.extraArgs }}
74
+ {{- range .Values.extraArgs }}
75
+ - {{ . }}
76
+ {{- end }}
72
77
{{- end }}
73
78
image : {{ .Values.vllmImage }}
74
79
imagePullPolicy : IfNotPresent
75
80
env :
76
81
- name : HF_TOKEN
77
82
value : {{ .Values.huggingFaceToken }}
83
+ - name : NCCL_DEBUG
84
+ value : INFO
78
85
ports :
79
86
- containerPort : 8000
80
87
protocol : TCP
@@ -105,13 +112,19 @@ spec:
105
112
nvidia.com/gpu : {{ .Values.resources.limits.nvidiaGpu }}
106
113
{{- end }}
107
114
volumeMounts :
115
+ - name : dshm
116
+ mountPath : /dev/shm
108
117
- name : model-volume
109
118
mountPath : {{ .Values.modelDir }}
110
119
name : vllm
111
120
securityContext :
112
121
allowPrivilegeEscalation : false
113
122
terminationGracePeriodSeconds : 10
114
123
volumes :
124
+ - name : dshm
125
+ emptyDir :
126
+ medium : Memory
127
+ sizeLimit : 4Gi
115
128
- name : model-volume
116
129
persistentVolumeClaim :
117
130
claimName : " {{ .Release.Name }}-hf-llm"
You can’t perform that action at this time.
0 commit comments