Skip to content

Commit a454098

Browse files
authored
add deployment strategy (#247)
1 parent 9c8a748 commit a454098

3 files changed

Lines changed: 38 additions & 0 deletions

File tree

charts/llm-d-modelservice/templates/decode-deployment.yaml

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -21,6 +21,10 @@ metadata:
2121
{{- end }}
2222
spec:
2323
replicas: {{ ternary .Values.decode.replicas 1 (hasKey .Values.decode "replicas") }}
24+
{{- if .Values.decode.strategy }}
25+
strategy:
26+
{{- toYaml .Values.decode.strategy | nindent 4 }}
27+
{{- end }}
2428
selector:
2529
matchLabels:
2630
{{- include "llm-d-modelservice.decodelabels" . | nindent 6 }}

charts/llm-d-modelservice/templates/prefill-deployment.yaml

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -21,6 +21,10 @@ metadata:
2121
{{- end }}
2222
spec:
2323
replicas: {{ ternary .Values.prefill.replicas 1 (hasKey .Values.prefill "replicas") }}
24+
{{- if .Values.prefill.strategy }}
25+
strategy:
26+
{{- toYaml .Values.prefill.strategy | nindent 4 }}
27+
{{- end }}
2428
selector:
2529
matchLabels:
2630
{{- include "llm-d-modelservice.prefilllabels" . | nindent 6 }}

charts/llm-d-modelservice/values.yaml

Lines changed: 30 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -250,6 +250,21 @@ decode:
250250
enabled: false
251251

252252
replicas: 1
253+
254+
# @schema
255+
# type: object
256+
# additionalProperties: true
257+
# @schema
258+
# -- Deployment strategy configuration for decode pods.
259+
# -- When unset, no strategy is rendered and Kubernetes applies its Deployment default (RollingUpdate).
260+
# -- Example:
261+
# -- strategy:
262+
# -- type: RollingUpdate
263+
# -- rollingUpdate:
264+
# -- maxSurge: 0
265+
# -- maxUnavailable: 1
266+
# strategy: {}
267+
253268
# @schema
254269
# additionalProperties: true
255270
# @schema
@@ -464,6 +479,21 @@ prefill:
464479
enabled: false
465480

466481
replicas: 0
482+
483+
# @schema
484+
# type: object
485+
# additionalProperties: true
486+
# @schema
487+
# -- Deployment strategy configuration for prefill pods.
488+
# -- When unset, no strategy is rendered and Kubernetes applies its Deployment default (RollingUpdate).
489+
# -- Example:
490+
# -- strategy:
491+
# -- type: RollingUpdate
492+
# -- rollingUpdate:
493+
# -- maxSurge: 0
494+
# -- maxUnavailable: 1
495+
# strategy: {}
496+
467497
# @schema
468498
# additionalProperties: true
469499
# @schema

0 commit comments

Comments
 (0)