Skip to content

Commit ad7c928

Browse files
committed
fix: add intel-xe accelerator environment variable support
- add VLLM_WORKER_MULTIPROC_METHOD: spawn for intel-xe
- bump chart version to v0.4.3

Signed-off-by: Wen Zhou <wenzhou@redhat.com>
1 parent 2890bf5 commit ad7c928

15 files changed

+41
-35
lines changed

charts/llm-d-modelservice/Chart.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@ type: application
1313
# This is the chart version. This version number should be incremented each time you make changes
1414
# to the chart and its templates, including the app version.
1515
# Versions are expected to follow Semantic Versioning (https://semver.org/)
16-
version: "v0.4.2"
16+
version: "v0.4.3"
1717
# This is the version number of the application being deployed. This version number should be
1818
# incremented each time you make changes to the application. Versions are not expected to
1919
# follow Semantic Versioning. They should reflect the version the application is using.

charts/llm-d-modelservice/values.schema.json

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@
1414
"type": "boolean"
1515
},
1616
"env": {
17-
"additionalProperties": false,
17+
"additionalProperties": true,
1818
"description": "Environment variables specific to accelerator types",
1919
"properties": {
2020
"intel-i915": {

charts/llm-d-modelservice/values.schema.tmpl.json

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@
1414
"type": "boolean"
1515
},
1616
"env": {
17-
"additionalProperties": false,
17+
"additionalProperties": true,
1818
"description": "Environment variables specific to accelerator types",
1919
"properties": {
2020
"intel-i915": {

charts/llm-d-modelservice/values.yaml

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -74,7 +74,7 @@ modelArtifacts:
7474
multinode: false
7575

7676
# Global accelerator configuration
77-
# Supported types: nvidia, intel-i915, intel-xe, intel-gaudi, amd, google
77+
# Supported types: nvidia, intel-i915, intel-xe, intel-gaudi, amd, google, cpu
7878
accelerator:
7979
# Type of accelerator to use
8080
type: nvidia
@@ -101,6 +101,9 @@ accelerator:
101101
value: "1"
102102
- name: VLLM_WORKER_MULTIPROC_METHOD
103103
value: "spawn"
104+
intel-xe:
105+
- name: VLLM_WORKER_MULTIPROC_METHOD
106+
value: "spawn"
104107
# ResourceClaimTemplate configurations for DRA (used when dra: true)
105108
# Each accelerator type can have its own claim template configuration
106109
resourceClaimTemplates:

examples/output-cpu.yaml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ kind: ServiceAccount
66
metadata:
77
name: cpu-sim-llm-d-modelservice
88
labels:
9-
helm.sh/chart: llm-d-modelservice-v0.4.2
9+
helm.sh/chart: llm-d-modelservice-v0.4.3
1010
app.kubernetes.io/version: "v0.3.0"
1111
app.kubernetes.io/managed-by: Helm
1212
---
@@ -16,7 +16,7 @@ kind: Deployment
1616
metadata:
1717
name: cpu-sim-llm-d-modelservice-decode
1818
labels:
19-
helm.sh/chart: llm-d-modelservice-v0.4.2
19+
helm.sh/chart: llm-d-modelservice-v0.4.3
2020
app.kubernetes.io/version: "v0.3.0"
2121
app.kubernetes.io/managed-by: Helm
2222
spec:
@@ -106,7 +106,7 @@ kind: Deployment
106106
metadata:
107107
name: cpu-sim-llm-d-modelservice-prefill
108108
labels:
109-
helm.sh/chart: llm-d-modelservice-v0.4.2
109+
helm.sh/chart: llm-d-modelservice-v0.4.3
110110
app.kubernetes.io/version: "v0.3.0"
111111
app.kubernetes.io/managed-by: Helm
112112
spec:

examples/output-dra.yaml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ kind: ServiceAccount
66
metadata:
77
name: dra-llm-d-modelservice
88
labels:
9-
helm.sh/chart: llm-d-modelservice-v0.4.2
9+
helm.sh/chart: llm-d-modelservice-v0.4.3
1010
app.kubernetes.io/version: "v0.3.0"
1111
app.kubernetes.io/managed-by: Helm
1212
---
@@ -16,7 +16,7 @@ kind: Deployment
1616
metadata:
1717
name: dra-llm-d-modelservice-decode
1818
labels:
19-
helm.sh/chart: llm-d-modelservice-v0.4.2
19+
helm.sh/chart: llm-d-modelservice-v0.4.3
2020
app.kubernetes.io/version: "v0.3.0"
2121
app.kubernetes.io/managed-by: Helm
2222
spec:
@@ -116,7 +116,7 @@ kind: ResourceClaimTemplate
116116
metadata:
117117
name: intel-gaudi-claim-template-decode
118118
labels:
119-
helm.sh/chart: llm-d-modelservice-v0.4.2
119+
helm.sh/chart: llm-d-modelservice-v0.4.3
120120
app.kubernetes.io/version: "v0.3.0"
121121
app.kubernetes.io/managed-by: Helm
122122
llm-d.ai/role: decode

examples/output-gaudi.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ kind: ServiceAccount
66
metadata:
77
name: gaudi-llm-d-modelservice
88
labels:
9-
helm.sh/chart: llm-d-modelservice-v0.4.2
9+
helm.sh/chart: llm-d-modelservice-v0.4.3
1010
app.kubernetes.io/version: "v0.3.0"
1111
app.kubernetes.io/managed-by: Helm
1212
---
@@ -16,7 +16,7 @@ kind: Deployment
1616
metadata:
1717
name: gaudi-llm-d-modelservice-decode
1818
labels:
19-
helm.sh/chart: llm-d-modelservice-v0.4.2
19+
helm.sh/chart: llm-d-modelservice-v0.4.3
2020
app.kubernetes.io/version: "v0.3.0"
2121
app.kubernetes.io/managed-by: Helm
2222
spec:

examples/output-heterogeneous-pd.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ kind: ServiceAccount
66
metadata:
77
name: heterogeneous-pd-llm-d-modelservice
88
labels:
9-
helm.sh/chart: llm-d-modelservice-v0.4.2
9+
helm.sh/chart: llm-d-modelservice-v0.4.3
1010
app.kubernetes.io/version: "v0.3.0"
1111
app.kubernetes.io/managed-by: Helm
1212
---
@@ -16,7 +16,7 @@ kind: Deployment
1616
metadata:
1717
name: heterogeneous-pd-llm-d-modelservice-decode
1818
labels:
19-
helm.sh/chart: llm-d-modelservice-v0.4.2
19+
helm.sh/chart: llm-d-modelservice-v0.4.3
2020
app.kubernetes.io/version: "v0.3.0"
2121
app.kubernetes.io/managed-by: Helm
2222
spec:
@@ -132,7 +132,7 @@ kind: Deployment
132132
metadata:
133133
name: heterogeneous-pd-llm-d-modelservice-prefill
134134
labels:
135-
helm.sh/chart: llm-d-modelservice-v0.4.2
135+
helm.sh/chart: llm-d-modelservice-v0.4.3
136136
app.kubernetes.io/version: "v0.3.0"
137137
app.kubernetes.io/managed-by: Helm
138138
spec:
@@ -226,7 +226,7 @@ kind: ResourceClaimTemplate
226226
metadata:
227227
name: nvidia-claim-template-decode
228228
labels:
229-
helm.sh/chart: llm-d-modelservice-v0.4.2
229+
helm.sh/chart: llm-d-modelservice-v0.4.3
230230
app.kubernetes.io/version: "v0.3.0"
231231
app.kubernetes.io/managed-by: Helm
232232
llm-d.ai/role: decode

examples/output-pd-mnnvl.yaml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ kind: ServiceAccount
66
metadata:
77
name: pd-mnnvl-llm-d-modelservice
88
labels:
9-
helm.sh/chart: llm-d-modelservice-v0.4.2
9+
helm.sh/chart: llm-d-modelservice-v0.4.3
1010
app.kubernetes.io/version: "v0.3.0"
1111
app.kubernetes.io/managed-by: Helm
1212
---
@@ -16,7 +16,7 @@ kind: Deployment
1616
metadata:
1717
name: pd-mnnvl-llm-d-modelservice-decode
1818
labels:
19-
helm.sh/chart: llm-d-modelservice-v0.4.2
19+
helm.sh/chart: llm-d-modelservice-v0.4.3
2020
app.kubernetes.io/version: "v0.3.0"
2121
app.kubernetes.io/managed-by: Helm
2222
spec:
@@ -132,7 +132,7 @@ kind: Deployment
132132
metadata:
133133
name: pd-mnnvl-llm-d-modelservice-prefill
134134
labels:
135-
helm.sh/chart: llm-d-modelservice-v0.4.2
135+
helm.sh/chart: llm-d-modelservice-v0.4.3
136136
app.kubernetes.io/version: "v0.3.0"
137137
app.kubernetes.io/managed-by: Helm
138138
spec:

examples/output-pd.yaml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ kind: ServiceAccount
66
metadata:
77
name: pd-llm-d-modelservice
88
labels:
9-
helm.sh/chart: llm-d-modelservice-v0.4.2
9+
helm.sh/chart: llm-d-modelservice-v0.4.3
1010
app.kubernetes.io/version: "v0.3.0"
1111
app.kubernetes.io/managed-by: Helm
1212
---
@@ -16,7 +16,7 @@ kind: Deployment
1616
metadata:
1717
name: pd-llm-d-modelservice-decode
1818
labels:
19-
helm.sh/chart: llm-d-modelservice-v0.4.2
19+
helm.sh/chart: llm-d-modelservice-v0.4.3
2020
app.kubernetes.io/version: "v0.3.0"
2121
app.kubernetes.io/managed-by: Helm
2222
spec:
@@ -128,7 +128,7 @@ kind: Deployment
128128
metadata:
129129
name: pd-llm-d-modelservice-prefill
130130
labels:
131-
helm.sh/chart: llm-d-modelservice-v0.4.2
131+
helm.sh/chart: llm-d-modelservice-v0.4.3
132132
app.kubernetes.io/version: "v0.3.0"
133133
app.kubernetes.io/managed-by: Helm
134134
spec:

0 commit comments

Comments
 (0)