Skip to content

Commit c97db00

Browse files
authored
update: add env variable for main container (vllm) when DRA is enabled for Intel-xe (#189)
* fix: add intel-xe accelerator environment variable support
  - add VLLM_WORKER_MULTIPROC_METHOD: spawn for Intel-xe
  - bump version

  Signed-off-by: Wen Zhou <wenzhou@redhat.com>

* update: fix schema generation

  Signed-off-by: Wen Zhou <wenzhou@redhat.com>

---------

Signed-off-by: Wen Zhou <wenzhou@redhat.com>
1 parent 201293d commit c97db00

File tree

4 files changed

+67
-3
lines changed

4 files changed

+67
-3
lines changed

charts/llm-d-modelservice/values.schema.json

Lines changed: 30 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@
44
"properties": {
55
"accelerator": {
66
"additionalProperties": false,
7-
"description": " Supported types: nvidia, intel-i915, intel-xe, intel-gaudi, amd, google",
7+
"description": " Supported types: nvidia, intel-i915, intel-xe, intel-gaudi, amd, google, cpu",
88
"properties": {
99
"dra": {
1010
"default": false,
@@ -83,6 +83,35 @@
8383
"required": [],
8484
"title": "intel-i915",
8585
"type": "array"
86+
},
87+
"intel-xe": {
88+
"items": {
89+
"anyOf": [
90+
{
91+
"additionalProperties": false,
92+
"properties": {
93+
"name": {
94+
"default": "VLLM_WORKER_MULTIPROC_METHOD",
95+
"required": [],
96+
"title": "name",
97+
"type": "string"
98+
},
99+
"value": {
100+
"default": "spawn",
101+
"required": [],
102+
"title": "value",
103+
"type": "string"
104+
}
105+
},
106+
"required": [],
107+
"type": "object"
108+
}
109+
],
110+
"required": []
111+
},
112+
"required": [],
113+
"title": "intel-xe",
114+
"type": "array"
86115
}
87116
},
88117
"required": [],

charts/llm-d-modelservice/values.schema.tmpl.json

Lines changed: 30 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@
44
"properties": {
55
"accelerator": {
66
"additionalProperties": false,
7-
"description": " Supported types: nvidia, intel-i915, intel-xe, intel-gaudi, amd, google",
7+
"description": " Supported types: nvidia, intel-i915, intel-xe, intel-gaudi, amd, google, cpu",
88
"properties": {
99
"dra": {
1010
"default": false,
@@ -83,6 +83,35 @@
8383
"required": [],
8484
"title": "intel-i915",
8585
"type": "array"
86+
},
87+
"intel-xe": {
88+
"items": {
89+
"anyOf": [
90+
{
91+
"additionalProperties": false,
92+
"properties": {
93+
"name": {
94+
"default": "VLLM_WORKER_MULTIPROC_METHOD",
95+
"required": [],
96+
"title": "name",
97+
"type": "string"
98+
},
99+
"value": {
100+
"default": "spawn",
101+
"required": [],
102+
"title": "value",
103+
"type": "string"
104+
}
105+
},
106+
"required": [],
107+
"type": "object"
108+
}
109+
],
110+
"required": []
111+
},
112+
"required": [],
113+
"title": "intel-xe",
114+
"type": "array"
86115
}
87116
},
88117
"required": [],

charts/llm-d-modelservice/values.yaml

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -74,7 +74,7 @@ modelArtifacts:
7474
multinode: false
7575

7676
# Global accelerator configuration
77-
# Supported types: nvidia, intel-i915, intel-xe, intel-gaudi, amd, google
77+
# Supported types: nvidia, intel-i915, intel-xe, intel-gaudi, amd, google, cpu
7878
accelerator:
7979
# Type of accelerator to use
8080
type: nvidia
@@ -101,6 +101,9 @@ accelerator:
101101
value: "1"
102102
- name: VLLM_WORKER_MULTIPROC_METHOD
103103
value: "spawn"
104+
intel-xe:
105+
- name: VLLM_WORKER_MULTIPROC_METHOD
106+
value: "spawn"
104107
# ResourceClaimTemplate configurations for DRA (used when dra: true)
105108
# Each accelerator type can have its own claim template configuration
106109
resourceClaimTemplates:

examples/output-xpu.yaml

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -93,6 +93,9 @@ spec:
9393
- name: HF_HOME
9494
value: /model-cache
9595

96+
- name: VLLM_WORKER_MULTIPROC_METHOD
97+
value: "spawn"
98+
9699
ports:
97100
- containerPort: 8200
98101
protocol: TCP

0 commit comments

Comments
 (0)