update: add env variables for the main container (vllm) when DRA is enabled

zdtsw · zdtsw · commit af1ab6f044cd · 2026-01-27T15:39:07.000+01:00
for Intel

- currently, when DRA is enabled, it skips adding the 3 env variables for
  intel-i915 and the one VLLM_WORKER_MULTIPROC_METHOD for intel-xe
- the three env variables were previously only injected when using legacy
  accelerators (intel i915 or the new Xe)

Signed-off-by: Wen Zhou <wenzhou@redhat.com>
diff --git a/charts/llm-d-modelservice/templates/_helpers.tpl b/charts/llm-d-modelservice/templates/_helpers.tpl
@@ -246,7 +246,22 @@ nvidia.com/gpu
 
 {{/* Get accelerator environment variables based on type */}}
 {{- define "llm-d-modelservice.acceleratorEnv" -}}
-{{- $acceleratorType := .Values.accelerator.type | default "nvidia" -}}
+{{- $acceleratorType := "" -}}
+{{- if .Values.dra.enabled -}}
+  {{- /* Use explicit acceleratorEnvType if provided, otherwise map DRA type */ -}}
+  {{- if .Values.dra.acceleratorEnvType -}}
+    {{- $acceleratorType = .Values.dra.acceleratorEnvType -}}
+  {{- else -}}
+    {{- $draType := .Values.dra.type | default "nvidia" -}}
+    {{- if eq $draType "intel" -}}
+      {{- $acceleratorType = "intel-i915" -}}
+    {{- else -}}
+      {{- $acceleratorType = $draType -}}
+    {{- end -}}
+  {{- end -}}
+{{- else -}}
+  {{- $acceleratorType = .Values.accelerator.type | default "nvidia" -}}
+{{- end -}}
 {{- if and (ne $acceleratorType "cpu") (hasKey .Values.accelerator.env $acceleratorType) -}}
 {{- $envVars := index .Values.accelerator.env $acceleratorType -}}
 {{- range $envVars }}
diff --git a/charts/llm-d-modelservice/values.schema.json b/charts/llm-d-modelservice/values.schema.json
@@ -7,10 +7,58 @@
             "description": " Supported types: nvidia, intel-i915, intel-xe, intel-gaudi, amd, google",
             "properties": {
                 "env": {
-                    "additionalProperties": false,
-                    "description": "Environment variables specific to accelerator types",
+                    "additionalProperties": true,
+                    "description": " @schema additionalProperties: true @schema",
                     "properties": {
                         "intel-i915": {
+                            "items": {
+                                "anyOf": [
+                                    {
+                                        "additionalProperties": false,
+                                        "properties": {
+                                            "name": {
+                                                "default": "VLLM_USE_V1",
+                                                "required": [],
+                                                "title": "name",
+                                                "type": "string"
+                                            },
+                                            "value": {
+                                                "default": "1",
+                                                "required": [],
+                                                "title": "value",
+                                                "type": "string"
+                                            }
+                                        },
+                                        "required": [],
+                                        "type": "object"
+                                    },
+                                    {
+                                        "additionalProperties": false,
+                                        "properties": {
+                                            "name": {
+                                                "default": "TORCH_LLM_ALLREDUCE",
+                                                "required": [],
+                                                "title": "name",
+                                                "type": "string"
+                                            },
+                                            "value": {
+                                                "default": "1",
+                                                "required": [],
+                                                "title": "value",
+                                                "type": "string"
+                                            }
+                                        },
+                                        "required": [],
+                                        "type": "object"
+                                    }
+                                ],
+                                "required": []
+                            },
+                            "required": [],
+                            "title": "intel-i915",
+                            "type": "array"
+                        },
+                        "intel-xe": {
                             "items": {
                                 "anyOf": [
                                     {
@@ -74,13 +122,12 @@
                                 "required": []
                             },
                             "required": [],
-                            "title": "intel-i915",
+                            "title": "intel-xe",
                             "type": "array"
                         }
                     },
                     "required": [],
-                    "title": "env",
-                    "type": "object"
+                    "title": "env"
                 },
                 "resources": {
                     "additionalProperties": false,
@@ -1660,6 +1707,7 @@
             "description": " additionalProperties: true @schema",
             "properties": {
                 "claimTemplates": {
+                    "description": " acceleratorEnvType: \"\"",
                     "items": {
                         "anyOf": [
                             {
@@ -1861,8 +1909,7 @@
                         "required": []
                     },
                     "required": [],
-                    "title": "claimTemplates",
-                    "type": "array"
+                    "title": "claimTemplates"
                 },
                 "enabled": {
                     "default": false,
diff --git a/charts/llm-d-modelservice/values.schema.tmpl.json b/charts/llm-d-modelservice/values.schema.tmpl.json
@@ -7,10 +7,58 @@
       "description": " Supported types: nvidia, intel-i915, intel-xe, intel-gaudi, amd, google",
       "properties": {
         "env": {
-          "additionalProperties": false,
-          "description": "Environment variables specific to accelerator types",
+          "additionalProperties": true,
+          "description": " @schema additionalProperties: true @schema",
           "properties": {
             "intel-i915": {
+              "items": {
+                "anyOf": [
+                  {
+                    "additionalProperties": false,
+                    "properties": {
+                      "name": {
+                        "default": "VLLM_USE_V1",
+                        "required": [],
+                        "title": "name",
+                        "type": "string"
+                      },
+                      "value": {
+                        "default": "1",
+                        "required": [],
+                        "title": "value",
+                        "type": "string"
+                      }
+                    },
+                    "required": [],
+                    "type": "object"
+                  },
+                  {
+                    "additionalProperties": false,
+                    "properties": {
+                      "name": {
+                        "default": "TORCH_LLM_ALLREDUCE",
+                        "required": [],
+                        "title": "name",
+                        "type": "string"
+                      },
+                      "value": {
+                        "default": "1",
+                        "required": [],
+                        "title": "value",
+                        "type": "string"
+                      }
+                    },
+                    "required": [],
+                    "type": "object"
+                  }
+                ],
+                "required": []
+              },
+              "required": [],
+              "title": "intel-i915",
+              "type": "array"
+            },
+            "intel-xe": {
               "items": {
                 "anyOf": [
                   {
@@ -74,13 +122,12 @@
                 "required": []
               },
               "required": [],
-              "title": "intel-i915",
+              "title": "intel-xe",
               "type": "array"
             }
           },
           "required": [],
-          "title": "env",
-          "type": "object"
+          "title": "env"
         },
         "resources": {
           "additionalProperties": false,
@@ -346,6 +393,7 @@
       "description": " additionalProperties: true @schema",
       "properties": {
         "claimTemplates": {
+          "description": " acceleratorEnvType: \"\"",
           "items": {
             "anyOf": [
               {
@@ -547,8 +595,7 @@
             "required": []
           },
           "required": [],
-          "title": "claimTemplates",
-          "type": "array"
+          "title": "claimTemplates"
         },
         "enabled": {
           "default": false,
diff --git a/charts/llm-d-modelservice/values.yaml b/charts/llm-d-modelservice/values.yaml
@@ -74,7 +74,7 @@ modelArtifacts:
 multinode: false
 
 # Global accelerator configuration
-# Supported types: nvidia, intel-i915, intel-xe, intel-gaudi, amd, google
+# Supported types: nvidia, intel-i915, intel-xe, intel-gaudi, amd, google, cpu
 accelerator:
   # Type of accelerator to use
   type: nvidia
@@ -87,6 +87,9 @@ accelerator:
     amd: "amd.com/gpu"
     google: "google.com/tpu"
   # Environment variables specific to accelerator types
+  # @schema
+  # additionalProperties: true
+  # @schema
   env:
     intel-i915:
       - name: VLLM_USE_V1
@@ -95,6 +98,9 @@ accelerator:
         value: "1"
       - name: VLLM_WORKER_MULTIPROC_METHOD
         value: "spawn"
+    intel-xe:
+      - name: VLLM_WORKER_MULTIPROC_METHOD
+        value: "spawn"
 
 # @schema
 # additionalProperties: true
@@ -122,6 +128,8 @@ requester:
 dra:
   enabled: false # true: use this block instead of the `accelerator`
   type: nvidia # which claimTemplates entry to use
+  # Optional: accelerator type whose env variables are injected into the vllm container (e.g., "intel-i915" or "intel-xe"). Must match a key under accelerator.env
+  # acceleratorEnvType: ""
   claimTemplates:
     - name: nvidia
       class: gpu.nvidia.com
diff --git a/examples/output-dra.yaml b/examples/output-dra.yaml
@@ -90,6 +90,13 @@ spec:
                 name: llm-d-hf-token
                 key: HF_TOKEN
           
+          - name: VLLM_USE_V1
+            value: "1"
+          - name: TORCH_LLM_ALLREDUCE
+            value: "1"
+          - name: VLLM_WORKER_MULTIPROC_METHOD
+            value: "spawn"
+          
           resources:
             claims:
             - name: intel-resource-claim
diff --git a/examples/output-xpu.yaml b/examples/output-xpu.yaml
@@ -92,6 +92,9 @@ spec:
           - name: HF_HOME
             value: /model-cache
           
+          - name: VLLM_WORKER_MULTIPROC_METHOD
+            value: "spawn"
+          
           ports:
           - containerPort: 8200
             protocol: TCP