File tree Expand file tree Collapse file tree 5 files changed +22
-29
lines changed
tests/chainsaw/cli/cuj1-training Expand file tree Collapse file tree 5 files changed +22
-29
lines changed Original file line number Diff line number Diff line change 6969 version : 1.19.2
7070 valuesFile : components/k8s-ephemeral-storage-metrics/values.yaml
7171 dependencyRefs :
72- - kube-prometheus-stack
72+ - kube-prometheus-stack
73+
74+ - name : nvidia-dra-driver-gpu
75+ type : Helm
76+ source : https://helm.ngc.nvidia.com/nvidia
77+ version : " 25.12.0"
78+ valuesFile : components/nvidia-dra-driver-gpu/values.yaml
79+ dependencyRefs :
80+ - gpu-operator
81+
82+ - name : kai-scheduler
83+ type : Helm
84+ source : oci://ghcr.io/nvidia/kai-scheduler
85+ version : v0.12.14
86+ valuesFile : components/kai-scheduler/values.yaml
87+ dependencyRefs :
88+ - gpu-operator
Original file line number Diff line number Diff line change 7575
7676 - name : nvidia-dra-driver-gpu
7777 type : Helm
78- source : https://helm.ngc.nvidia.com/nvidia
79- version : " 25.12.0"
80- valuesFile : components/nvidia-dra-driver-gpu/values.yaml
81- dependencyRefs :
82- - gpu-operator
8378 overrides :
8479 gpuResourcesEnabledOverride : true
8580 # EKS has no control-plane nodes — remove the default nodeAffinity
8984 tolerations :
9085 - operator : Exists
9186
92- - name : kai-scheduler
93- type : Helm
94- source : oci://ghcr.io/nvidia/kai-scheduler
95- version : v0.12.14
96- valuesFile : components/kai-scheduler/values.yaml
97- dependencyRefs :
98- - gpu-operator
99-
10087 - name : dynamo-crds
10188 type : Helm
10289 source : https://helm.ngc.nvidia.com/nvidia/ai-dynamo
Original file line number Diff line number Diff line change 3434 value : " >= 1.34"
3535
3636 componentRefs :
37- - name : kai-scheduler
38- type : Helm
39- source : oci://ghcr.io/nvidia/kai-scheduler
40- version : v0.12.14
41- valuesFile : components/kai-scheduler/values.yaml
42- dependencyRefs :
43- - gpu-operator
44-
4537 - name : dynamo-crds
4638 type : Helm
4739 source : https://helm.ngc.nvidia.com/nvidia/ai-dynamo
Original file line number Diff line number Diff line change @@ -179,15 +179,9 @@ spec:
179179 cpu : 500m
180180 memory : 1Gi
181181
182- # nvidia-dra-driver-gpu: DRA driver for GPU resource management
183- # For kind with GPU passthrough, use "/" as driver root (host drivers)
182+ # nvidia-dra-driver-gpu: override driver root for kind GPU passthrough
184183 - name : nvidia-dra-driver-gpu
185184 type : Helm
186- source : https://helm.ngc.nvidia.com/nvidia
187- version : " 25.12.0"
188- valuesFile : components/nvidia-dra-driver-gpu/values.yaml
189- dependencyRefs :
190- - gpu-operator
191185 overrides :
192186 # Use "/" for host-installed drivers (kind GPU passthrough)
193187 nvidiaDriverRoot : " /"
Original file line number Diff line number Diff line change @@ -40,8 +40,10 @@ componentRefs: ## alphabetically sorted
4040 - name : cert-manager
4141 - name : gpu-operator
4242 - name : k8s-ephemeral-storage-metrics
43+ - name : kai-scheduler
4344 - name : kube-prometheus-stack
4445 - name : kubeflow-trainer
46+ - name : nvidia-dra-driver-gpu
4547 - name : nvsentinel
4648 - name : prometheus-adapter
4749 - name : skyhook-customizations
@@ -51,9 +53,11 @@ deploymentOrder:
5153 - aws-efa
5254 - cert-manager
5355 - gpu-operator
56+ - kai-scheduler
5457 - kube-prometheus-stack
5558 - k8s-ephemeral-storage-metrics
5659 - kubeflow-trainer
60+ - nvidia-dra-driver-gpu
5761 - nvsentinel
5862 - prometheus-adapter
5963 - skyhook-operator
You can’t perform that action at this time.
0 commit comments