Skip to content

Commit 8e1afe8

Browse files
committed
tests/ai-conformance: use nvidia GPU operator to install GPU drivers
1 parent 6451ae3 commit 8e1afe8

File tree

1 file changed

+2
-12
lines changed

1 file changed

+2
-12
lines changed

tests/e2e/scenarios/ai-conformance/run-test.sh

Lines changed: 2 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -142,15 +142,6 @@ kubeletPlugin:
142 142
effect: NoSchedule
143 143
EOF
144 144

145-
cat > values.yaml <<EOF
146-
# The driver daemonset needs a toleration for the nvidia.com/gpu taint
147-
kubeletPlugin:
148-
tolerations:
149-
- key: nvidia.com/gpu
150-
operator: Exists
151-
effect: NoSchedule
152-
EOF
153-
154 145
helm upgrade -i nvidia-dra-driver-gpu nvidia/nvidia-dra-driver-gpu \
155 146
--version="25.12.0" \
156 147
--create-namespace \
@@ -178,9 +169,8 @@ echo "----------------------------------------------------------------"
178 169
# Wait for kOps validation
179 170
"${KOPS}" validate cluster --wait=15m
180 171

181-
# Verify Components
182-
echo "Verifying NVIDIA Device Plugin..."
183-
#kubectl rollout status daemonset -n kube-system nvidia-device-plugin-daemonset --timeout=5m || echo "Warning: NVIDIA Device Plugin not ready yet"
172+
echo "Verifying GPU Operator device plugin..."
173+
kubectl rollout status daemonset -n gpu-operator nvidia-device-plugin-daemonset --timeout=5m || echo "Warning: GPU Operator device plugin not ready yet"
184 174

185 175
echo "Verifying Kueue..."
186 176
kubectl rollout status deployment -n kueue-system kueue-controller-manager --timeout=5m || echo "Warning: Kueue not ready yet"

0 commit comments

Comments
 (0)