diff --git a/articles/aks/gpu-cluster.md b/articles/aks/gpu-cluster.md index b1ae071ea..51bd37b12 100644 --- a/articles/aks/gpu-cluster.md +++ b/articles/aks/gpu-cluster.md @@ -157,13 +157,19 @@ To use Azure Linux, you specify the OS SKU by setting `os-sku` to `AzureLinux` d operator: "Equal" value: "gpu" effect: "NoSchedule" + - key: "kubernetes.azure.com/scalesetpriority" + operator: "Equal" + value: "spot" + effect: "NoSchedule" + nodeSelector: + kubernetes.azure.com/accelerator: nvidia # Mark this pod as a critical add-on; when enabled, the critical add-on # scheduler reserves resources for critical add-on pods so that they can # be rescheduled after a failure. # See https://kubernetes.io/docs/tasks/administer-cluster/guaranteed-scheduling-critical-addon-pods/ priorityClassName: "system-node-critical" containers: - - image: nvcr.io/nvidia/k8s-device-plugin:v0.17.0 + - image: nvcr.io/nvidia/k8s-device-plugin:v0.17.1 name: nvidia-device-plugin-ctr env: - name: FAIL_ON_INIT_ERROR