File tree Expand file tree Collapse file tree 2 files changed +4
-38
lines changed
examples/machine-learning Expand file tree Collapse file tree 2 files changed +4
-38
lines changed Original file line number Diff line number Diff line change 2424 # Image settings
2525 base_image :
2626 project : ubuntu-os-accelerator-images
27- image : ubuntu-accelerator-2204-amd64-with-nvidia-570-v20250712
27+ image : ubuntu-accelerator-2204-amd64-with-nvidia-570-v20250722
2828 image_build_machine_type : n2-standard-16
2929 build_slurm_from_git_ref : 6.10.0
3030 # Cluster env settings
@@ -147,24 +147,7 @@ deployment_groups:
147147 ansible.builtin.apt:
148148 deb: "{{ cuda_repo_filename }}"
149149 state: present
150- # The following 2 tasks work around a temporary issue with Ubuntu
151- # packaging of NVIDIA 570 driver series for kernel 6.8.0-1032
152- # This command ensures that any holds are removed before attempting an upgrade.
153- # We ignore failures in case the packages were not held.
154- - name: Unhold NVIDIA driver packages
155- ansible.builtin.command:
156- cmd: apt-mark unhold linux-modules-nvidia-570-server-open-gcp linux-modules-nvidia-570-server-open-6.8.0-1032-gcp
157- become: true
158- changed_when: false
159- failed_when: false
160- - name: Install latest NVIDIA driver metapackage and kernel module
161- ansible.builtin.apt:
162- name:
163- - linux-modules-nvidia-570-server-open-gcp
164- - linux-modules-nvidia-570-server-open-6.8.0-1032-gcp
165- state: latest
166- update_cache: yes
167- become: true
150+
168151 - name: Reduce NVIDIA repository priority
169152 ansible.builtin.copy:
170153 dest: /etc/apt/preferences.d/cuda-repository-pin-600
Original file line number Diff line number Diff line change 2424 # Image settings
2525 base_image :
2626 project : ubuntu-os-accelerator-images
27- image : ubuntu-accelerator-2204-amd64-with-nvidia-570-v20250712
27+ image : ubuntu-accelerator-2204-amd64-with-nvidia-570-v20250722
2828 image_build_machine_type : n2-standard-16
2929 build_slurm_from_git_ref : 6.10.0
3030 # Cluster env settings
@@ -148,24 +148,7 @@ deployment_groups:
148148 ansible.builtin.apt:
149149 deb: "{{ cuda_repo_filename }}"
150150 state: present
151- # The following 2 tasks work around a temporary issue with Ubuntu
152- # packaging of NVIDIA 570 driver series for kernel 6.8.0-1032
153- # This command ensures that any holds are removed before attempting an upgrade.
154- # We ignore failures in case the packages were not held.
155- - name: Unhold NVIDIA driver packages
156- ansible.builtin.command:
157- cmd: apt-mark unhold linux-modules-nvidia-570-server-open-gcp linux-modules-nvidia-570-server-open-6.8.0-1032-gcp
158- become: true
159- changed_when: false
160- failed_when: false
161- - name: Install latest NVIDIA driver metapackage and kernel module
162- ansible.builtin.apt:
163- name:
164- - linux-modules-nvidia-570-server-open-gcp
165- - linux-modules-nvidia-570-server-open-6.8.0-1032-gcp
166- state: latest
167- update_cache: yes
168- become: true
151+
169152 - name: Reduce NVIDIA repository priority
170153 ansible.builtin.copy:
171154 dest: /etc/apt/preferences.d/cuda-repository-pin-600
You can’t perform that action at this time.
0 commit comments