Skip to content

Commit 9eb8d16

Browse files
authored
Pin the GKE version for GKE A3 High blueprint (#4815)
1 parent f4ed882 commit 9eb8d16

File tree

2 files changed

+15
-5
lines changed

2 files changed

+15
-5
lines changed

examples/gke-a3-highgpu.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -89,6 +89,7 @@ deployment_groups:
8989
k8s_network_names:
9090
gvnic_prefix: vpc
9191
gvnic_start_index: 1
92+
version_prefix: 1.33.5-gke.1308000
9293
outputs: [instructions]
9394

9495
- id: a3_highgpu_pool

tools/cloud-build/daily-tests/ansible_playbooks/test-validation/test-gke-a3-high.yml

Lines changed: 14 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
# Copyright 2025 "Google LLC"
1+
# Copyright 2025 Google LLC
22
#
33
# Licensed under the Apache License, Version 2.0 (the "License");
44
# you may not use this file except in compliance with the License.
@@ -23,6 +23,16 @@
2323
ansible.builtin.shell: |
2424
gcloud container clusters get-credentials {{ deployment_name }} --region {{ region }} --project {{ custom_vars.project }} --verbosity=debug
2525
26+
- name: Get GKE cluster version
27+
delegate_to: localhost
28+
ansible.builtin.shell: |
29+
gcloud container clusters describe {{ deployment_name }} --region {{ region }} --project {{ custom_vars.project }} --format="value(currentMasterVersion)"
30+
register: gke_version_info
31+
32+
- name: Print GKE cluster version
33+
ansible.builtin.debug:
34+
msg: "GKE Cluster Version: {{ gke_version_info.stdout }}"
35+
2636
- name: Download NCCL test file
2737
delegate_to: localhost
2838
ansible.builtin.shell: |
@@ -33,7 +43,7 @@
3343

3444
- name: Display NCCL test file
3545
debug:
36-
msg: "{{nccl_test_file_contents.stdout}}"
46+
msg: "{{ nccl_test_file_contents.stdout }}"
3747

3848
- name: Create NCCL config map and deploy NCCL test pods
3949
delegate_to: localhost
@@ -58,7 +68,7 @@
5868

5969
- name: Print the NCCL test logs
6070
debug:
61-
msg: "{{nccl_test_logs.stdout}}"
71+
msg: "{{ nccl_test_logs.stdout }}"
6272

6373
- name: Ensure average bus bandwidth is >= 25 GB/s
6474
delegate_to: localhost
@@ -70,5 +80,4 @@
7080
- name: Clean up
7181
delegate_to: localhost
7282
ansible.builtin.shell: |
73-
kubectl delete pod --all -v=9
74-
kubectl delete service --all -v=9
83+
kubectl delete -f {{ workspace }}/examples/nccl-test.yaml

0 commit comments

Comments
 (0)