Skip to content

Commit c1950dd

Browse files
committed
pin nccl-plugin-gpudirecttcpx-dev to latest
1 parent 8f734ed commit c1950dd

File tree

1 file changed

+9
-2
lines changed

1 file changed

+9
-2
lines changed

tools/cloud-build/daily-tests/ansible_playbooks/test-validation/test-gke-a3-high.yml

Lines changed: 9 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -35,6 +35,13 @@
3535
debug:
3636
msg: "{{nccl_test_file_contents.stdout}}"
3737

38+
# Rewrites the image tag for nccl-plugin-gpudirecttcpx-dev in the example
# NCCL test manifest under the workspace, replacing every occurrence of the
# v3.1.9 tag with `latest`. The edit is performed on localhost.
- name: Pin nccl-plugin-gpudirecttcpx-dev to latest tag
  delegate_to: localhost
  ansible.builtin.replace:
    path: "{{ workspace }}/examples/nccl-test.yaml"
    # `regexp` is a Python regular expression, so the dots are escaped to
    # match only a literal "v3.1.9" rather than any character in those
    # positions. Single quotes keep the backslashes literal in YAML.
    regexp: 'nccl-plugin-gpudirecttcpx-dev:v3\.1\.9'
    replace: 'nccl-plugin-gpudirecttcpx-dev:latest'
44+
3845
- name: Create NCCL config map and deploy NCCL test pods
3946
delegate_to: localhost
4047
ansible.builtin.shell: |
@@ -60,12 +67,12 @@
6067
debug:
6168
msg: "{{nccl_test_logs.stdout}}"
6269

63-
- name: Ensure average bus bandwidth is >= 19 GB/s
70+
- name: Ensure average bus bandwidth is >= 25 GB/s
6471
delegate_to: localhost
6572
ansible.builtin.shell: |
6673
grep -o '# Avg bus bandwidth : [0-9\.]*' pod_logs.txt | cut -d ':' -f 2 | awk '{$1=$1;print}'
6774
register: avg_bus_bandwidth
68-
failed_when: avg_bus_bandwidth.stdout | float < 19
75+
failed_when: avg_bus_bandwidth.stdout | float < 25
6976

7077
- name: Clean up
7178
delegate_to: localhost

0 commit comments

Comments
 (0)