1616name : Precompiled images
1717
1818on :
19- schedule :
20- - cron : ' 00 09 * * *'
19+ pull_request :
20+ types :
21+ - opened
22+ - synchronize
23+ branches :
24+ - test-holodeck
25+ push :
26+ branches :
27+ - test-holodeck
2128
2229jobs :
2330 set-driver-version-matrix :
@@ -39,17 +46,20 @@ jobs:
3946 echo "driver_branch=$driver_branch_json" >> $GITHUB_OUTPUT
4047
4148 # get kernel flavors
42- KERNEL_FLAVORS=("aws" "azure" "generic" "nvidia" "oracle")
49+ # KERNEL_FLAVORS=("aws" "azure" "generic" "nvidia" "oracle")
50+ KERNEL_FLAVORS=("generic")
4351 kernel_flavors_json=$(printf '%s\n' "${KERNEL_FLAVORS[@]}" | jq -R . | jq -cs .)
4452 echo "kernel_flavors=$kernel_flavors_json" >> $GITHUB_OUTPUT
4553
4654 # get ubuntu distributions
47- DIST=("ubuntu22.04" "ubuntu24.04")
55+ # DIST=("ubuntu22.04" "ubuntu24.04")
56+ DIST=("ubuntu22.04")
4857 dist_json=$(printf '%s\n' "${DIST[@]}" | jq -R . | jq -cs .)
4958 echo "dist=$dist_json" >> $GITHUB_OUTPUT
5059
5160 # LTS_KERNEL setup
52- LTS_KERNEL=("5.15" "6.8")
61+ # LTS_KERNEL=("5.15" "6.8")
62+ LTS_KERNEL=("6.8")
5363 lts_kernel_json=$(printf '%s\n' "${LTS_KERNEL[@]}" | jq -R . | jq -cs .)
5464 echo "lts_kernel=$lts_kernel_json" >> $GITHUB_OUTPUT
5565
@@ -321,7 +331,7 @@ jobs:
321331 echo "DRIVER_BRANCHES=${DRIVER_BRANCHES[*]}" >> $GITHUB_ENV
322332
323333 - name : Set up Holodeck
324- uses : NVIDIA/holodeck@v0.2.6
334+ uses : NVIDIA/holodeck@main
325335 env :
326336 AWS_SECRET_ACCESS_KEY : ${{ secrets.AWS_SECRET_ACCESS_KEY }}
327337 AWS_ACCESS_KEY_ID : ${{ secrets.AWS_ACCESS_KEY_ID }}
@@ -346,27 +356,6 @@ jobs:
346356 sudo apt-get update
347357 sudo apt-get install -y gh
348358
349- - name : Upgrade the kernel for Precompiled e2e test
350- env :
351- UPGRADE_KERNEL_SCRIPT : " ./tests/scripts/upgrade-kernel.sh"
352- run : |
353- status=0
354- ./tests/ci-remote-exec.sh "${UPGRADE_KERNEL_SCRIPT}" "${KERNEL_VERSION}" || status=$?
355- # On the target system, all scripts/test-case exit with code 1 for error handling.
356- # However, since reboot-related disconnections break the SSH connection
357- # and can cause the entire job to exit, we should ignore all errors except
358- # exit code 1. During a reboot, exit code 1 will not be thrown, so handling
359- # other errors as code 1 will ensure proper management of reboot scenarios
360- if [ $status -eq 1 ]; then
361- echo "Kernel version $KERNEL_VERSION upgrade failed"
362- exit 1
363- fi
364- ./tests/scripts/remote_retry.sh || status=$?
365- if [ $status -ne 0 ]; then
366- echo "Failed to connect to remote instance"
367- exit $status
368- fi
369-
370359 - name : Precompiled e2e test gpu driver validation
371360 env :
372361 TEST_CASE : " ./tests/cases/nvidia-driver.sh"
0 commit comments