Skip to content

Add compute-matrix debugging to identify empty strategy #987

Add compute-matrix debugging to identify empty strategy

Add compute-matrix debugging to identify empty strategy #987

Workflow file for this run

# SPDX-FileCopyrightText: Copyright (c) 2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# This is the main workflow that runs on every PR and push to main
name: pr
defaults:
run:
shell: bash -euo pipefail {0}
on:
push:
branches:
- "pull-request/[0-9]+"
# Only runs one instance of this workflow at a time for a given PR and cancels any in-progress runs when a new one starts.
concurrency:
group: ${{ github.workflow }}-on-${{ github.event_name }}-from-${{ github.ref_name }}
cancel-in-progress: true
jobs:
doxygen-check:
name: Doxygen check
runs-on: ubuntu-latest
steps:
- name: Checkout repo
uses: actions/checkout@v3
- name: Install Doxygen
run: |
sudo apt-get update -q
sudo apt-get install -y doxygen
- name: Check Doxygen docs
run: |
./ci/pre-commit/doxygen.sh
if [ $? -ne 0 ]; then
echo "Doxygen check failed"
exit 1
fi
shell: bash -euxo pipefail {0}
compute-matrix:
name: Compute matrix
runs-on: ubuntu-latest
outputs:
DEVCONTAINER_VERSION: ${{steps.set-outputs.outputs.DEVCONTAINER_VERSION}}
NVCC_FULL_MATRIX: ${{steps.set-outputs.outputs.NVCC_FULL_MATRIX}}
CUDA_VERSIONS: ${{steps.set-outputs.outputs.CUDA_VERSIONS}}
HOST_COMPILERS: ${{steps.set-outputs.outputs.HOST_COMPILERS}}
PER_CUDA_COMPILER_MATRIX: ${{steps.set-outputs.outputs.PER_CUDA_COMPILER_MATRIX}}
steps:
- name: Checkout repo
uses: actions/checkout@v3
- name: Compute matrix outputs
id: set-outputs
run: |
echo "=== Compute Matrix Debug ==="
echo "yq version:"
yq --version
echo "matrix.yml contents:"
cat ci/matrix.yml
echo "=== Running compute-matrix script ==="
.github/actions/compute-matrix/compute-matrix.sh -v ci/matrix.yml pull_request
echo "=== Script completed, checking outputs ==="
echo "CUDA_VERSIONS: ${CUDA_VERSIONS:-UNSET}"
echo "HOST_COMPILERS: ${HOST_COMPILERS:-UNSET}"
echo "PER_CUDA_COMPILER_MATRIX: ${PER_CUDA_COMPILER_MATRIX:-UNSET}"
ci:
name: CUDA${{ matrix.cuda_version }} ${{ matrix.compiler }}
needs: compute-matrix
uses: ./.github/workflows/dispatch-build-and-test.yml
strategy:
fail-fast: false
matrix:
cuda_version: ${{ fromJSON(needs.compute-matrix.outputs.CUDA_VERSIONS) }}
compiler: ${{ fromJSON(needs.compute-matrix.outputs.HOST_COMPILERS) }}
with:
per_cuda_compiler_matrix: ${{ toJSON(fromJSON(needs.compute-matrix.outputs.PER_CUDA_COMPILER_MATRIX)[ format('{0}-{1}', matrix.cuda_version, matrix.compiler) ]) }}
devcontainer_version: ${{ needs.compute-matrix.outputs.DEVCONTAINER_VERSION }}
verify-devcontainers:
name: Verify Dev Containers
uses: ./.github/workflows/verify-devcontainers.yml
# This job is the final job that runs after all other jobs and is used for branch protection status checks.
# See: https://docs.github.com/en/pull-requests/collaborating-with-pull-requests/collaborating-on-repositories-with-code-quality-features/about-status-checks
# https://github.com/orgs/community/discussions/26822#discussioncomment-5122101
ci-success:
runs-on: ubuntu-latest
name: CI success
if: ${{ always() }} # need to use always() instead of !cancelled() because skipped jobs count as success
needs:
- doxygen-check
- ci
- verify-devcontainers
steps:
- name: Debug - Print all job results
run: |
echo "=== Job Results Debug ==="
echo "doxygen-check result: ${{ needs.doxygen-check.result }}"
echo "ci result: ${{ needs.ci.result }}"
echo "verify-devcontainers result: ${{ needs.verify-devcontainers.result }}"
echo "=========================="
echo "=== CI Matrix Job Details ==="
echo "CI job outputs (this shows individual matrix job results):"
echo '${{ toJSON(needs.ci.outputs) }}'
echo ""
echo "CI job result object:"
echo '${{ toJSON(needs.ci) }}'
echo "=========================="
echo "=== Checking for failures ==="
if [[ "${{ needs.doxygen-check.result }}" == "failure" ]]; then
echo "❌ doxygen-check FAILED"
else
echo "✅ doxygen-check: ${{ needs.doxygen-check.result }}"
fi
if [[ "${{ needs.ci.result }}" == "failure" ]]; then
echo "❌ ci FAILED (one or more matrix jobs failed)"
echo " Check the 'CI Matrix Job Details' section above to see which specific matrix jobs failed"
else
echo "✅ ci: ${{ needs.ci.result }}"
fi
if [[ "${{ needs.verify-devcontainers.result }}" == "failure" ]]; then
echo "❌ verify-devcontainers FAILED"
else
echo "✅ verify-devcontainers: ${{ needs.verify-devcontainers.result }}"
fi
echo "=== Checking for cancelled ==="
if [[ "${{ needs.doxygen-check.result }}" == "cancelled" ]]; then
echo "🚫 doxygen-check CANCELLED"
fi
if [[ "${{ needs.ci.result }}" == "cancelled" ]]; then
echo "🚫 ci CANCELLED"
fi
if [[ "${{ needs.verify-devcontainers.result }}" == "cancelled" ]]; then
echo "🚫 verify-devcontainers CANCELLED"
fi
echo "=== Final Status Check ==="
- name: Check status of all precursor jobs
if: >-
${{
contains(needs.*.result, 'failure')
|| contains(needs.*.result, 'cancelled')
}}
run: |
echo "❌ CI FAILED: One or more prerequisite jobs failed or were cancelled"
echo "Check the debug output above to see which job(s) caused the failure"
exit 1