Skip to content

Commit efa8b47

Browse files
committed
chore: add debugging
1 parent 5bdf0ce commit efa8b47

File tree

3 files changed

+47
-4
lines changed

3 files changed

+47
-4
lines changed

.github/workflows/integration-gcp.yml

Lines changed: 7 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -130,21 +130,25 @@ jobs:
130130
GCP_ZONE: "${{ env.TF_VAR_zone }}"
131131
GCP_SERVICE_ACCOUNT: "${{ env.SERVICE_ACCOUNT }}"
132132
NVSENTINEL_VERSION: "${{ steps.ref-name.outputs.value }}"
133-
run: tests/uat/install-apps.sh
133+
run: |
134+
set -euxo pipefail
135+
tests/uat/install-apps.sh
134136
135137
# Test
136138
- name: Run UAT Tests
137139
id: tests
138140
if: steps.apps.outcome == 'success'
139141
shell: bash
140-
run: tests/uat/tests.sh
142+
run: |
143+
set -euxo pipefail
144+
tests/uat/tests.sh
141145
142146
# Teardown
143147
- name: Destroy Cluster
144148
if: always() && steps.cluster.outcome != 'skipped' && env.SKIP_DELETE != 'true'
145149
shell: bash
146150
run: |
147-
set -euo pipefail
151+
set -euxo pipefail
148152
cd tests/uat/gcp/cluster
149153
terraform destroy -auto-approve
150154

tests/uat/gcp/gpu-operator-values.yaml

Lines changed: 14 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -34,4 +34,17 @@ toolkit:
3434
enabled: true
3535
env:
3636
- name: RUNTIME_CONFIG_SOURCE
37-
value: file
37+
value: file
38+
39+
# Fix deprecated node-role label warnings
40+
node-feature-discovery:
41+
master:
42+
affinity:
43+
nodeAffinity:
44+
preferredDuringSchedulingIgnoredDuringExecution:
45+
- weight: 1
46+
preference:
47+
matchExpressions:
48+
- key: "node-role.kubernetes.io/control-plane"
49+
operator: In
50+
values: [""]

tests/uat/install-apps.sh

Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -59,6 +59,32 @@ GCP_SERVICE_ACCOUNT="${GCP_SERVICE_ACCOUNT:-}"
5959
# ARM64-specific values file (if needed)
6060
NVSENTINEL_ARM64_VALUES="${REPO_ROOT}/distros/kubernetes/nvsentinel/values-tilt-arm64.yaml"
6161

62+
63+
# Print out variables for debugging (alphabetical order)
64+
log "Using configuration (raw):"
65+
log " - AWS_REGION: $AWS_REGION"
66+
log " - CERT_MANAGER_VALUES: $CERT_MANAGER_VALUES"
67+
log " - CERT_MANAGER_VERSION: $CERT_MANAGER_VERSION"
68+
log " - CLUSTER_NAME: $CLUSTER_NAME"
69+
log " - CSP: $CSP"
70+
log " - FAKE_GPU_NODE_COUNT: $FAKE_GPU_NODE_COUNT"
71+
log " - GCP_PROJECT_ID: $GCP_PROJECT_ID"
72+
log " - GCP_SERVICE_ACCOUNT: $GCP_SERVICE_ACCOUNT"
73+
log " - GCP_ZONE: $GCP_ZONE"
74+
log " - GPU_OPERATOR_VALUES: $GPU_OPERATOR_VALUES"
75+
log " - GPU_OPERATOR_VERSION: $GPU_OPERATOR_VERSION"
76+
log " - KWOK_VERSION: $KWOK_VERSION (chart: $KWOK_CHART_VERSION)"
77+
log " - NVSENTINEL_ARM64_VALUES: $NVSENTINEL_ARM64_VALUES"
78+
log " - NVSENTINEL_CHART: $NVSENTINEL_CHART"
79+
log " - NVSENTINEL_VALUES: $NVSENTINEL_VALUES"
80+
log " - NVSENTINEL_VERSION: $NVSENTINEL_VERSION"
81+
log " - PROMETHEUS_OPERATOR_VERSION: $PROMETHEUS_OPERATOR_VERSION"
82+
log " - PROMETHEUS_VALUES: $PROMETHEUS_VALUES"
83+
log " - RESOURCE_QUOTA_RESOURCE: $RESOURCE_QUOTA_RESOURCE"
84+
log " - VALUES_DIR: $VALUES_DIR"
85+
log ""
86+
87+
6288
install_prometheus_operator() {
6389
log "Installing Prometheus Operator (version $PROMETHEUS_OPERATOR_VERSION)..."
6490

0 commit comments

Comments
 (0)