JAX inference offloading bridge #5032
ci.yaml
on: pull_request
metadata
4s
Matrix: amd64 / test-distribution
Matrix: arm64 / test-distribution
amd64
/
...
/
build-mpi-operator-compatible-base
2m 12s
arm64
/
...
/
build-mpi-operator-compatible-base
Matrix: amd64 / test-jax-cutlass-h100 / jax-cutlass-test-h100
Matrix: amd64 / test-jax / run-unit-test
Matrix: amd64 / test-te-a100 / run-unit-test
Matrix: amd64 / test-te-h100 / te-test-h100
amd64
/
build-torchax
8m 30s
amd64
/
...
/
launch-slurm-runner
1h 0m
amd64
/
test-nsys-jax-eks
4m 4s
amd64
/
...
/
launch-slurm-runner
2h 1m
Matrix: amd64 / test-nsys-jax / run-unit-test
Matrix: amd64 / test-nccl / nccl-test
Matrix: amd64 / test-nccl / nccl-test-gke / nccl-gke
Matrix: arm64 / test-jax-cutlass-h100 / jax-cutlass-test-h100
Waiting for pending jobs
Matrix: arm64 / test-jax / run-unit-test
Waiting for pending jobs
Matrix: arm64 / test-te-a100 / run-unit-test
Waiting for pending jobs
Matrix: arm64 / test-te-h100 / te-test-h100
Waiting for pending jobs
arm64
/
build-torchax
8m 5s
arm64
/
test-nsys-jax-eks
0s
arm64
/
...
/
launch-slurm-runner
arm64
/
...
/
launch-slurm-runner
Matrix: arm64 / test-nsys-jax / run-unit-test
Waiting for pending jobs
Matrix: arm64 / test-nccl / nccl-test
Waiting for pending jobs
Matrix: arm64 / test-nccl / nccl-test-gke / nccl-gke
Waiting for pending jobs
Matrix: amd64 / test-maxtext / maxtext-multinode
Matrix: amd64 / test-maxtext / single-process-multi-device
amd64
/
test-axlearn-eks
17m 9s
amd64
/
test-axlearn-fuji-models-eks
5m 24s
Matrix: amd64 / test-nsys-jax-archive
Matrix: arm64 / test-maxtext / maxtext-multinode
Waiting for pending jobs
Matrix: arm64 / test-maxtext / single-process-multi-device
Waiting for pending jobs
arm64
/
test-axlearn-eks
0s
arm64
/
test-axlearn-fuji-models-eks
0s
Matrix: arm64 / test-nsys-jax-archive
Matrix: amd64 / test-rosetta-t5x / vit-multi-gpu-multi-node
Matrix: arm64 / test-rosetta-t5x / vit-multi-gpu-multi-node
Waiting for pending jobs
Matrix: publish-containers
finalize
/
publish-badge
6s
Annotations
9 errors
|
amd64 / test-te-h100 / te-test-h100 (unittest, 8)
Process completed with exit code 1.
|
|
amd64 / test-jax / jax-A100-unit-test
The self-hosted runner lost communication with the server. Verify the machine is running and has a healthy network connection. Anything in your workflow that terminates the runner process, starves it for CPU/Memory, or blocks its network access can cause this error.
|
|
amd64 / test-nsys-jax / nsys-jax-A100-unit-test
Process completed with exit code 1.
|
|
amd64 / test-nsys-jax / nsys-jax-A100-unit-test
The action 'Run tests' has timed out after 60 minutes.
|
|
amd64 / test-te-a100 / te-A100-unit-test
The self-hosted runner lost communication with the server. Verify the machine is running and has a healthy network connection. Anything in your workflow that terminates the runner process, starves it for CPU/Memory, or blocks its network access can cause this error.
|
|
amd64 / test-maxtext / test-maxtext-metrics
Process completed with exit code 1.
|
|
amd64 / test-maxtext / test-maxtext-outcome
Process completed with exit code 1.
|
|
amd64 / test-rosetta-t5x / test-t5x-rosetta-metrics
Process completed with exit code 1.
|
|
amd64 / test-rosetta-t5x / test-t5x-rosetta-outcome
Process completed with exit code 1.
|
Artifacts
Produced during runtime
| Name | Size | Digest | |
|---|---|---|---|
|
artifact-axlearn-build-amd64
|
566 Bytes |
sha256:554f1b7958675607888b406de0363b660d1e1f58ea6f045dc9bc3b36d1d9b683
|
|
|
artifact-axlearn-build-arm64
|
567 Bytes |
sha256:57206e477a851a7ed3655c6e205770cc9253eb71f5d45156448ba64d9e5d9d8f
|
|
|
artifact-axlearn-test
|
179 KB |
sha256:db41e10fb2695a215a20144753504e0721ef91a6dfc84b1b6b59d7b2615b9174
|
|
|
artifact-base-build-amd64
|
567 Bytes |
sha256:cbd7ddfdb6b5af8adacf57bd3fb4faf2914a63884a6e97926a3cdfd293398244
|
|
|
artifact-base-build-arm64
|
566 Bytes |
sha256:9ed5ec48b2c58975562db9fea18468df66091b6b45ab905f3f51c1bda7da13f9
|
|
|
artifact-equinox-build-amd64
|
569 Bytes |
sha256:bbd09fa2254e73126205dd41046b2d7aae29f538ead8999f71ec206c96c9c3ba
|
|
|
artifact-equinox-build-arm64
|
568 Bytes |
sha256:d0a6740e875148d544945b5e72ac16c9243fb33a745a33154c64d3ed19c553ee
|
|
|
artifact-final-report
|
3.43 KB |
sha256:b79a6ea93dd5e917a6a461ccdc9b7d5062b46cd644267c964dc18fd13cc7b67b
|
|
|
artifact-jax-build-amd64
|
553 Bytes |
sha256:c21ff7c25e11d0414cdc5bcec9cd360353431538aeac93791d1a3eb9903ac63c
|
|
|
artifact-jax-build-arm64
|
550 Bytes |
sha256:784e00571b1ea038421b01952a6f6573bef8f617ccf9166c1d5dc3a042da2894
|
|
|
artifact-maxtext-build-amd64
|
567 Bytes |
sha256:71769dedb9810330ee8bf83821a54739cebb93670f30663fe475ec34291586d1
|
|
|
artifact-maxtext-build-arm64
|
568 Bytes |
sha256:14100fc6b8c09e6537f617911f3d5fc4ebacee02dce05abfab0b4cd970043e4f
|
|
|
artifact-maxtext-test
|
640 Bytes |
sha256:014e23a365ba00fb5788c27a797619578800dc15d5d3521d32282b57b27469ed
|
|
|
artifact-mpi-operator-compatible-base-build-amd64
|
639 Bytes |
sha256:0629728d1917ae1569fcd9b8bdae2de63df3496e163f3dd43850c0cf480f4153
|
|
|
artifact-nccl-gke-build-amd64
|
572 Bytes |
sha256:ce83a852d990f3082913d52d33a67b89c2f24a7f9e55a294b69e4523136c2862
|
|
|
artifact-rosetta-build-t5x-amd64
|
585 Bytes |
sha256:733f07da1dcefdd29d0f30606dba291ab55c3106937c1582d2afdb49bc51cd21
|
|
|
artifact-rosetta-build-t5x-arm64
|
584 Bytes |
sha256:d8fc54856e969c7267aef3f9925ad9d19cd027987605ec262d6e38bd1d8a0ff0
|
|
|
artifact-rosetta-t5x-mgmn-test
|
624 Bytes |
sha256:842e94f73395b5616cacbc2b146ab0ff436ff3baf57025c24fd8f96f335421a4
|
|
|
artifact-t5x-build-amd64
|
569 Bytes |
sha256:ea26952df8683d41a9cb0a94a570e05a1b22423b46de7e656933fe82ac3f3d29
|
|
|
artifact-t5x-build-arm64
|
567 Bytes |
sha256:d034bf087ffb0e109e5c6dcc20e9254a9ebb8abccff7f35b280213c449fc939e
|
|
|
artifact-torchax-build-amd64
|
568 Bytes |
sha256:079f93b7bbd8d502a83bdb8d7d5ea361f4d61a2cde51e6be007ae106bbe6b0af
|
|
|
artifact-torchax-build-arm64
|
568 Bytes |
sha256:f9933e1717bb753cc746ae949bbbce3a21715347a000f49611ca3069effea816
|
|
|
artifact-workflow-metadata
|
277 Bytes |
sha256:d47e1e84d8e4620cc814582d21529d031b92e760bb5c16f1b6fc9b31e5df39de
|
|
|
bumped-manifest
|
51.6 KB |
sha256:57f798f759c92363a6a69540312b06ce7f2388106c3f105640ef2f3b46bf24ca
|
|
|
final-axlearn
|
263 Bytes |
sha256:7cb4af3278c1d31c368aec9e47977aa660b338fd39c25d32458af1897b1f2a18
|
|
|
final-base
|
254 Bytes |
sha256:0f4f2895626b77a127dca62f553e7dba32ae6a38de02cf3f0422cc0a9538b78d
|
|
|
final-equinox
|
263 Bytes |
sha256:04dc75229f0940cb2e03f71183e64cc526f6496f273e558cc9e46560f24172e7
|
|
|
final-jax
|
251 Bytes |
sha256:25db0dfd1da812d2274c2a85b145f20ce821d88e0d899463b712105595b9f0e2
|
|
|
final-maxtext
|
262 Bytes |
sha256:ff5dcf3180a5be088855f29b749ff59a9fb13b9faf906b6eba4378de23abe2fa
|
|
|
final-t5x
|
251 Bytes |
sha256:6bf334e145acca03fab8b550f728adbdabfd17ee89a1ca4f978dfb5c1d25093a
|
|
|
final-upstream-t5x
|
277 Bytes |
sha256:462cf373ff1e08c16be687b3a81c4f5107d705698b31c5f460966470b54f407d
|
|
|
gke-maxtext-train
|
366 MB |
sha256:a82ef3066a22098911acc907ff9d5e48bda6016d5eaf89538a40a000b136ec94
|
|
|
gke-maxtext-train-sitrep
|
228 Bytes |
sha256:fadbf17f47b11114a088c2938e7b31a21ca72e19f98e3303475c871f085e29f6
|
|
|
jax-cutlass-test-H100
|
4.69 KB |
sha256:6034dd74309f30d2a7ce5c9e547c4a17964a73d5288199bed0940fd4523b44fb
|
|
|
mealkit-axlearn
|
272 Bytes |
sha256:5f9d215ea9c3e42b9a6acd3cf3f6bafc6bcf9a88d694e10a435b7de54a9b052c
|
|
|
mealkit-equinox
|
272 Bytes |
sha256:1c5571e07d017b37a68a2642c18f87dc5a2a158ab6af570c63e961b874cdd17f
|
|
|
mealkit-jax
|
261 Bytes |
sha256:24077af20cca33960e206380a007908cfa32998acf2cadde630100258a57ccc9
|
|
|
mealkit-maxtext
|
271 Bytes |
sha256:4203995ff9f11674cf0e4d70893893d49d047e40b41184644f6a07c6ed8ec014
|
|
|
mealkit-t5x
|
261 Bytes |
sha256:4f6a5ff71da13cdc0d4639a08e08df1d095de09c09ed3569d666083844276f54
|
|
|
mealkit-upstream-t5x
|
286 Bytes |
sha256:d45b5253c2a359ddcf2bf49c0e9d45041acd731bcc77df96e03a53b632997a25
|
|
|
nccl-gke-all-gather
|
15.4 KB |
sha256:98bc56a3215eca399fe116564d411967b66375f5c12b5b2bc7fddd9f49be8285
|
|
|
nccl-gke-all-gather-sitrep
|
231 Bytes |
sha256:a24f8d20b661443392a565811e1d8019f09eb3b3b7699cc8309c4d8782f4e826
|
|
|
nccl-gke-all-reduce
|
15.6 KB |
sha256:04a8dcbef8f7ee3a65b9a2f846350223b8f75c29e2102d2ac083e787a4b4167c
|
|
|
nccl-gke-all-reduce-sitrep
|
231 Bytes |
sha256:cc3fd2932f944b27e50379d1aa209bb39188b7a17b8c4f36e2fa89edff339b46
|
|
|
nccl-gke-broadcast
|
15.2 KB |
sha256:b592d5fe20b539b92ee61000158abcd3ae6df60ddd2f9266e670fd41f4a2e1d1
|
|
|
nccl-gke-broadcast-sitrep
|
229 Bytes |
sha256:0240756a615d1e5008e88f112542cb62eb4df33d48574dae2992b9f53a142198
|
|
|
nccl-gke-reduce-scatter
|
15.5 KB |
sha256:bbbfc67f80fcb96bff931b3e768533ab8c895139e3de9388b0b40bab94c9344a
|
|
|
nccl-gke-reduce-scatter-sitrep
|
234 Bytes |
sha256:aa962bc9d2857c8c82650bd317e22e1e2ee97d3b031fb9f869705c4c371af4aa
|
|
|
nsys-jax-unit-test-A100
|
1.6 KB |
sha256:e0b8d50d4806c9a6c5e700b05a0547339e2b2daa37be387956e3865559a665a1
|
|
|
rosetta-t5x-vit-19316880629-VIT8G1N
|
16.5 KB |
sha256:bbd74d9c6771cf086407bdfac09da6458407cded9b561a006c1d7b5cd9be6f20
|
|
|
te-unit-test-H100
|
2.08 MB |
sha256:8460d01faab5adc581a900dc75a867d73e6bd53a8d9ed38c0131672b978d2cc5
|
|
|
upstream-maxtext-19316880629-1DP2FSDP4TP1PP_single_process
|
23.7 KB |
sha256:a34eb97a9041abe54e394b1f7e2a303009868c719881a68795ab8ce85602689d
|
|
|
upstream-maxtext-19316880629-2DP2FSDP2TP1PP
|
575 Bytes |
sha256:26a70ae144aa56dd3dfcd6aa6d64c71c2dbf2f0eae1b47e6c9ca6f1448747c5e
|
|