Summary
Jobs
metadata
bump-manifest
amd64
build-base
test-distribution (extra-only-distribution.sh)
test-distribution (mirror-only-distribution.sh)
test-distribution (upstream-only-distribution.sh)
test-distribution (local-patch-distribution.sh)
build-jax
build-triton
build-equinox
build-maxtext
build-levanter
build-upstream-t5x
build-upstream-pax
build-gemma
launch-slurm-runner
jax-V100-unit-test
jax-A100-unit-test
launch-slurm-runner
nsys-jax-V100-unit-test
nsys-jax-A100-unit-test
launch-slurm-runner
pallas-V100-unit-test
pallas-A100-unit-test
launch-slurm-runner
triton-V100-unit-test
triton-A100-unit-test
single-process-multi-device (1, 1, 2, 4)
maxtext-multinode (1, 1, 1, 1)
maxtext-multinode (1, 1, 8, 1)
maxtext-multinode (1, 1, 1, 8)
maxtext-multinode (1, 1, 4, 2)
maxtext-multinode (1, 2, 2, 2)
maxtext-multinode (1, 4, 2, 2)
test-maxtext-metrics
test-maxtext-summary
sitrep
test-maxtext-outcome
launch-slurm-runner
levanter-V100-unit-test
levanter-A100-unit-test
build-rosetta
t5x-multi-gpu (1P8G, 8)
t5x-multi-gpu (1P2G_fmha, 2, --enable-fmha 1)
t5x-multi-node (8G2N, 8, 2)
t5x-multi-node (8G2N_fmha, 8, 2, --enable-fmha 1)
test-upstream-t5x-metrics
test-upstream-t5x-summary
sitrep
test-upstream-t5x-outcome
build-rosetta
te-2GPU
te-4GPU
te-8GPU
sitrep
launch-slurm-runner
te-V100-unit-test
te-A100-unit-test
single-process-multi-device (1, 8, 1, 1)
single-process-multi-device (1, 1, 2, 4)
pax-multi-node (1DP1FSDP1TP1PP, 1, 1, 1, 1, 4)
pax-multi-node (8DP1FSDP1TP1PP, 1, 8, 1, 1, 4)
pax-multi-node (1DP8FSDP1TP1PP, 1, 1, 8, 1, 4)
pax-multi-node (2DP1FSDP1TP4PP, 4, 2, 1, 1, 4)
pax-multi-node (4DP1FSDP2TP1PP, 1, 4, 1, 2, 4)
pax-multi-node (16DP1FSDP1TP1PP, 1, 16, 1, 1, 4)
pax-multi-node (2DP1FSDP2TP4PP, 4, 2, 1, 2, 4)
pax-multi-node (LLaMA_eval, 1, 1, 8, 1, 4, true, --model-type LLaMA70BProxy --evaluate)
single-process-evaluation (1, 8, 1, 1)
test-upstream-pax-metrics
test-upstream-pax-summary
sitrep
test-upstream-pax-outcome
launch-slurm-runner
gemma-V100-unit-test
gemma-A100-unit-test
single-process-multi-device (1P1G_te-0, 1, --enable-te 0)
single-process-multi-device (1P8G_te-1, 8, --gin.train/utils.DatasetConfig.pack=False --gin.train...
multi-gpu-multi-node (2N8G-te-1, 8, 2, --gin.train/utils.DatasetConfig.pack=False --gin.train_eva...
multi-gpu-multi-node (2N2G_te-0, 2, 2, --enable-te 0)
vit-single-process-multi-device (8)
vit-multi-gpu-multi-node (1, 1)
vit-multi-gpu-multi-node (1, 2)
vit-multi-gpu-multi-node (8, 1)
vit-multi-gpu-multi-node (8, 2)
test-t5x-rosetta-metrics
test-t5x-rosetta-summary
sitrep
test-t5x-rosetta-outcome
collect-docker-tags
single-process-multi-device-te (1, 8, 1, 1)
single-process-multi-device-te (1, 1, 2, 4)
rosetta-pax-multi-node-te (1DP1FSDP1TP1PP_TE, 1, 1, 1, 1, 4)
rosetta-pax-multi-node-te (8DP1FSDP1TP1PP_TE, 1, 8, 1, 1, 4)
rosetta-pax-multi-node-te (1DP8FSDP1TP1PP_TE, 1, 1, 8, 1, 4)
rosetta-pax-multi-node-te (4DP1FSDP2TP1PP_TE, 1, 4, 1, 2, 4)
rosetta-pax-multi-node-te (16DP1FSDP1TP1PP_TE, 1, 16, 1, 1, 4)
rosetta-pax-multi-node-te (5B_fused_attn_1, 1, 1, 8, 1, 2, --model-type 5B)
rosetta-pax-multi-node-te (5B_fused_attn_0, 1, 1, 8, 1, 2, --model-type 5B --disable-fused-attn)
rosetta-pax-multi-node-te (LLaMA_eval_TE, 1, 1, 8, 1, 4, true, --model-type LLaMA70BProxy --evalu...
rosetta-pax-multi-node (1, 8, 1, 1)
rosetta-pax-multi-node (1, 4, 1, 2)
rosetta-pax-multi-node (4, 2, 1, 1)
rosetta-pax-multi-node (4, 2, 1, 2)
rosetta-pax-single-node-dropout-te (1, 8, 1, 1)
single-process-evaluation-te (1, 8, 1, 1)
test-pax-rosetta-metrics
test-pax-rosetta-summary
sitrep
test-pax-rosetta-outcome
arm64
merge-new-manifest
make-publish-configs
publish-containers (jax, jax-mealkit, 500, ghcr.io/nvidia/jax-toolbox-internal:11382252869-jax-am...
publish-containers (triton, jax-mealkit, 500, ghcr.io/nvidia/jax-toolbox-internal:11382252869-tri...
publish-containers (equinox, jax-mealkit, 500, ghcr.io/nvidia/jax-toolbox-internal:11382252869-eq...
publish-containers (maxtext, jax-mealkit, 500, ghcr.io/nvidia/jax-toolbox-internal:11382252869-ma...
publish-containers (levanter, jax-mealkit, 500, ghcr.io/nvidia/jax-toolbox-internal:11382252869-l...
publish-containers (upstream-t5x, jax-mealkit, 500, ghcr.io/nvidia/jax-toolbox-internal:113822528...
publish-containers (upstream-pax, jax-mealkit, 500, ghcr.io/nvidia/jax-toolbox-internal:113822528...
publish-containers (t5x, jax-mealkit, 500, ghcr.io/nvidia/jax-toolbox-internal:11382252869-t5x-am...
publish-containers (pax, jax-mealkit, 500, ghcr.io/nvidia/jax-toolbox-internal:11382252869-pax-am...
publish-containers (gemma, jax-mealkit, 500, ghcr.io/nvidia/jax-toolbox-internal:11382252869-gemm...
publish-containers (base, jax, 800, ghcr.io/nvidia/jax-toolbox-internal:11382252869-base-amd64, g...
publish-containers (jax, jax, 1000, ghcr.io/nvidia/jax-toolbox-internal:11382252869-jax-amd64, gh...
publish-containers (triton, jax, 900, ghcr.io/nvidia/jax-toolbox-internal:11382252869-triton-amd6...
publish-containers (equinox, jax, 900, ghcr.io/nvidia/jax-toolbox-internal:11382252869-equinox-am...
publish-containers (maxtext, jax, 900, ghcr.io/nvidia/jax-toolbox-internal:11382252869-maxtext-am...
publish-containers (levanter, jax, 900, ghcr.io/nvidia/jax-toolbox-internal:11382252869-levanter-...
publish-containers (upstream-t5x, jax, 900, ghcr.io/nvidia/jax-toolbox-internal:11382252869-upstr...
publish-containers (upstream-pax, jax, 900, ghcr.io/nvidia/jax-toolbox-internal:11382252869-upstr...
publish-containers (t5x, jax, 900, ghcr.io/nvidia/jax-toolbox-internal:11382252869-t5x-amd64, ghc...
publish-containers (pax, jax, 900, ghcr.io/nvidia/jax-toolbox-internal:11382252869-pax-amd64, ghc...
publish-containers (gemma, jax, 900, ghcr.io/nvidia/jax-toolbox-internal:11382252869-gemma-amd64,...
finalize
You can’t perform that action at this time.