# Patch for .github/workflows/cicd-main.yml (text before "diff --git" is ignored by patch tools).
# - L0_Unit_Tests_GPU_Lightning: drops the OPTIONAL_ prefix and IS_OPTIONAL flag, and is
#   enabled in the job list near line 4323 (presumably the gating job's `needs:` -- confirm).
# - Megatron GPT Pretraining/Resume PP2: gains the OPTIONAL_ prefix and IS_OPTIONAL: true,
#   and is commented out of the job list near line 4390.
# NOTE(review): indentation was reconstructed; verify against the target file before applying.
diff --git a/.github/workflows/cicd-main.yml b/.github/workflows/cicd-main.yml
index 345482e9a1a8..55a952c21eb6 100644
--- a/.github/workflows/cicd-main.yml
+++ b/.github/workflows/cicd-main.yml
@@ -217,15 +217,14 @@ jobs:
       SCRIPT: |
         NEMO_NUMBA_MINVER=0.53 pytest tests/hydra -m "not pleasefixme" --with_downloads
 
-  OPTIONAL_L0_Unit_Tests_GPU_Lightning:
+  L0_Unit_Tests_GPU_Lightning:
     needs: [cicd-test-container-setup]
     uses: ./.github/workflows/_test_template.yml
-    if: contains(fromJSON(needs.cicd-test-container-setup.outputs.test_to_run), 'OPTIONAL_L0_Unit_Tests_GPU_Lightning') || needs.cicd-test-container-setup.outputs.all == 'true'
+    if: contains(fromJSON(needs.cicd-test-container-setup.outputs.test_to_run), 'L0_Unit_Tests_GPU_Lightning') || needs.cicd-test-container-setup.outputs.all == 'true'
     with:
       RUNNER: self-hosted-azure
       SCRIPT: |
         NEMO_NUMBA_MINVER=0.53 pytest tests/lightning -m "not pleasefixme" --with_downloads
-      IS_OPTIONAL: true
 
   L0_Unit_Tests_GPU_Others:
     needs: [cicd-test-container-setup]
@@ -2468,10 +2467,10 @@ jobs:
         rm -rf examples/nlp/language_modeling/gpt_pretrain_results
         rm -rf examples/nlp/language_modeling/gpt_index_mappings
 
-  L2_Megatron_GPT_Pretraining_and_Resume_Training_PP2:
+  OPTIONAL_L2_Megatron_GPT_Pretraining_and_Resume_Training_PP2:
     needs: [cicd-test-container-setup]
     uses: ./.github/workflows/_test_template.yml
-    if: contains(fromJSON(needs.cicd-test-container-setup.outputs.test_to_run), 'L2_Megatron_GPT_Pretraining_and_Resume_Training_PP2') || needs.cicd-test-container-setup.outputs.all == 'true'
+    if: contains(fromJSON(needs.cicd-test-container-setup.outputs.test_to_run), 'OPTIONAL_L2_Megatron_GPT_Pretraining_and_Resume_Training_PP2') || needs.cicd-test-container-setup.outputs.all == 'true'
     with:
       RUNNER: self-hosted-azure-gpus-2-h100
       SCRIPT: |
@@ -2578,6 +2577,7 @@ jobs:
       AFTER_SCRIPT: |
         rm -rf examples/nlp/language_modeling/gpt_pretrain_results
         rm -rf examples/nlp/language_modeling/gpt_index_mappings
+      IS_OPTIONAL: true
 
   OPTIONAL_L2_Megatron_GPT_Auto_Configurator_TP1_PP1_MBS124:
     needs: [cicd-test-container-setup]
@@ -4323,7 +4323,7 @@ jobs:
       - L0_Unit_Tests_GPU_TTS
       #- OPTIONAL_L0_Unit_Tests_GPU_Core
       - L0_Unit_Tests_GPU_Hydra
-      #- OPTIONAL_L0_Unit_Tests_GPU_Lightning
+      - L0_Unit_Tests_GPU_Lightning
       - L0_Unit_Tests_GPU_Others
 
       - L0_Unit_Tests_CPU_ASR
@@ -4390,7 +4390,7 @@ jobs:
       - L2_Megatron_GPT_with_Drop_Optimizer_States_TP2
       - L2_Megatron_GPT_with_ALiBi_Pretraining_and_Resume_Training_TP2
       - L2_Megatron_GPT_with_KERPLE_Pretraining_and_Resume_Training_TP2
-      - L2_Megatron_GPT_Pretraining_and_Resume_Training_PP2
+      #- OPTIONAL_L2_Megatron_GPT_Pretraining_and_Resume_Training_PP2
       #- OPTIONAL_L2_Megatron_GPT_Auto_Configurator_TP1_PP1_MBS124
       - L2_Megatron_GPT_Finetuning_PP2
       - L2_Megatron_GPT_Finetuning_StarCoder_PP1