Skip to content

Commit d7e82d9

Browse files
committed
Merge branch 'ko3n1g/ci/fix-notifications-2' into 'main'
ci: Fix notifications

See merge request ADLR/megatron-lm!2265
2 parents 32e427d + 8bac43a commit d7e82d9

File tree

4 files changed

+7
-7
lines changed

4 files changed

+7
-7
lines changed

tests/functional_tests/jet_recipes/gpt.yaml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -55,7 +55,6 @@ products:
5555
- gpt3_mr_mcore_te_tp1_pp4_vp1_decoupled_lr_dgx_a100_1N8G
5656
- gpt3_mr_mcore_te_tp1_pp4_vp1_uneven_pipeline_dgx_a100_1N8G
5757
- gpt3_mr_mcore_te_tp1_pp4_vp1_dgx_a100_1N8G
58-
- gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G
5958
- gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_overlap_optimizer_dgx_a100_1N8G
6059
- gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G
6160
- gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_decoupled_lr_dgx_a100_1N8G
@@ -73,10 +72,9 @@ products:
7372
- gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G
7473
- gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G
7574
- gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_overlap_grad_reduce_param_gather_groupedGEMM_dgx_a100_1N8G
76-
- gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_top2router_dgx_a100_1N8G
75+
# - gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_top2router_dgx_a100_1N8G
7776
- gpt3_mr_mcore_te_tp2_pp2_cross_entropy_loss_fusion_dgx_a100_1N8G
7877
- gpt3_mr_mcore_te_tp2_pp2_ddp_average_in_collective_dgx_a100_1N8G
79-
- gpt3_mr_mcore_te_tp2_pp2_defer_embedding_wgrad_compute_dgx_a100_1N8G
8078
- gpt3_mr_mcore_te_tp2_pp2_dgx_a100_1N8G
8179
- gpt3_mr_mcore_te_tp2_pp2_no_create_attention_mask_in_dataloader_dgx_a100_1N8G
8280
- gpt3_mr_mcore_te_tp2_pp2_no_mmap_bin_files_dgx_a100_1N8G
@@ -139,11 +137,13 @@ products:
139137
platforms: [dgx_a100]
140138
time_limit: [1800]
141139
test_case:
140+
- gpt3_mr_mcore_te_tp2_pp2_defer_embedding_wgrad_compute_dgx_a100_1N8G
142141
- gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G
143142
- gpt3_mr_mcore_te_tp2_pp1_cp2_nondeterministic_dgx_a100_1N8G
144143
- gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G
145144
- gpt3_mr_mcore_te_tp2_pp2_cp2_nondeterministic_dgx_a100_1N8G
146145
- gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G
146+
- gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G
147147
- environment: [lts]
148148
scope: [weekly]
149149
platforms: [dgx_h100]

tests/functional_tests/jet_recipes/t5.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -36,14 +36,14 @@ products:
3636
- t5_220m_mr_mcore_te_tp4_pp1_dgx_a100_1N8G
3737
- t5_220m_mr_mcore_te_tp4_pp1_resume_torch_dist_dgx_a100_1N8G
3838
- t5_220m_mr_mcore_te_tp2_pp2_resume_torch_dgx_a100_1N8G
39-
- t5_220m_mr_mcore_tp4_pp1_dgx_a100_1N8G
4039
- t5_220m_mr_mcore_tp4_pp1_resume_torch_dist_dgx_a100_1N8G
4140
- t5_220m_mr_mcore_tp2_pp2_resume_torch_dgx_a100_1N8G
42-
- t5_220m_mr_mcore_tp2_pp2_dgx_a100_1N8G
4341
- environment: [lts]
4442
scope: [mr]
4543
time_limit: [1800]
4644
test_case:
45+
- t5_220m_mr_mcore_tp4_pp1_dgx_a100_1N8G
46+
- t5_220m_mr_mcore_tp2_pp2_dgx_a100_1N8G
4747
- t5_220m_mr_mcore_te_tp2_pp2_dgx_a100_1N8G
4848
- environment: [lts]
4949
scope: [weekly]

tests/functional_tests/shell_test_utils/notify.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -48,7 +48,7 @@ if [[ ${ret_code:-0} -ne 0 ]]; then
4848
fi
4949

5050
# Fetch GitLab logs of JET downstream pipeline
51-
DOWNSTREAM_PIPELINE_ID=$(jq --arg environment "$ENVIRONMENT" '.[] |select(.name == "jet-trigger-" + $environment) | .downstream_pipeline.id' <<< "$PIPELINE_JSON")
51+
DOWNSTREAM_PIPELINE_ID=$(jq --arg environment "$ENVIRONMENT" '.[] |select(.name == "functional:run_" + $environment) | .downstream_pipeline.id' <<< "$PIPELINE_JSON")
5252

5353
PIPELINE_URL=https://${GITLAB_ENDPOINT}/ADLR/megatron-lm/-/pipelines/$CI_PIPELINE_ID
5454
JOB_URL=https://${GITLAB_ENDPOINT}/ADLR/megatron-lm/-/jobs/

tests/functional_tests/shell_test_utils/notify_unit_tests.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -48,7 +48,7 @@ if [[ ${ret_code:-0} -ne 0 ]]; then
4848
exit 1
4949
fi
5050

51-
UNIT_TESTS_JOBS=$(echo -E $PIPELINE_JSON | jq '[.[] | select(.name | startswith("test:unit_tests_"))]')
51+
UNIT_TESTS_JOBS=$(echo -E $PIPELINE_JSON | jq '[.[] | select(.name | startswith("test:pyt"))]')
5252

5353
if [[ $UNIT_TESTS_JOBS == null ]]; then
5454
FAILED_JOBS=$(curl \

0 commit comments

Comments
 (0)