Skip to content

Commit 611c70f

Browse files
committed
Merge branch 'main' into ahmadki/simulated-user-rec
Signed-off-by: Ahmad Kiswani <[email protected]>
2 parents 6c6b723 + 3a69c21 commit 611c70f

File tree

232 files changed

+23768
-7864
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

232 files changed

+23768
-7864
lines changed

.github/ISSUE_TEMPLATE/bug_report.md

Lines changed: 0 additions & 42 deletions
This file was deleted.

.github/ISSUE_TEMPLATE/feature_request.md

Lines changed: 0 additions & 25 deletions
This file was deleted.

.github/workflows/cherry-pick-release-commit.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -20,7 +20,7 @@ on:
2020

2121
jobs:
2222
cherry-pick:
23-
uses: NVIDIA-NeMo/FW-CI-templates/.github/workflows/_cherry_pick.yml@v0.31.0
23+
uses: NVIDIA-NeMo/FW-CI-templates/.github/workflows/_cherry_pick.yml@v0.63.0
2424
secrets:
2525
PAT: ${{ secrets.PAT }}
2626
SLACK_WEBHOOK_ADMIN: ${{ secrets.SLACK_WEBHOOK_ADMIN }}

.github/workflows/cicd-main.yml

Lines changed: 7 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -288,7 +288,7 @@ jobs:
288288
is_fork_pr: ${{ github.event_name == 'pull_request' && github.event.pull_request.head.repo.full_name != github.event.pull_request.base.repo.full_name }}
289289

290290
CI_QA_Gate:
291-
name: CI quality check
291+
name: "CI quality check${{ needs.pre-flight.outputs.test_level == 'none' && ' (No tests run: Label CI:L*)' || '' }}"
292292
if: always()
293293
runs-on: ubuntu-latest
294294
needs:
@@ -310,17 +310,14 @@ jobs:
310310
needs.lint-check.result == 'success' &&
311311
(needs.pr-branch-up-to-date-check.result == 'success' || needs.pr-branch-up-to-date-check.result == 'skipped') &&
312312
(
313-
needs.pre-flight.outputs.test_level == 'none' ||
313+
needs.pre-flight.outputs.test_level != 'none' &&
314+
needs.sphinx-build.result == 'success' &&
315+
needs.build-container.result == 'success' &&
314316
(
315-
needs.pre-flight.outputs.test_level != 'none' &&
316-
needs.sphinx-build.result == 'success' &&
317-
needs.build-container.result == 'success' &&
318317
(
319-
(
320-
(needs.cicd-doc-tests.result == 'skipped' || needs.cicd-doc-tests.result == 'success') &&
321-
(needs.cicd-unit-tests.result == 'skipped' || needs.cicd-unit-tests.result == 'success') &&
322-
(needs.cicd-functional-tests.result == 'skipped' || needs.cicd-functional-tests.result == 'success')
323-
)
318+
needs.cicd-doc-tests.result == 'success' &&
319+
(needs.cicd-unit-tests.result == 'skipped' || needs.cicd-unit-tests.result == 'success') &&
320+
(needs.cicd-functional-tests.result == 'skipped' || needs.cicd-functional-tests.result == 'success')
324321
)
325322
)
326323
)

.gitignore

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
# Adding to .gitignore helps reduce the size of your working_dir
22

3-
.git
3+
/.git
44
*.out
55
*.log
66
*.tar
@@ -17,7 +17,6 @@ dist/
1717
*.vscode/
1818
release_run*
1919
ckpts/
20-
3rdparty/vllm
2120

2221
# Test
2322
coverage.json
@@ -33,7 +32,7 @@ uv_cache/
3332
hf_home/
3433
hf_datasets_cache/
3534
*logs/
36-
datasets/
35+
/datasets/
3736
docker/*
3837
!docker/Dockerfile
3938
!docker/Dockerfile.ngc_pytorch

.gitmodules

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
[submodule "3rdparty/Megatron-LM"]
22
path = 3rdparty/Megatron-LM-workspace/Megatron-LM
33
url = https://github.com/terrykong/Megatron-LM.git
4-
branch = yuya/nemo-rl-use-2
4+
branch = guyueh/yuya/nemo-rl-use-2
55
shallow = true
66
[submodule "3rdparty/Megatron-Bridge"]
77
path = 3rdparty/Megatron-Bridge-workspace/Megatron-Bridge

.pre-commit-config.yaml

Lines changed: 35 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -46,3 +46,38 @@ repos:
4646
require_serial: true
4747
additional_dependencies: []
4848
minimum_pre_commit_version: "2.9.2"
49+
50+
# This pre-commit hook ensures that the config file is minimized and reflects exactly what you
51+
# intend to merge. Without it, you might run experiments with one config, but when merging upstream,
52+
# the config could silently fall back to the base defaults—resulting in different hyperparameters.
53+
#
54+
# For example, we’ve seen cases where an SFT recipe runs without a custom chat_template. When merged,
55+
# it unexpectedly picks up the default recommended chat_template from upstream, which doesn’t match
56+
# the original experiment setup.
57+
#
58+
# If this check is disruptive, you can disable the pre-commit hook locally. However, before a recipe
59+
# is accepted upstream, we expect the config to be minimized.
60+
- repo: local
61+
hooks:
62+
- id: configs-minimize-check-llm
63+
name: minimize-check llm recipes
64+
language: system
65+
pass_filenames: false
66+
entry: bash
67+
args:
68+
- -lc
69+
- |
70+
set -euo pipefail
71+
base="examples/configs/dpo.yaml"; for f in examples/configs/recipes/llm/dpo-*.yaml; do [ -e "$f" ] && ./tools/config_cli.py minimize-check "$base" "$f"; done
72+
base="examples/configs/grpo_math_1B.yaml"; for f in examples/configs/recipes/llm/grpo-*.yaml; do [ -e "$f" ] && ./tools/config_cli.py minimize-check "$base" "$f"; done
73+
base="examples/configs/sft.yaml"; for f in examples/configs/recipes/llm/sft-*.yaml; do [ -e "$f" ] && ./tools/config_cli.py minimize-check "$base" "$f"; done
74+
- id: configs-minimize-check-vlm
75+
name: minimize-check vlm recipes
76+
language: system
77+
pass_filenames: false
78+
entry: bash
79+
args:
80+
- -lc
81+
- |
82+
set -euo pipefail
83+
base="examples/configs/vlm_grpo_3B.yaml"; for f in examples/configs/recipes/vlm/vlm_grpo-*.yaml; do [ -e "$f" ] && ./tools/config_cli.py minimize-check "$base" "$f"; done

3rdparty/Megatron-Bridge-workspace/setup.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -33,7 +33,7 @@
3333
"packaging",
3434
"tensorboard>=2.19.0",
3535
"torch",
36-
"transformers>=4.51.3",
36+
"transformers>=4.55.0",
3737
"typing-extensions",
3838
"rich",
3939
"wandb>=0.19.10",

0 commit comments

Comments
 (0)