Commit b79f75f
authored
File tree
7 files changed
+321
-105
lines changed- 3rdparty
- examples/evaluation
- scripts/performance
- configs/qwen
7 files changed
+321
-105
lines changedSubmodule Megatron-LM updated 58 files
- .github/copy-pr-bot.yaml+1-1
- README.md+4-4
- docs/user-guide/features/multi_token_prediction.md+2-2
- docs/user-guide/quickstart.md-3
- examples/rl/README.md-1
- examples/rl/environment_configs/gsm8k_nanov3.yaml-2
- examples/rl/environments/countdown/countdown_agent.py+1-8
- examples/rl/environments/math/gsm8k_agent.py-4
- examples/rl/environments/math/math_agent.py+2-16
- examples/rl/model_configs/common.sh+1-1
- examples/rl/model_configs/llama3p1_8b_instruct.sh+1-3
- examples/rl/model_configs/nemotron6_3b_moe.sh+1-1
- examples/rl/model_configs/qwen3_4b.sh-2
- examples/rl/model_configs/qwen3_8b.sh-2
- examples/rl/model_configs/qwen_2p5_3b.sh+2-2
- examples/rl/model_configs/qwen_2p5_distill_7b.sh-2
- megatron/core/QuickStart.md+1-1
- megatron/core/inference/config.py+6
- megatron/core/inference/contexts/dynamic_context.py+35-7
- megatron/core/inference/text_generation_server/dynamic_text_gen_server/endpoints/chat_completions.py+83-34
- megatron/core/inference/text_generation_server/dynamic_text_gen_server/flask_server.py+21-8
- megatron/core/inference/unified_memory.py+6
- megatron/core/ssm/mamba_block.py+42-4
- megatron/core/tokenizers/text/libraries/huggingface_tokenizer.py+4-2
- megatron/core/tokenizers/text/parsers/__init__.py+12
- megatron/core/tokenizers/text/parsers/base_parser.py+21
- megatron/core/tokenizers/text/parsers/deepseek_r1_reasoning_parser.py+33
- megatron/core/tokenizers/text/parsers/qwen3_coder_tool_parser.py+282
- megatron/core/transformer/experimental_attention_variant/dsa.py+395-98
- megatron/core/transformer/module.py+5-1
- megatron/core/transformer/multi_token_prediction.py+4-4
- megatron/core/transformer/transformer_block.py+83-5
- megatron/inference/utils.py+1
- megatron/rl/agent/api.py-18
- megatron/rl/agent/pass_at_evaluation_agent.py+1-1
- megatron/rl/agent/reward_only_agent.py+9-43
- megatron/rl/inference/api.py+2-29
- megatron/rl/inference/chat_templates.py-51
- megatron/rl/inference/inference_interface.py+10-105
- megatron/rl/inference/megatron.py+45-86
- megatron/rl/rl_utils.py+21-38
- megatron/rl/server/inference/inference_interface_server.py+6-9
- megatron/training/arguments.py+4-6
- megatron/training/checkpointing.py+1-1
- pyproject.toml+3
- tests/functional_tests/test_cases/gpt/gpt_grpo_basic_function/model_config.yaml-2
- tests/functional_tests/test_cases/gpt/gpt_grpo_tp1tp2_pp1_dp8_583m_throughputtest/model_config.yaml-1
- tests/functional_tests/test_cases/gpt/gpt_grpo_tp1tp2_pp1_dp8_583m_throughputtest_github/model_config.yaml-1
- tests/functional_tests/test_cases/gpt/gpt_grpo_tp4_pp1_dp2_8b_cudagraphs_throughput/model_config.yaml-2
- tests/functional_tests/test_cases/gpt/gpt_grpo_tp4_pp1_dp2_8b_throughput/model_config.yaml-2
- tests/functional_tests/test_cases/gpt/gpt_grpo_tp4_pp1_dp2_8b_throughput_github/model_config.yaml-2
- tests/functional_tests/test_cases/moe/gpt_grpo_tp8tp4_pp1_ep8ep2_dp8_throughputtest/model_config.yaml-1
- tests/unit_tests/inference/contexts/test_dynamic_context.py+78
- tests/unit_tests/transformer/test_attention_variant_dsa.py+317
- tests/unit_tests/transformer/test_transformer_block.py+174
- tools/run_dynamic_text_generation_server.py+2
- train_rl.py-1
- uv.lock+201
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
13 | 13 | | |
14 | 14 | | |
15 | 15 | | |
16 | | - | |
17 | | - | |
18 | | - | |
19 | | - | |
| 16 | + | |
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
111 | 111 | | |
112 | 112 | | |
113 | 113 | | |
114 | | - | |
| 114 | + | |
| 115 | + | |
| 116 | + | |
| 117 | + | |
| 118 | + | |
| 119 | + | |
| 120 | + | |
| 121 | + | |
| 122 | + | |
| 123 | + | |
115 | 124 | | |
116 | 125 | | |
117 | 126 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
89 | 89 | | |
90 | 90 | | |
91 | 91 | | |
| 92 | + | |
92 | 93 | | |
93 | 94 | | |
94 | 95 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
78 | 78 | | |
79 | 79 | | |
80 | 80 | | |
| 81 | + | |
81 | 82 | | |
82 | 83 | | |
83 | 84 | | |
| |||
103 | 104 | | |
104 | 105 | | |
105 | 106 | | |
| 107 | + | |
106 | 108 | | |
107 | 109 | | |
108 | 110 | | |
| |||
206 | 208 | | |
207 | 209 | | |
208 | 210 | | |
| 211 | + | |
209 | 212 | | |
210 | 213 | | |
211 | 214 | | |
| |||
231 | 234 | | |
232 | 235 | | |
233 | 236 | | |
| 237 | + | |
234 | 238 | | |
235 | 239 | | |
236 | 240 | | |
| |||
256 | 260 | | |
257 | 261 | | |
258 | 262 | | |
| 263 | + | |
259 | 264 | | |
260 | 265 | | |
261 | 266 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
403 | 403 | | |
404 | 404 | | |
405 | 405 | | |
406 | | - | |
| 406 | + | |
407 | 407 | | |
408 | 408 | | |
409 | 409 | | |
| |||
0 commit comments