4 files changed: +5 -5 lines changed
Original file line number | Diff line number | Diff line change
4 4 # Global configuration
5 5 group_size: 8
6 6 batch_size: 16
7 - max_req_tokens: 468
8 - max_res_tokens: 468
7 + max_req_tokens: 512
8 + max_res_tokens: 512
9 9 model: "Qwen/Qwen3-8B"
10 10 off_by_n: 1 # Off by one by default
11 11
Original file line number | Diff line number | Diff line change
@@ -18,7 +18,7 @@ NC='\033[0m'
18 18 PYTORCH_VERSION="2.9.0.dev20250905"
19 19 VLLM_BRANCH="v0.10.0"
20 20 MONARCH_COMMIT="9c41b5c16edadeab7cfb8521ba7efe68a1e2bc87"
21 - TORCHTITAN_COMMIT="a3104201ba3a0fa19e9c3cc5ba748b0398551410"
21 + TORCHTITAN_COMMIT="9f3fe08635356b829e6bf41883760679a8207697"
22 22 TORCHSTORE_COMMIT="0052f6d8b686b9cff0cf4ce203a836c4b5d5ac94"
23 23 BUILD_DIR="$HOME/forge-build"
24 24 WHEEL_DIR="$(pwd)/assets/wheels"
Original file line number | Diff line number | Diff line change
27 27     Checkpoint,
28 28     Comm,
29 29     Compile,
30 -     Float8Dense,
30 +     Float8Linear,
31 31     LRScheduler,
32 32     Model,
33 33     Optimizer,
@@ -104,7 +104,7 @@ class RLTrainer(ForgeActor):
104 104     )
105 105     use_vllm_builtin_load: bool = True
106 106     compile: Compile = field(default_factory=Compile)
107 -     float8: Float8Dense = field(default_factory=Float8Dense)
107 +     float8: Float8Linear = field(default_factory=Float8Linear)
108 108     comm: Comm = field(default_factory=Comm)
109 109     loss: Callable = lambda logits, **targets: logits
110 110     state_dict_key: str = "model_state_dict"
You can’t perform that action at this time.
0 commit comments