We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent d1cfaa0 commit 6d43f53 (Copy full SHA for 6d43f53)
slime/utils/arguments.py
@@ -149,9 +149,8 @@ def add_train_arguments(parser):
149
help="The method to convert megatron weights to hugging face weights for SGLang.",
150
)
151
parser.add_argument(
152
- "--disable-recompute-loss-function",
153
- action="store_false",
154
- dest="recompute_loss_function",
+ "--recompute-loss-function",
+ action="store_true",
155
help="Whether to recompute the loss function to save memory during training.",
156
157
0 commit comments