We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 9d03959, commit ac54218 (Copy full SHA for ac54218)
open_diloco/train_fsdp.py
@@ -185,7 +185,11 @@ def _get_cosine_schedule_with_warmup_lr_lambda(
     num_cycles: float,
     min_lr_rate: float = 0.0,
 ):
-    if warmup_outerstep is not None and current_step % num_inner_steps < warmup_outerstep:
+    if (
+        warmup_outerstep is not None
+        and current_step > num_warmup_steps
+        and current_step % num_inner_steps < warmup_outerstep
+    ):
         return 0
 
     if current_step < num_warmup_steps:
0 commit comments