We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 55ecef3 · commit 6d27c86 · Copy full SHA for 6d27c86
apps/grpo/qwen3_8b.yaml
@@ -53,7 +53,7 @@ trainer:
53
lr_scheduler:
54
warmup_steps: 1
55
training:
56
- local_local_batch_size: ${local_batch_size}
+ local_batch_size: ${local_batch_size}
57
seq_len: 2048
58
max_norm: 1.0
59
steps: 1000000
0 commit comments