diff --git a/apps/grpo/qwen3_8b.yaml b/apps/grpo/qwen3_8b.yaml
index 22a4a3961..a2815c5c0 100644
--- a/apps/grpo/qwen3_8b.yaml
+++ b/apps/grpo/qwen3_8b.yaml
@@ -3,7 +3,7 @@
 
 # Global configuration
 group_size: 8
-local_batch_size: 16 # per-device batch size
+local_batch_size: 12 # per-device batch size
 max_req_tokens: 1024
 max_res_tokens: 1024
 model: "Qwen/Qwen3-8B"