diff --git a/chapters/en/chapter12/4.mdx b/chapters/en/chapter12/4.mdx
index 769bb561c..4e440bd61 100644
--- a/chapters/en/chapter12/4.mdx
+++ b/chapters/en/chapter12/4.mdx
@@ -89,7 +89,7 @@ training_args = GRPOConfig(
     # Essential parameters
     output_dir="output",
     num_train_epochs=3,
-    num_generation=4,  # Number of completions to generate for each prompt
+    num_generations=4,  # Number of completions to generate for each prompt
     per_device_train_batch_size=4,  # We want to get all generations in one device batch
     # Optional but useful
     gradient_accumulation_steps=2,