We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4f8cb4c, commit 3e4f747
Copy full SHA for 3e4f747
examples/mix_math/mix_math.yaml
@@ -11,7 +11,6 @@ algorithm:
11
clip_range: 0.2
12
use_token_level_loss_in_sft: true
13
use_dynamic_bsz: true
14
- repeat_times: 8
15
ppo_mini_batch_size: 320
16
ppo_micro_batch_size_per_gpu: 4
17
ngpus_trainer: 4
@@ -25,7 +24,7 @@ cluster:
25
24
node_num: 1
26
gpu_per_node: 8
27
buffer:
28
- total_epochs: 1
+ total_epochs: 10
29
batch_size: 40
30
max_retry_times: 3
31
max_retry_interval: 1
@@ -56,6 +55,7 @@ buffer:
56
55
storage_type: queue
57
path: /PATH/TO/BUFFER/
58
sft_warmup_dataset:
59
name: math_sft
60
storage_type: file
61
algorithm_type: sft
0 commit comments