File tree Expand file tree Collapse file tree 3 files changed +13
-15
lines changed Expand file tree Collapse file tree 3 files changed +13
-15
lines changed Original file line number Diff line number Diff line change @@ -14,15 +14,14 @@ rollout_threads: 1   # Recommended to set equal to policy.num_replicas
1414
1515
1616#  Observability configuration
17- #  logging_mode: global_reduce, per_rank_reduce, per_rank_no_reduce
1817metric_logging :
1918  wandb :
20-     project : " grpo-training" 
21-     group : " grpo_exp_${oc.env:USER}" 
22-     logging_mode : " global_reduce" 
19+     project : grpo-training 
20+     group : grpo_exp_${oc.env:USER} 
21+     logging_mode : global_reduce   #  global_reduce, per_rank_reduce, per_rank_no_reduce 
2322    per_rank_share_run : False 
2423  console :
25-     logging_mode : " global_reduce" 
24+     logging_mode : global_reduce 
2625
2726#  Dataset configuration
2827dataset :
Original file line number Diff line number Diff line change @@ -17,15 +17,14 @@ provisioner:
1717rollout_threads : 1    #  Recommended to set equal to policy.num_replicas
1818
1919#  Observability configuration
20- #  logging_mode: global_reduce, per_rank_reduce, per_rank_no_reduce
2120metric_logging :
2221  wandb :
23-     project : " grpo-training" 
24-     group : " grpo_exp_${oc.env:USER}" 
25-     logging_mode : " global_reduce" 
22+     project : grpo-training 
23+     group : grpo_exp_${oc.env:USER} 
24+     logging_mode : global_reduce   #  global_reduce, per_rank_reduce, per_rank_no_reduce 
2625    per_rank_share_run : False 
2726  console :
28-     logging_mode : " global_reduce" 
27+     logging_mode : global_reduce 
2928
3029#  Dataset configuration
3130dataset :
Original file line number Diff line number Diff line change @@ -10,15 +10,15 @@ model: "Qwen/Qwen3-8B"
1010off_by_n : 1  #  Off by one by default
1111
1212#  Observability configuration
13- #  logging_mode: global_reduce, per_rank_reduce, per_rank_no_reduce 
13+ #  Observability configuration 
1414metric_logging :
1515  wandb :
16-     project : " grpo-training" 
17-     group : " grpo_exp_${oc.env:USER}" 
18-     logging_mode : " global_reduce" 
16+     project : grpo-training 
17+     group : grpo_exp_${oc.env:USER} 
18+     logging_mode : global_reduce   #  global_reduce, per_rank_reduce, per_rank_no_reduce 
1919    per_rank_share_run : False 
2020  console :
21-     logging_mode : " global_reduce" 
21+     logging_mode : global_reduce 
2222
2323#  Dataset configuration
2424dataset :
 
 
   
 
     
   
   
          
    
    
     
    
      
     
     
    You can’t perform that action at this time.
  
 
    
  
    
      
        
     
       
      
     
   
 
    
    
  
 
  
 
     
    
0 commit comments