Skip to content

Commit b33e440

Browse files
Zeyi-Lin, clumsy, azzhipa, terrykong
authored
fix: swanlab logger error caused by define_metric (#1615)
Signed-off-by: ZeYi Lin <[email protected]> Signed-off-by: Alexander Zhipa <[email protected]> Co-authored-by: Alexander Zhipa <[email protected]> Co-authored-by: Alexander Zhipa <[email protected]> Co-authored-by: Terry Kong <[email protected]>
1 parent 32f5bef commit b33e440

File tree

14 files changed

+66
-69
lines changed

14 files changed

+66
-69
lines changed

examples/configs/distillation_math.yaml

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -226,6 +226,9 @@ logger:
226226
wandb:
227227
project: "nemo-distillation"
228228
name: "distillation-${data.dataset_name}-${teacher.model_name}-${policy.model_name}-${loss_fn.kl_type}-${distillation.topk_logits_k}"
229+
swanlab:
230+
project: "nemo-distillation"
231+
name: "distillation-${data.dataset_name}-${teacher.model_name}-${policy.model_name}-${loss_fn.kl_type}-${distillation.topk_logits_k}"
229232
tensorboard:
230233
log_dir: "tb_logs-distillation-${data.dataset_name}"
231234
mlflow:

examples/configs/dpo.yaml

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -207,6 +207,9 @@ logger:
207207
wandb:
208208
project: "dpo-dev"
209209
name: "dpo"
210+
swanlab:
211+
project: "dpo-dev"
212+
name: "dpo"
210213
tensorboard:
211214
log_dir: "tb_logs-dpo-dev"
212215
mlflow:

examples/configs/grpo_math_1B.yaml

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -283,6 +283,9 @@ logger:
283283
wandb:
284284
project: "grpo-dev"
285285
name: "grpo-dev-logger"
286+
swanlab:
287+
project: "grpo-dev"
288+
name: "grpo-dev-logger"
286289
tensorboard: {}
287290
mlflow:
288291
experiment_name: "grpo-dev"

examples/configs/grpo_math_1B_megatron.yaml

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -175,6 +175,9 @@ logger:
175175
wandb:
176176
project: "grpo-dev"
177177
name: "sj_megatron_1B"
178+
swanlab:
179+
project: "grpo-dev"
180+
name: "sj_megatron_1B"
178181
tensorboard: {}
179182
mlflow:
180183
experiment_name: "grpo-dev"

examples/configs/grpo_sliding_puzzle.yaml

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -68,6 +68,9 @@ logger:
6868
wandb:
6969
project: "grpo-dev"
7070
name: "grpo-dev-sliding_puzzle"
71+
swanlab:
72+
project: "grpo-dev"
73+
name: "grpo-dev-sliding_puzzle"
7174
tensorboard: {}
7275
mlflow:
7376
experiment_name: "grpo-dev"

examples/configs/rm.yaml

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -171,6 +171,9 @@ logger:
171171
wandb:
172172
project: "rm-dev"
173173
name: "rm-dev-${data.dataset_name}"
174+
swanlab:
175+
project: "rm-dev"
176+
name: "rm-dev-${data.dataset_name}"
174177
tensorboard:
175178
log_dir: "tb_logs-rm-dev-${data.dataset_name}"
176179
gpu_monitoring:

examples/configs/sft.yaml

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -203,6 +203,9 @@ logger:
203203
wandb:
204204
project: "sft-dev"
205205
name: "sft-dev-${data.dataset_name}"
206+
swanlab:
207+
project: "sft-dev"
208+
name: "sft-dev-${data.dataset_name}"
206209
tensorboard:
207210
log_dir: "tb_logs-sft-dev-${data.dataset_name}"
208211
mlflow:

examples/configs/sft_openmathinstruct2.yaml

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -88,6 +88,9 @@ logger:
8888
wandb:
8989
project: "sft-dev"
9090
name: "openmathinstruct-nemorl-1M_train"
91+
swanlab:
92+
project: "sft-dev"
93+
name: "openmathinstruct-nemorl-1M_train"
9194
tensorboard:
9295
log_dir: "tb_logs-openmathinstruct-nemorl-1M_train"
9396
mlflow:

examples/configs/vlm_grpo_3B.yaml

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -271,6 +271,9 @@ logger:
271271
wandb:
272272
project: "grpo-dev"
273273
name: "grpo-dev-logger"
274+
swanlab:
275+
project: "grpo-dev"
276+
name: "grpo-dev-logger"
274277
tensorboard: {}
275278
gpu_monitoring:
276279
collection_interval: 10 # How often to collect GPU usage metrics (in seconds)

examples/configs/vlm_grpo_3B_megatron.yaml

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -221,6 +221,9 @@ logger:
221221
wandb:
222222
project: grpo-dev
223223
name: vlm-grpo-3b-megatron
224+
swanlab:
225+
project: grpo-dev
226+
name: vlm-grpo-3b-megatron
224227
tensorboard: {}
225228
gpu_monitoring:
226229
collection_interval: 10

0 commit comments

Comments
 (0)