We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent f3e63c6 commit 0ca37bf (Copy full SHA for 0ca37bf)
examples/configs/sft_nemotron_super_49b.yaml
@@ -24,7 +24,7 @@ policy:
24
# name: Qwen/Qwen2.5-7B-Instruct
25
model_name: "/lustre/fsw/portfolios/coreai/users/joyang/models/llama-3_3-nemotron-49b-instruct-128k-v1_2-hf"
26
tokenizer:
27
- name: "nvidia/Llama-3_3-Nemotron-Super-49B-v1_5"
+ name: ${policy.model_name}
28
max_total_sequence_length: 4096
29
precision: "bfloat16"
30
train_global_batch_size: 128
0 commit comments