115115if [[ $USE_MOCK_DATA -eq 1 ]]; then
116116 # EXTRA_ARGS+=" --mock-data --sft-mock-dataset-config-json '{\"mode\":\"file\",\"path\":\"path/to/file\"}'"
117117 if [[ $BATCH -eq 0 ]]; then
118- EXTRA_ARGS+=" --mock-data --sft-mock-dataset-config-json {\"mode\":\"distribution\",\"type\":\"lognormal\",\"min_seq_len\":1024,\"max_seq_len\":16384,\"mean_seq_len\":8192,\"lognormal_sigma\":1.1} "
118+ EXTRA_ARGS+=" --mock-data --sft-mock-dataset-config-json {\"mode\":\"distribution\",\"type\":\"lognormal\",\"min_seq_len\":1024,\"max_seq_len\":16384,\"mean_seq_len\":8192,\"lognormal_sigma\":1.1} --tokenizer-type NullTokenizer --vocab-size 131072 "
119119 else
120- EXTRA_ARGS+=" --mock-data --sft-mock-dataset-config-json '{\"mode\":\"distribution\",\"type\":\"lognormal\",\"min_seq_len\":1024,\"max_seq_len\":16384,\"mean_seq_len\":8192,\"lognormal_sigma\":1.1}' "
120+ EXTRA_ARGS+=" --mock-data --sft-mock-dataset-config-json '{\"mode\":\"distribution\",\"type\":\"lognormal\",\"min_seq_len\":1024,\"max_seq_len\":16384,\"mean_seq_len\":8192,\"lognormal_sigma\":1.1}' --tokenizer-type NullTokenizer --vocab-size 131072 "
121121 fi
122122else
123- EXTRA_ARGS+=" --data-path ${DATA_TRAIN} "
123+ EXTRA_ARGS+=" --data-path ${DATA_TRAIN} --tokenizer-model ${TOKENIZER} "
124124fi
125125
126126if [[ $USE_FSDP -eq 1 ]]; then
@@ -143,7 +143,6 @@ OPTIONS=" \
143143 --use-distributed-optimizer \
144144 --disable-bias-linear \
145145 --sft-tokenizer-prompt-format nemotron-h-aligned \
146- --tokenizer-model ${TOKENIZER} \
147146 --transformer-impl transformer_engine \
148147 --normalization RMSNorm \
149148 --norm-epsilon 1e-06 \
0 commit comments