We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 8cc497f, commit 9a8dc6d (Copy full SHA for 9a8dc6d)
src/megatron/bridge/recipes/qwen_vl/qwen3_vl.py
@@ -248,7 +248,7 @@ def qwen3_omni_30b_a3b_finetune_config(**user_kwargs: Unpack[Qwen3VLCommonKwargs
248
is_full_sft = peft_value is None or (isinstance(peft_value, str) and peft_value.lower() == "none")
249
250
recommended_kwargs: Qwen3VLCommonKwargs = {
251
- "hf_path": "../hf-hub/Qwen/Qwen3-Omni-30B-A3B-Instruct",
+ "hf_path": "Qwen/Qwen3-Omni-30B-A3B-Instruct",
252
"tensor_model_parallel_size": 1,
253
"pipeline_model_parallel_size": 1,
254
"pipeline_dtype": torch.bfloat16,
0 commit comments