Skip to content

Commit 96d08aa

Browse files
committed
[megatron] support qwen3_omni dense (#7217)
1 parent b89e931 commit 96d08aa

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

swift/megatron/utils/config.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -110,8 +110,8 @@ def convert_hf_config(config) -> Dict[str, Any]:
110 110
interleave_moe_layer_step = res.pop('interleave_moe_layer_step', None)
111 111
window_size = res.pop('window_size', None)
112 112
if llm_architectures in {'Qwen3ForCausalLM', 'Qwen3MoeForCausalLM', 'Qwen3NextForCausalLM'} or architectures in {
113-
'Qwen3OmniMoeForConditionalGeneration', 'Qwen3VLForConditionalGeneration',
114-
'Qwen3VLMoeForConditionalGeneration'
113+
'Qwen3OmniMoeForConditionalGeneration', 'Qwen3OmniForConditionalGeneration',
114+
'Qwen3VLForConditionalGeneration', 'Qwen3VLMoeForConditionalGeneration'
115 115
}:
116 116
res['qk_layernorm'] = True
117 117
if llm_architectures in {'Qwen2MoeForCausalLM', 'Qwen3MoeForCausalLM', 'Qwen3NextForCausalLM'} or architectures in {

0 commit comments

Comments (0)