Commit c53d4dc

Add AWQ mapping for GlmMoeDsaForCausalLM (GLM-5)
GLM-5 uses Multi-head Latent Attention identical to DeepSeek V3 — same projection names (q_a_proj, kv_a_proj_with_mqa, etc.) and same MoE structure. Reuses _deepseek_mappings. Also moves Glm4MoeForCausalLM to its correct alphabetical position.
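The reuse described in the commit message can be sketched as follows. This is a minimal, illustrative stand-in, not the actual `llmcompressor` source: the `AWQMapping` dataclass and the regex patterns below are simplified assumptions, with the projection names (`q_a_proj`, `kv_a_proj_with_mqa`) taken from the commit message.

```python
from dataclasses import dataclass, field

# Simplified stand-in for llmcompressor's AWQMapping: pairs a layer whose
# activation scales are observed ("smooth") with the layers whose weights
# absorb the computed scales ("balance").
@dataclass
class AWQMapping:
    smooth_layer: str
    balance_layers: list[str] = field(default_factory=list)

# Hypothetical sketch of DeepSeek-V3-style MLA mappings. The low-rank
# latent projections q_a_proj and kv_a_proj_with_mqa are the names the
# commit message says GLM-5 shares with DeepSeek V3.
_deepseek_mappings = [
    AWQMapping(
        "re:.*input_layernorm$",
        ["re:.*q_a_proj$", "re:.*kv_a_proj_with_mqa$"],
    ),
    AWQMapping(
        "re:.*post_attention_layernorm$",
        ["re:.*gate_proj$", "re:.*up_proj$"],
    ),
]

# Because the attention and MoE structure is identical at this level,
# both architectures can point at the same mapping list -- the whole
# point of the commit is that no new mapping definition is needed.
AWQ_MAPPING_REGISTRY = {
    "DeepseekV3ForCausalLM": _deepseek_mappings,
    "GlmMoeDsaForCausalLM": _deepseek_mappings,  # GLM-5, added here
}
```

With this layout, looking up either architecture returns the very same mapping object, so any future fix to the DeepSeek mappings applies to GLM-5 automatically.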
1 parent: a9847e0

File tree

1 file changed: +2 −1 lines changed
src/llmcompressor/modifiers/awq/mappings.py

Lines changed: 2 additions & 1 deletion

@@ -251,6 +251,8 @@ class AWQMapping:
     "Gemma2ForCausalLM": _gemma_mappings,
     "Gemma3ForCausalLM": _gemma_mappings,
     "Gemma3ForConditionalGeneration": _gemma_mappings,
+    "Glm4MoeForCausalLM": _default_mappings,
+    "GlmMoeDsaForCausalLM": _deepseek_mappings,
     "LlamaForCausalLM": _default_mappings,
     "Llama4ForConditionalGeneration": _default_mappings,
     "Mistral3ForConditionalGeneration": _default_mappings,
@@ -264,7 +266,6 @@ class AWQMapping:
     "Qwen3ForCausalLM": _default_mappings,
     "Qwen3MoeForCausalLM": _moe_default_mappings,
     "Qwen3NextForCausalLM": _qwen3_next_moe_mappings,
-    "Glm4MoeForCausalLM": _default_mappings,
     "SeedOssForCausalLM": _default_mappings,
     "Ernie4_5_MoeForCausalLM": _default_mappings,
 }
