Skip to content

Commit d6b3150

Browse files
pwilkin and CISC authored
Update convert_hf_to_gguf.py
Co-authored-by: Sigbjørn Skjæret <[email protected]>
1 parent 0dda56d commit d6b3150

File tree

1 file changed

+7
-7
lines changed

1 file changed

+7
-7
lines changed

convert_hf_to_gguf.py

Lines changed: 7 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -4184,16 +4184,16 @@ def set_vocab(self):
41844184

41854185

41864186
@ModelBase.register("Qwen3NextForCausalLM")
4187-
class Qwen3NextModel(Qwen3MoeModel):
4187+
class Qwen3NextModel(Qwen2MoeModel):
41884188
model_arch = gguf.MODEL_ARCH.QWEN3NEXT
41894189

41904190
def set_gguf_parameters(self):
41914191
super().set_gguf_parameters()
4192-
self.gguf_writer.add_ssm_conv_kernel(self.find_hparam(["linear_conv_kernel_dim"]))
4193-
self.gguf_writer.add_ssm_state_size(self.find_hparam(["linear_key_head_dim"]))
4194-
self.gguf_writer.add_ssm_group_count(self.find_hparam(["linear_num_key_heads"]))
4195-
self.gguf_writer.add_ssm_time_step_rank(self.find_hparam(["linear_num_value_heads"]))
4196-
self.gguf_writer.add_ssm_inner_size(self.find_hparam(['linear_value_head_dim']) * self.find_hparam(['linear_num_value_heads']))
4192+
self.gguf_writer.add_ssm_conv_kernel(self.hparams["linear_conv_kernel_dim"])
4193+
self.gguf_writer.add_ssm_state_size(self.hparams["linear_key_head_dim"])
4194+
self.gguf_writer.add_ssm_group_count(self.hparams["linear_num_key_heads"])
4195+
self.gguf_writer.add_ssm_time_step_rank(self.hparams["linear_num_value_heads"])
4196+
self.gguf_writer.add_ssm_inner_size(self.hparams["linear_value_head_dim"] * self.hparams["linear_num_value_heads"])
41974197
if (rope_dim := self.hparams.get("head_dim")) is None:
41984198
rope_dim = self.hparams["hidden_size"] // self.hparams["num_attention_heads"]
41994199
self.gguf_writer.add_rope_dimension_count(int(rope_dim * self.hparams.get("partial_rotary_factor", 0.25)))
@@ -4210,7 +4210,7 @@ def modify_tensors(self, data_torch: Tensor, name: str, bid: int | None) -> Iter
42104210
elif name.endswith("norm.weight") and not name.endswith("linear_attn.norm.weight"):
42114211
data_torch = data_torch + 1
42124212

4213-
yield from Qwen2MoeModel.modify_tensors(self, data_torch, name, bid)
4213+
yield from super().modify_tensors(self, data_torch, name, bid)
42144214

42154215

42164216
@ModelBase.register("RND1")

0 commit comments

Comments (0)