Skip to content

Commit adff470

Browse files
committed
more cleanups and fixed conversion
1 parent 823696b commit adff470

File tree

3 files changed

+1
-3
lines changed

3 files changed

+1
-3
lines changed

convert_hf_to_gguf.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -6655,7 +6655,7 @@ def set_gguf_parameters(self):
6655 6655   ## Mamba mixer params ##
6656 6656   self.gguf_writer.add_ssm_conv_kernel(self.find_hparam(["conv_kernel", "d_conv"]))
6657 6657   self.gguf_writer.add_ssm_group_count(self.n_group)
6658      - self.gguf_writer.add_ssm_inner_size(self.d_inner)
     6658 + self.gguf_writer.add_ssm_inner_size(self.find_hparam(["mamba_d_ssm"]))
6659 6659   self.gguf_writer.add_ssm_head_dim(d_head := self.find_hparam(["d_head"]))
6660 6660   self.gguf_writer.add_ssm_time_step_rank(self.find_hparam(["n_heads"]))
6661 6661

src/llama-arch.cpp

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1736,7 +1736,6 @@ static const std::map<llm_tensor, llm_tensor_info> LLM_TENSOR_INFOS = {
1736 1736   {LLM_TENSOR_CLS, {LLM_TENSOR_LAYER_OUTPUT, GGML_OP_MUL_MAT}},
1737 1737   {LLM_TENSOR_CLS_OUT, {LLM_TENSOR_LAYER_OUTPUT, GGML_OP_MUL_MAT}},
1738 1738   {LLM_TENSOR_OUTPUT_NORM, {LLM_TENSOR_LAYER_OUTPUT, GGML_OP_MUL}},
1739      - {LLM_TENSOR_FINAL_NORM, {LLM_TENSOR_LAYER_OUTPUT, GGML_OP_MUL}},
1740 1739   {LLM_TENSOR_DEC_OUTPUT_NORM, {LLM_TENSOR_LAYER_OUTPUT, GGML_OP_MUL}},
1741 1740   {LLM_TENSOR_ENC_OUTPUT_NORM, {LLM_TENSOR_LAYER_OUTPUT, GGML_OP_MUL}},
1742 1741   {LLM_TENSOR_ROPE_FREQS, {LLM_TENSOR_LAYER_REPEATING, GGML_OP_ROPE}},

src/llama-arch.h

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -390,7 +390,6 @@ enum llm_tensor {
390 390   LLM_TENSOR_POS_NET_ATTN_K,
391 391   LLM_TENSOR_POS_NET_ATTN_V,
392 392   LLM_TENSOR_POS_NET_ATTN_OUT,
393     - LLM_TENSOR_FINAL_NORM,
394 393   };
395 394
396 395   enum llm_tensor_layer {

0 commit comments

Comments
 (0)