Skip to content

Commit b023e53

Browse files
Updated with kimi-k2 get_vocab_base_pre hash
1 parent 4def063 commit b023e53

File tree

1 file changed

+4
-1
lines changed

1 file changed

+4
-1
lines changed

convert_hf_to_gguf.py

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -840,6 +840,9 @@ def get_vocab_base_pre(self, tokenizer) -> str:
840840
if chkhsh == "169bf0296a13c4d9b7672313f749eb36501d931022de052aad6e36f2bf34dd51":
841841
# ref: https://huggingface.co/LiquidAI/LFM2-Tokenizer
842842
res = "lfm2"
843+
if chkhsh == "81212dc7cdb7e0c1074ca62c5aeab0d43c9f52b8a737be7b12a777c953027890":
844+
# ref: https://huggingface.co/moonshotai/Kimi-K2-Base
845+
res = "kimi-k2"
843846

844847
if res is None:
845848
logger.warning("\n")
@@ -5566,7 +5569,7 @@ def set_vocab(self):
55665569
if(self.hparams["vocab_size"]==163840): # Kimi-K2 model
55675570
from transformers import AutoTokenizer
55685571
tokenizer = AutoTokenizer.from_pretrained(self.dir_model, trust_remote_code=True)
5569-
tokpre = "kimi-k2" # TODO: add identifier hash
5572+
tokpre = self.get_vocab_base_pre(tokenizer)
55705573

55715574
# Build merges list using the approach similar to HunYuanMoE
55725575
merges = []

0 commit comments

Comments (0)