File tree: 1 file changed, +4 -1 lines changed
Columns: Original file line number | Diff line number | Diff line change
@@ -840,6 +840,9 @@ def get_vocab_base_pre(self, tokenizer) -> str:
840840 if chkhsh == "169bf0296a13c4d9b7672313f749eb36501d931022de052aad6e36f2bf34dd51" :
841841 # ref: https://huggingface.co/LiquidAI/LFM2-Tokenizer
842842 res = "lfm2"
843+ if chkhsh == "81212dc7cdb7e0c1074ca62c5aeab0d43c9f52b8a737be7b12a777c953027890" :
844+ # ref: https://huggingface.co/moonshotai/Kimi-K2-Base
845+ res = "kimi-k2"
843846
844847 if res is None :
845848 logger .warning ("\n " )
@@ -5566,7 +5569,7 @@ def set_vocab(self):
55665569 if (self .hparams ["vocab_size" ]== 163840 ): # Kimi-K2 model
55675570 from transformers import AutoTokenizer
55685571 tokenizer = AutoTokenizer .from_pretrained (self .dir_model , trust_remote_code = True )
5569- tokpre = "kimi-k2" # TODO: add identifier hash
5572+ tokpre = self . get_vocab_base_pre ( tokenizer )
55705573
55715574 # Build merges list using the approach similar to HunYuanMoE
55725575 merges = []
You can’t perform that action at this time.
0 commit comments