Skip to content

Commit 6ef6aa1

Browse files
change set_vocab() flow
1 parent 29c1532 commit 6ef6aa1

File tree

1 file changed

+11
-5
lines changed

1 file changed

+11
-5
lines changed

convert_hf_to_gguf.py

Lines changed: 11 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -5566,11 +5566,17 @@ class DeepseekV2Model(TextModel):
5566 5566
model_arch = gguf.MODEL_ARCH.DEEPSEEK2
5567 5567

5568 5568
def set_vocab(self):
5569-
if(self.hparams["vocab_size"]==163840): # Kimi-K2 model
5570-
from transformers import AutoTokenizer
5571-
tokenizer = AutoTokenizer.from_pretrained(self.dir_model, trust_remote_code=True)
5572-
tokpre = self.get_vocab_base_pre(tokenizer)
5569+
try:
5570+
self._set_vocab_gpt2()
5571+
return
5572+
except:
5573+
pass
5573 5574

5575+
from transformers import AutoTokenizer
5576+
tokenizer = AutoTokenizer.from_pretrained(self.dir_model, trust_remote_code=True)
5577+
tokpre = self.get_vocab_base_pre(tokenizer)
5578+
5579+
if tokpre == "kimi-k2":
5574 5580
# Build merges list using the approach similar to HunYuanMoE
5575 5581
merges = []
5576 5582
vocab = {}
@@ -5611,7 +5617,7 @@ def set_vocab(self):
5611 5617
special_vocab = gguf.SpecialVocab(self.dir_model, load_merges=False)
5612 5618
special_vocab.add_to_gguf(self.gguf_writer)
5613 5619
else:
5614-
self._set_vocab_gpt2()
5620+
raise NotImplementedError(f"{self.dir_model} is not supported yet!")
5615 5621

5616 5622
def set_gguf_parameters(self):
5617 5623

0 commit comments

Comments
 (0)