Skip to content

Commit b4a4455

Browse files
committed
Sync llama.cpp API 20250806
1 parent 7f6315b commit b4a4455

File tree

1 file changed

+4
-0
lines changed

1 file changed

+4
-0
lines changed

llama_cpp/llama_cpp.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -262,6 +262,7 @@
262262
# LLAMA_VOCAB_PRE_TYPE_SEED_CODER = 35,
263263
# LLAMA_VOCAB_PRE_TYPE_HUNYUAN = 36,
264264
# LLAMA_VOCAB_PRE_TYPE_KIMI_K2 = 37,
265+
# LLAMA_VOCAB_PRE_TYPE_HUNYUAN_DENSE = 38,
265266
# };
266267
LLAMA_VOCAB_PRE_TYPE_DEFAULT = 0
267268
LLAMA_VOCAB_PRE_TYPE_LLAMA3 = 1
@@ -301,6 +302,7 @@
301302
LLAMA_VOCAB_PRE_TYPE_SEED_CODER = 35
302303
LLAMA_VOCAB_PRE_TYPE_HUNYUAN = 36
303304
LLAMA_VOCAB_PRE_TYPE_KIMI_K2 = 37
305+
LLAMA_VOCAB_PRE_TYPE_HUNYUAN_DENSE = 38
304306

305307

306308
# // note: these values should be synchronized with ggml_rope
@@ -403,6 +405,7 @@
403405
# //LLAMA_FTYPE_MOSTLY_Q4_0_8_8 = 35, // removed from gguf files, use Q4_0 and runtime repack
404406
# LLAMA_FTYPE_MOSTLY_TQ1_0 = 36, // except 1d tensors
405407
# LLAMA_FTYPE_MOSTLY_TQ2_0 = 37, // except 1d tensors
408+
# LLAMA_FTYPE_MOSTLY_MXFP4_MOE = 38, // except 1d tensors
406409
#
407410
# LLAMA_FTYPE_GUESSED = 1024, // not specified in the model file
408411
# };
@@ -441,6 +444,7 @@
441444
# LLAMA_FTYPE_MOSTLY_Q4_0_8_8 = 35
442445
LLAMA_FTYPE_MOSTLY_TQ1_0 = 36
443446
LLAMA_FTYPE_MOSTLY_TQ2_0 = 37
447+
LLAMA_FTYPE_MOSTLY_MXFP4_MOE = 38
444448
LLAMA_FTYPE_GUESSED = 1024
445449

446450
# enum llama_rope_scaling_type {

0 commit comments

Comments (0)