Update llama.cpp api 20251031

JamePeng · JamePeng · commit ee6963e47a58 · 2025-10-31T04:40:05.000+08:00
diff --git a/llama_cpp/llama_cpp.py b/llama_cpp/llama_cpp.py
@@ -315,12 +315,14 @@
 #     LLAMA_ROPE_TYPE_NORM   = 0,
 #     LLAMA_ROPE_TYPE_NEOX   = GGML_ROPE_TYPE_NEOX,
 #     LLAMA_ROPE_TYPE_MROPE  = GGML_ROPE_TYPE_MROPE,
+#     LLAMA_ROPE_TYPE_IMROPE = GGML_ROPE_TYPE_IMROPE,
 #     LLAMA_ROPE_TYPE_VISION = GGML_ROPE_TYPE_VISION,
 # };
 LLAMA_ROPE_TYPE_NONE = -1
 LLAMA_ROPE_TYPE_NORM = 0
 LLAMA_ROPE_TYPE_NEOX = GGML_ROPE_TYPE_NEOX = 2
 LLAMA_ROPE_TYPE_MROPE = GGML_ROPE_TYPE_MROPE = 8
+LLAMA_ROPE_TYPE_IMROPE = GGML_ROPE_TYPE_IMROPE = 40
 LLAMA_ROPE_TYPE_VISION = GGML_ROPE_TYPE_VISION = 24
 
 
diff --git a/llama_cpp/mtmd_cpp.py b/llama_cpp/mtmd_cpp.py
@@ -398,12 +398,12 @@ def mtmd_input_chunk_get_id(chunk: mtmd_input_chunk_p) -> c_char_p:
     """
     ...
 
-# // number of temporal positions (always 1 for M-RoPE, n_tokens otherwise)
+# // number of temporal positions (equals to max(t,h,w) for M-RoPE; equals to n_tokens otherwise)
 # MTMD_API llama_pos                  mtmd_input_chunk_get_n_pos       (const mtmd_input_chunk * chunk);
 @ctypes_function_mtmd("mtmd_input_chunk_get_n_pos", [mtmd_input_chunk_p_ctypes], c_int32)
 def mtmd_input_chunk_get_n_pos(chunk: mtmd_input_chunk_p) -> c_int32:
     """
-    number of temporal positions (always 1 for M-RoPE, n_tokens otherwise)
+    number of temporal positions (equal to max(t,h,w) for M-RoPE; equal to n_tokens otherwise)
     """
     ...
 
@@ -457,11 +457,12 @@ def mtmd_image_tokens_get_ny(image_tokens: mtmd_image_tokens_p) -> c_size_t:
 def mtmd_image_tokens_get_id(image_tokens: mtmd_image_tokens_p) -> c_char_p:
     ...
 
-# // number of temporal positions (always 1 for M-RoPE, n_tokens otherwise)
+# // number of temporal positions (equals to max(t,h,w) for M-RoPE; equals to n_tokens otherwise)
 # MTMD_API llama_pos    mtmd_image_tokens_get_n_pos   (const mtmd_image_tokens * image_tokens); // TODO: deprecate
 @ctypes_function_mtmd(
     "mtmd_image_tokens_get_n_pos", [mtmd_image_tokens_p_ctypes], c_int32)
 def mtmd_image_tokens_get_n_pos(image_tokens: mtmd_image_tokens_p) -> c_int32:
+    """number of temporal positions (equal to max(t,h,w) for M-RoPE; equal to n_tokens otherwise)"""
     ...
 
 # // tokenize an input text prompt and a list of bitmaps (images/audio)