@@ -256,12 +256,14 @@ def byref(obj: CtypesCData, offset: Optional[int] = None) -> CtypesRef[CtypesCDa
 #     LLAMA_FTYPE_MOSTLY_IQ2_XXS       = 19, // except 1d tensors
 #     LLAMA_FTYPE_MOSTLY_IQ2_XS        = 20, // except 1d tensors
 #     LLAMA_FTYPE_MOSTLY_Q2_K_S        = 21, // except 1d tensors
-#     LLAMA_FTYPE_MOSTLY_Q3_K_XS       = 22, // except 1d tensors
+#     LLAMA_FTYPE_MOSTLY_IQ3_XS        = 22, // except 1d tensors
 #     LLAMA_FTYPE_MOSTLY_IQ3_XXS       = 23, // except 1d tensors
 #     LLAMA_FTYPE_MOSTLY_IQ1_S         = 24, // except 1d tensors
 #     LLAMA_FTYPE_MOSTLY_IQ4_NL        = 25, // except 1d tensors
 #     LLAMA_FTYPE_MOSTLY_IQ3_S         = 26, // except 1d tensors
 #     LLAMA_FTYPE_MOSTLY_IQ3_M         = 27, // except 1d tensors
+#     LLAMA_FTYPE_MOSTLY_IQ2_S         = 28, // except 1d tensors
+#     LLAMA_FTYPE_MOSTLY_IQ2_M         = 29, // except 1d tensors
 
 #     LLAMA_FTYPE_GUESSED = 1024, // not specified in the model file
 # };
@@ -285,12 +287,14 @@ def byref(obj: CtypesCData, offset: Optional[int] = None) -> CtypesRef[CtypesCDa
 LLAMA_FTYPE_MOSTLY_IQ2_XXS = 19
 LLAMA_FTYPE_MOSTLY_IQ2_XS = 20
 LLAMA_FTYPE_MOSTLY_Q2_K_S = 21
-LLAMA_FTYPE_MOSTLY_Q3_K_XS = 22
+LLAMA_FTYPE_MOSTLY_IQ3_XS = 22
 LLAMA_FTYPE_MOSTLY_IQ3_XXS = 23
 LLAMA_FTYPE_MOSTLY_IQ1_S = 24
 LLAMA_FTYPE_MOSTLY_IQ4_NL = 25
 LLAMA_FTYPE_MOSTLY_IQ3_S = 26
 LLAMA_FTYPE_MOSTLY_IQ3_M = 27
+LLAMA_FTYPE_MOSTLY_IQ2_S = 28
+LLAMA_FTYPE_MOSTLY_IQ2_M = 29
 LLAMA_FTYPE_GUESSED = 1024
 
 # enum llama_rope_scaling_type {
0 commit comments