@@ -256,12 +256,14 @@ def byref(obj: CtypesCData, offset: Optional[int] = None) -> CtypesRef[CtypesCDa
 # LLAMA_FTYPE_MOSTLY_IQ2_XXS = 19, // except 1d tensors
 # LLAMA_FTYPE_MOSTLY_IQ2_XS = 20, // except 1d tensors
 # LLAMA_FTYPE_MOSTLY_Q2_K_S = 21, // except 1d tensors
-# LLAMA_FTYPE_MOSTLY_Q3_K_XS = 22, // except 1d tensors
+# LLAMA_FTYPE_MOSTLY_IQ3_XS = 22, // except 1d tensors
 # LLAMA_FTYPE_MOSTLY_IQ3_XXS = 23, // except 1d tensors
 # LLAMA_FTYPE_MOSTLY_IQ1_S = 24, // except 1d tensors
 # LLAMA_FTYPE_MOSTLY_IQ4_NL = 25, // except 1d tensors
 # LLAMA_FTYPE_MOSTLY_IQ3_S = 26, // except 1d tensors
 # LLAMA_FTYPE_MOSTLY_IQ3_M = 27, // except 1d tensors
+# LLAMA_FTYPE_MOSTLY_IQ2_S = 28, // except 1d tensors
+# LLAMA_FTYPE_MOSTLY_IQ2_M = 29, // except 1d tensors
 
 # LLAMA_FTYPE_GUESSED = 1024, // not specified in the model file
 # };
@@ -285,12 +287,14 @@ def byref(obj: CtypesCData, offset: Optional[int] = None) -> CtypesRef[CtypesCDa
 LLAMA_FTYPE_MOSTLY_IQ2_XXS = 19
 LLAMA_FTYPE_MOSTLY_IQ2_XS = 20
 LLAMA_FTYPE_MOSTLY_Q2_K_S = 21
-LLAMA_FTYPE_MOSTLY_Q3_K_XS = 22
+LLAMA_FTYPE_MOSTLY_IQ3_XS = 22
 LLAMA_FTYPE_MOSTLY_IQ3_XXS = 23
 LLAMA_FTYPE_MOSTLY_IQ1_S = 24
 LLAMA_FTYPE_MOSTLY_IQ4_NL = 25
 LLAMA_FTYPE_MOSTLY_IQ3_S = 26
 LLAMA_FTYPE_MOSTLY_IQ3_M = 27
+LLAMA_FTYPE_MOSTLY_IQ2_S = 28
+LLAMA_FTYPE_MOSTLY_IQ2_M = 29
 LLAMA_FTYPE_GUESSED = 1024
 
 # enum llama_rope_scaling_type {
0 commit comments