2 files changed +5
-5
lines changed Original file line number Diff line number Diff line change @@ -1346,8 +1346,8 @@ enum ggml_type ggml_ftype_to_ggml_type(enum ggml_ftype ftype) {
13461346 case GGML_FTYPE_MOSTLY_Q5_1 : wtype = GGML_TYPE_Q5_1 ; break ;
13471347 case GGML_FTYPE_MOSTLY_Q8_0 : wtype = GGML_TYPE_Q8_0 ; break ;
13481348 case GGML_FTYPE_MOSTLY_MXFP4 : wtype = GGML_TYPE_MXFP4 ; break ;
1349- case GGML_FTYPE_MOSTLY_MXFP6_E3M2 : wtype = GGML_TYPE_MXFP6_E3M2 ; break ;
1350- case GGML_FTYPE_MOSTLY_MXFP6_E2M3 : wtype = GGML_TYPE_MXFP6_E2M3 ; break ;
1349+ case GGML_FTYPE_MOSTLY_MXFP6_E3M2 : wtype = GGML_TYPE_MXFP6_E3M2 ; break ;
1350+ case GGML_FTYPE_MOSTLY_MXFP6_E2M3 : wtype = GGML_TYPE_MXFP6_E2M3 ; break ;
13511351 case GGML_FTYPE_MOSTLY_Q2_K : wtype = GGML_TYPE_Q2_K ; break ;
13521352 case GGML_FTYPE_MOSTLY_Q3_K : wtype = GGML_TYPE_Q3_K ; break ;
13531353 case GGML_FTYPE_MOSTLY_Q4_K : wtype = GGML_TYPE_Q4_K ; break ;
Original file line number Diff line number Diff line change @@ -3009,9 +3009,9 @@ class LlamaFileType(IntEnum):
30093009 # MOSTLY_Q4_0_8_8 = 35 # removed from gguf files, use Q4_0 and runtime repack
30103010 MOSTLY_TQ1_0 = 36 # except 1d tensors
30113011 MOSTLY_TQ2_0 = 37 # except 1d tensors
3012- LLAMA_FTYPE_MOSTLY_MXFP4_MOE = 38 # except 1d tensors
3013- LLAMA_FTYPE_MOSTLY_MXFP6_E3M2_MOE = 39 # except 1d tensors
3014- LLAMA_FTYPE_MOSTLY_MXFP6_E2M3_MOE = 40 # except 1d tensors
3012+ MOSTLY_MXFP4_MOE = 38 # except 1d tensors
3013+ MOSTLY_MXFP6_E3M2_MOE = 39 # except 1d tensors
3014+ MOSTLY_MXFP6_E2M3_MOE = 40 # except 1d tensors
30153015
30163016 GUESSED = 1024 # not specified in the model file
30173017
You can’t perform that action at this time.
0 commit comments