Skip to content

Commit b61de2b

Browse files
authored
convert : allow quantizing lora again (ggml-org#17453)
1 parent b8372ee commit b61de2b

File tree

2 files changed

+2
-2
lines changed

2 files changed

+2
-2
lines changed

convert_hf_to_gguf.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -565,7 +565,7 @@ def prepare_tensors(self):
                 gguf.MODEL_TENSOR.ALTUP_PREDICT_COEF,
             )
         )
-        or not new_name.endswith(".weight")
+        or new_name[-7:] not in (".weight", ".lora_a", ".lora_b")
     ):
         data_qtype = gguf.GGMLQuantizationType.F32

convert_lora_to_gguf.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -242,7 +242,7 @@ def parse_args() -> argparse.Namespace:
         help="path to write to; default: based on input. {ftype} will be replaced by the outtype.",
     )
     parser.add_argument(
-        "--outtype", type=str, choices=["f32", "f16", "bf16", "q8_0", "auto"], default="f16",
+        "--outtype", type=str, choices=["f32", "f16", "bf16", "q8_0", "auto"], default="f32",
         help="output format - use f32 for float32, f16 for float16, bf16 for bfloat16, q8_0 for Q8_0, auto for the highest-fidelity 16-bit float type depending on the first loaded tensor type",
     )
     parser.add_argument(

0 commit comments

Comments
 (0)