Fix a logic flaw so that, when two or more quant types are specified via --tensor-type for the same tensor, the last matching entry in the list wins (previously the first match won)

EAddario · EAddario · commit 272a845578aa · 2025-07-07T21:09:27.000+01:00
diff --git a/src/llama-quant.cpp b/src/llama-quant.cpp
@@ -883,8 +883,7 @@ static void llama_model_quantize_impl(const std::string & fname_inp, const std::
                         if (std::regex pattern(tname); std::regex_search(tensor_name, pattern)) {
                             if  (qtype != new_type) {
                                 LLAMA_LOG_DEBUG("(overriding %s) ", ggml_type_name(new_type));
-                                new_type = qtype;
-                                break; // if two or more types are specified for the tensor, first match wins
+                                new_type = qtype; // if two or more types are specified for the same tensor, the last match wins
                             }
                         }
                     }

Original file line number	Diff line number	Diff line change
`@@ -883,8 +883,7 @@ static void llama_model_quantize_impl(const std::string & fname_inp, const std::`
`883`	`883`	`if (std::regex pattern(tname); std::regex_search(tensor_name, pattern)) {`
`884`	`884`	`if (qtype != new_type) {`
`885`	`885`	`LLAMA_LOG_DEBUG("(overriding %s) ", ggml_type_name(new_type));`
`886`		`- new_type = qtype;`
`887`		`- break; // if two or more types are specified for the tensor, first match wins`
	`886`	`+ new_type = qtype; // if two or more types are specified for the same tensor, the last match wins`
`888`	`887`	`}`
`889`	`888`	`}`
`890`	`889`	`}`