Fix importance matrix requirement

countzero · countzero · commit 9ac4b7b1ee2f · 2024-02-29T12:42:28.000+01:00
diff --git a/quantize_weights_for_llama.cpp.ps1 b/quantize_weights_for_llama.cpp.ps1
@@ -81,9 +81,10 @@ ForEach ($repositoryName in $repositoryDirectories) {
             }
         }
 
-        # We do need to compute an importance matrix for some 2-bit quantized models:
+        # We need to compute an importance matrix for all i-quants and
+        # small k-quants to enhance the quality of the quantized models.
         # https://github.com/ggerganov/llama.cpp/tree/master/examples/imatrix
-        $requiresImportanceMatrix = "IQ2_XXS IQ2_XS Q2_K_S".Contains($type)
+        $requiresImportanceMatrix = $type.Contains("IQ") -or "Q2_K Q2_K_S".Contains($type)
 
         if ($requiresImportanceMatrix -and !(Test-Path -Path $importanceMatrixPath)) {
 

Original file line number	Diff line number	Diff line change
`@@ -81,9 +81,10 @@ ForEach ($repositoryName in $repositoryDirectories) {`
`81`	`81`	`}`
`82`	`82`	`}`
`83`	`83`
`84`		`- # We do need to compute an importance matrix for some 2-bit quantized models:`
	`84`	`+ # We need to compute an importance matrix for all i-quants and`
	`85`	`+ # small k-quants to enhance the quality of the quantized models.`
`85`	`86`	`# https://github.com/ggerganov/llama.cpp/tree/master/examples/imatrix`
`86`		`- $requiresImportanceMatrix = "IQ2_XXS IQ2_XS Q2_K_S".Contains($type)`
	`87`	`+ $requiresImportanceMatrix = $type.Contains("IQ") -or "Q2_K Q2_K_S".Contains($type)`
`87`	`88`
`88`	`89`	`if ($requiresImportanceMatrix -and !(Test-Path -Path $importanceMatrixPath)) {`
`89`	`90`