Change multimodal projector type to BF16 and F32

countzero · countzero · commit 0808979a2bde · 2025-11-05T12:15:12.000+01:00
diff --git a/quantize_weights_for_llama.cpp.ps1 b/quantize_weights_for_llama.cpp.ps1
@@ -52,32 +52,36 @@ ForEach ($repositoryName in $repositoryDirectories) {
         $unquantizedModelPath = $unquantizedModelPathFromSource
     }
 
-    ForEach ($type in $quantizationTypes) {
+    # For each model we compute a multimodal projector model to
+    # enable vision capabilities: one in BF16 format for current
+    # hardware and one in F32 format as a fallback for older hardware.
+    ForEach ($multimodalProjectorType in @('BF16', 'F32')) {
 
-        $quantizedModelPath = Join-Path -Path $targetDirectoryPath -ChildPath "${repositoryName}.${type}.gguf"
+        $multimodalProjectorPath = Join-Path -Path $targetDirectoryPath -ChildPath "${repositoryName}.mmproj.${multimodalProjectorType}.gguf"
 
-        if (!(Test-Path -Path $quantizedModelPath) -and !(Test-Path -Path $unquantizedModelPath)) {
+        if (!(Test-Path -Path $multimodalProjectorPath)) {
 
-            Write-Host "Converting ${sourceDirectoryPath} to ${unquantizedModelPath}..." -ForegroundColor "DarkYellow"
+            Write-Host "Creating multimodal projector model from ${unquantizedModelPath} to ${multimodalProjectorPath}..." -ForegroundColor "DarkYellow"
 
             Invoke-Expression "python ${llamaCppDirectory}\convert_hf_to_gguf.py ``
-                --outfile '${unquantizedModelPath}' ``
-                '${sourceDirectoryPath}'"
+                --outfile '${multimodalProjectorPath}' ``
+                --outtype '${multimodalProjectorType}'.ToLower() ``
+                '${sourceDirectoryPath}' ``
+                --mmproj"
         }
+    }
 
-        $multimodalProjectorPath = Join-Path -Path $targetDirectoryPath -ChildPath "${repositoryName}.mmproj.F16.gguf"
+    ForEach ($type in $quantizationTypes) {
 
-        # We are computing a multimodal projector model in F16
-        # format for each model to enable vision capabilities.
-        if (!(Test-Path -Path $multimodalProjectorPath)) {
+        $quantizedModelPath = Join-Path -Path $targetDirectoryPath -ChildPath "${repositoryName}.${type}.gguf"
 
-            Write-Host "Creating multimodal projector model from ${unquantizedModelPath} to ${multimodalProjectorPath}..." -ForegroundColor "DarkYellow"
+        if (!(Test-Path -Path $quantizedModelPath) -and !(Test-Path -Path $unquantizedModelPath)) {
+
+            Write-Host "Converting ${sourceDirectoryPath} to ${unquantizedModelPath}..." -ForegroundColor "DarkYellow"
 
             Invoke-Expression "python ${llamaCppDirectory}\convert_hf_to_gguf.py ``
-                --outfile '${multimodalProjectorPath}' ``
-                --outtype 'f16' ``
-                '${sourceDirectoryPath}' ``
-                --mmproj"
+                --outfile '${unquantizedModelPath}' ``
+                '${sourceDirectoryPath}'"
         }
 
         # We are computing an importance matrix to enhance the quality of the models.