Commit 01c04c1

Merge branch 'ggml-org:master' into lovedheart-vulkan-mxfp4-optimization
2 parents: ef32c83 + baa9255

7 files changed: 125 additions, 99 deletions


.devops/cuda.Dockerfile

Lines changed: 1 addition & 0 deletions

@@ -60,6 +60,7 @@ RUN apt-get update \
     git \
     python3 \
     python3-pip \
+    && pip install --upgrade pip setuptools wheel \
     && pip install --break-system-packages -r requirements.txt \
     && apt autoremove -y \
     && apt clean -y \

README.md

Lines changed: 1 addition & 0 deletions

@@ -17,6 +17,7 @@ LLM inference in C/C++

 ## Hot topics

+- **[guide : running gpt-oss with llama.cpp](https://github.com/ggml-org/llama.cpp/discussions/15396)**
 - **[[FEEDBACK] Better packaging for llama.cpp to support downstream consumers 🤗](https://github.com/ggml-org/llama.cpp/discussions/15313)**
 - Support for the `gpt-oss` model with native MXFP4 format has been added | [PR](https://github.com/ggml-org/llama.cpp/pull/15091) | [Collaboration with NVIDIA](https://blogs.nvidia.com/blog/rtx-ai-garage-openai-oss) | [Comment](https://github.com/ggml-org/llama.cpp/discussions/15095)
 - Hot PRs: [All](https://github.com/ggml-org/llama.cpp/pulls?q=is%3Apr+label%3Ahot+) | [Open](https://github.com/ggml-org/llama.cpp/pulls?q=is%3Apr+label%3Ahot+is%3Aopen)

ggml/src/ggml-quants.c

Lines changed: 5 additions & 5 deletions

@@ -566,7 +566,7 @@ static float make_q3_quants(int n, int nmax, const float * GGML_RESTRICT x, int8
         for (int i = 0; i < n; ++i) {
             L[i] += nmax;
         }
-        return sumlx / suml2;
+        return suml2 > 0.0f ? sumlx / suml2 : 0.0f;
     }
     for (int i = 0; i < n; ++i) {
         int l = nearest_int(iscale * x[i]);

@@ -901,7 +901,7 @@ static float make_qp_quants(int n, int nmax, const float * GGML_RESTRICT x, uint
     for (int i = 0; i < n; ++i) {
         max = MAX(max, x[i]);
     }
-    if (!max) { // all zero
+    if (max < GROUP_MAX_EPS) { // all zero
         for (int i = 0; i < n; ++i) { L[i] = 0; }
         return 0.f;
     }

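The `if (!max)` → `if (max < GROUP_MAX_EPS)` change replaces an exact-zero test with an epsilon test: `!max` is true only when the group maximum is exactly 0.0f, so a vanishingly small but nonzero maximum would slip past the early-out and feed a near-zero value into the scale search below. A minimal sketch of the difference; the GROUP_MAX_EPS value here is an assumed stand-in, not copied from ggml:

#include <stdio.h>

#define GROUP_MAX_EPS 1e-15f /* assumed illustrative value, not the ggml constant */

int main(void) {
    float max = 1e-30f; /* tiny but nonzero group maximum */
    printf("!max caught it?          %d\n", !max);                /* 0: slips through */
    printf("epsilon test caught it?  %d\n", max < GROUP_MAX_EPS); /* 1: early-out taken */
    return 0;
}
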
@@ -966,7 +966,7 @@ static float make_qp_quants(int n, int nmax, const float * GGML_RESTRICT x, uint
             break;
         }
     }
-    return sumlx/suml2;
+    return suml2 > 0.0f ? sumlx / suml2 : 0.0f;
 }

 static void quantize_row_q2_K_impl(const float * GGML_RESTRICT x, block_q2_K * GGML_RESTRICT y, int k, const float * GGML_RESTRICT quant_weights) {

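Both `return` changes in this file guard the same weighted-least-squares scale computation: if every quantized level `L[i]` comes out zero, `suml2` is zero and the unguarded `sumlx / suml2` evaluates to NaN (0/0), which then propagates into the block scale. A self-contained sketch of the guarded pattern, not the actual ggml routines:

#include <stdio.h>

/* Least-squares fit of a scale d so that d * L[i] approximates x[i].
 * With an all-zero L, suml2 == 0 and the unguarded division yields NaN;
 * the guard falls back to a scale of 0 instead. */
static float fit_scale(int n, const float *x, const int *L) {
    float sumlx = 0.0f, suml2 = 0.0f;
    for (int i = 0; i < n; ++i) {
        sumlx += x[i] * L[i];
        suml2 += (float)(L[i] * L[i]);
    }
    return suml2 > 0.0f ? sumlx / suml2 : 0.0f;
}

int main(void) {
    const float x[4]     = {0.1f, -0.2f, 0.0f, 0.05f};
    const int   zeros[4] = {0, 0, 0, 0}; /* degenerate: every level quantized to 0 */
    const int   L[4]     = {1, -2, 0, 1};
    printf("degenerate block: %f\n", fit_scale(4, x, zeros)); /* 0.000000, not NaN */
    printf("normal block:     %f\n", fit_scale(4, x, L));     /* ~0.091667 */
    return 0;
}
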
@@ -4266,7 +4266,7 @@ static void quantize_row_iq1_s_impl(const float * GGML_RESTRICT x, void * GGML_R
             sumw[j+1] = sumw[j] + weight[i];
         }
     }
-    float best_score = -FLT_MIN, scale = max;
+    float best_score = -FLT_MAX, scale = max;
     int besti1 = -1, besti2 = -1, best_shift = 0;
     for (int i1 = 0; i1 <= block_size; ++i1) {
         for (int i2 = i1; i2 <= block_size; ++i2) {

@@ -4442,7 +4442,7 @@ static void quantize_row_iq1_m_impl(const float * GGML_RESTRICT x, void * GGML_R
         idx[2*j] = j;
     }
     qsort(pairs, block_size, 2*sizeof(float), iq1_sort_helper);
-    float best_score = -FLT_MIN, scale = max;
+    float best_score = -FLT_MAX, scale = max;
     int besti1 = -1, besti2 = -1, best_k = -1;
     // 0: +, +
     // 1: +, -

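The `-FLT_MIN` → `-FLT_MAX` changes fix a sentinel bug: FLT_MIN is the smallest positive normalized float (about 1.2e-38), so -FLT_MIN is a tiny negative number just below zero, not the most negative float. A best-score search seeded with -FLT_MIN can never accept a candidate whose score is an ordinary negative number. A quick demonstration:

#include <float.h>
#include <stdio.h>

int main(void) {
    printf("FLT_MIN  = %g  (smallest positive normal float)\n", FLT_MIN);
    printf("-FLT_MAX = %g  (most negative finite float)\n", -FLT_MAX);

    float candidate = -0.75f; /* a valid, ordinary negative score */
    printf("candidate > -FLT_MIN ? %d  (wrongly rejected)\n",   candidate > -FLT_MIN);
    printf("candidate > -FLT_MAX ? %d  (correctly accepted)\n", candidate > -FLT_MAX);
    return 0;
}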

ggml/src/ggml-vulkan/vulkan-shaders/vulkan-shaders-gen.cpp

Lines changed: 2 additions & 1 deletion

@@ -223,7 +223,8 @@ void string_to_spv_func(const std::string& _name, const std::string& in_fname, c
     std::string target_env = (name.find("_cm2") != std::string::npos) ? "--target-env=vulkan1.3" : "--target-env=vulkan1.2";

     // disable spirv-opt for coopmat shaders for https://github.com/ggerganov/llama.cpp/issues/10734
-    std::string opt_level = coopmat ? "" : "-O";
+    // disable spirv-opt for bf16 shaders for https://github.com/ggml-org/llama.cpp/issues/15344
+    std::string opt_level = (coopmat || name.find("bf16") != std::string::npos) ? "" : "-O";

 #ifdef _WIN32
     std::vector<std::string> cmd = {GLSLC, "-fshader-stage=compute", target_env, opt_level, "\"" + in_path + "\"", "-o", "\"" + out_fname + "\""};
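
The generator already compiled coopmat shaders without spirv-opt; this change extends the same workaround to any shader whose name contains "bf16", by substring-matching the name before the `-O` flag is added to the glslc command line. A minimal C sketch of that selection logic; the shader names below are illustrative, not taken from the generator:

#include <stdio.h>
#include <string.h>

/* Returns the optimization flag for glslc: an empty string disables
 * spirv-opt for coopmat shaders and for any shader named "*bf16*". */
static const char *opt_level(const char *name, int coopmat) {
    return (coopmat || strstr(name, "bf16") != NULL) ? "" : "-O";
}

int main(void) {
    printf("mul_mm_f16   -> '%s'\n", opt_level("mul_mm_f16", 0));     /* "-O": optimized */
    printf("mul_mm_bf16  -> '%s'\n", opt_level("mul_mm_bf16", 0));    /* "":   unoptimized */
    printf("coopmat path -> '%s'\n", opt_level("mul_mm_f16_cm2", 1)); /* "":   unoptimized */
    return 0;
}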
