We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent c24b666 commit 834acb1Copy full SHA for 834acb1
ggml/src/ggml-opencl/kernels/mul_mat_f16_f32.cl
@@ -47,7 +47,7 @@ __kernel void mul_mat_f16_f32(
47
}
48
49
const int numTiles = (K + CPWK - 1) / CPWK;
50
-
+
51
const int load_row_a = lid % OPWM;
52
const int load_vec_k_a = lid / OPWM;
53
const int global_row_a = offsetM + load_row_a;
0 commit comments