We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
mul_mv_mxfp4_f32_flat
1 parent 36676c0 · commit 7184682 · Copy full SHA for 7184682
ggml/src/ggml-opencl/kernels/mul_mv_mxfp4_f32_flat.cl
@@ -108,7 +108,9 @@ kernel void kernel_mul_mv_mxfp4_f32_flat(
108
uint i12 = im % ne12;
109
uint i13 = im / ne12;
110
111
- ulong offset_src0 = first_row * nb;
+ uint offset_src0 = first_row*nb01 + (i12/r2)*nb02 + (i13/r3)*nb03;
112
+ // 17 = sizeof(block_mxfp4)
113
+ offset_src0 /= 17;
114
#ifdef SRC0Q_IMG
115
ulong offset_q = offset_src0;
116
#else
0 commit comments