1 file changed: +3 -3 lines changed
Original file line number | Diff line number | Diff line change
@@ -104,7 +104,7 @@ __device__ void iqk_mul_mat_vec_q_kerne(
104104 }
105105
106106 if (threadIdx .x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx .x < nrows_dst)) {
107- dst[j*nrows_dst + row0 + threadIdx .x ] = bias ? tmp[j][threadIdx .x ] + bias[j*nrows_dst + row0 + threadIdx .x ] : tmp[j][threadIdx .x ];
107+ dst[j*nrows_dst + row0 + threadIdx .x ] = bias ? tmp[j][threadIdx .x ] + bias[row0 + threadIdx .x ] : tmp[j][threadIdx .x ];
108108 }
109109 }
110110}
@@ -211,8 +211,8 @@ __device__ void iqk_fused_mul_mat_vec_q_kernel(
211211 default : {
212212 constexpr float alpha = 1 .702f ;
213213 constexpr float limit = 7 .0f ;
214- g += bias_g[j*nrows_dst + row0 + threadIdx .x ];
215- u += bias_u[j*nrows_dst + row0 + threadIdx .x ];
214+ g += bias_g[row0 + threadIdx .x ];
215+ u += bias_u[row0 + threadIdx .x ];
216216 g = fminf (g, limit);
217217 u = fmaxf (fminf (u, limit), -limit);
218218 r = g / (1 .0f + expf (-g * alpha)) * (1 .0f + u);
You can’t perform that action at this time.
0 commit comments