@@ -286,7 +286,7 @@ template <> struct reorder_vec_dot_q_sycl<GGML_TYPE_Q4_0> {
286286
287287 __dpct_inline__ float operator ()(const void * __restrict__ vbq, const std::pair<int , int > ibx_offset,
288288 const std::pair<int , int > d_offset, const int8_t * q8_1_quant_ptr,
289- const sycl::half2 * q8_1_ds, const int & iqs, int /* nblocks */ ) {
289+ const sycl::half2 * q8_1_ds, const int & iqs) {
290290 const uint8_t * bq4_0 = static_cast <const uint8_t *>(vbq) + ibx_offset.first ;
291291 const ggml_half d = *(reinterpret_cast <const ggml_half *>(static_cast <const uint8_t *>(vbq) + d_offset.first ));
292292 int v[q4_0_traits::vdr_mmvq];
@@ -349,14 +349,13 @@ template <> struct reorder_vec_dot_q_sycl<GGML_TYPE_Q4_K> {
349349
350350 __dpct_inline__ float operator ()(const void * __restrict__ vbq, const std::pair<int , int > ibx_offset,
351351 const std::pair<int , int > d_offset, const int8_t * q8_1_quant_ptr,
352- const sycl::half2 * q8_1_ds, const int & iqs, int nblocks ) {
352+ const sycl::half2 * q8_1_ds, const int & iqs) {
353353 const int ib = ibx_offset.first / (QK_K / 2 );
354354
355355 const uint8_t * base = static_cast <const uint8_t *>(vbq);
356356 const uint8_t * qs = base + ibx_offset.first ;
357- const int total_qs_bytes = nblocks * (QK_K / 2 );
358- const uint8_t * scs = base + total_qs_bytes + ib * K_SCALE_SIZE;
359- const ggml_half2 * dms = reinterpret_cast <const ggml_half2 *>(base + d_offset.first );
357+ const uint8_t * scs = base + d_offset.first + ib * K_SCALE_SIZE;
358+ const ggml_half2 * dms = reinterpret_cast <const ggml_half2 *>(base + d_offset.second );
360359
361360 const int bq8_offset = QR4_K * ((iqs / 2 ) / (QI8_1 / 2 ));
362361 const int * q4 = (const int *) (qs + 16 * bq8_offset + 4 * ((iqs / 2 ) % 4 ));
@@ -427,7 +426,7 @@ template <> struct reorder_vec_dot_q_sycl<GGML_TYPE_Q6_K> {
427426
428427 float operator ()(const void * __restrict__ vbq, const std::pair<int , int > ibx_offset,
429428 const std::pair<int , int > d_offset, const int8_t * q8_1_quant_ptr, const sycl::half2 * q8_1_ds,
430- const int & iqs, int /* nblocks */ ) {
429+ const int & iqs) {
431430 const int ib = ibx_offset.first / (QK_K / 2 );
432431
433432 const uint8_t * base = static_cast <const uint8_t *>(vbq);
0 commit comments