@@ -121,7 +121,7 @@ static inline __m256 __avx_rearranged_f32cx8_load(ggml_fp16_t *x, __m128i arrang
121121
122122#if  defined(__AVX2__ ) ||  defined(__AVX512F__ )
123123#if  defined(__AVX512F__ )
124- // add int16_t pairwise and return as int vector 
124+ // add int16_t pairwise and return as a 512-bit int vector
125125static  inline  __m512i  sum_i16_pairs_int_32x16 (const  __m512i  x ) {
126126    const  __m512i  ones  =  _mm512_set1_epi16 (1 );
127127    return  _mm512_madd_epi16 (ones , x );
@@ -138,7 +138,7 @@ static inline __m512i mul_sum_us8_pairs_int32x16(const __m512i ax, const __m512i
138138#endif 
139139}
140140
141- // multiply int8_t, add results pairwise twice and return as int vector 
141+ // multiply int8_t, add results pairwise twice and return as a 512-bit int vector
142142static  inline  __m512i  mul_sum_i8_pairs_int32x16 (const  __m512i  x , const  __m512i  y ) {
143143    const  __m512i  zero  =  _mm512_setzero_si512 ();
144144    // Get absolute values of x vectors 
@@ -150,6 +150,7 @@ static inline __m512i mul_sum_i8_pairs_int32x16(const __m512i x, const __m512i y
150150}
151151#endif 
152152
153+ // add int16_t pairwise and return as a 256-bit int vector
153154static  inline  __m256i  sum_i16_pairs_int32x8 (const  __m256i  x ) {
154155    const  __m256i  ones  =  _mm256_set1_epi16 (1 );
155156    return  _mm256_madd_epi16 (ones , x );
@@ -167,7 +168,7 @@ static inline __m256i mul_sum_us8_pairs_int32x8(const __m256i ax, const __m256i
167168}
168169
169170// Integer variant of the function defined in ggml-quants.c 
170- // multiply int8_t, add results pairwise twice and return as int vector 
171+ // multiply int8_t, add results pairwise twice and return as a 256-bit int vector
171172static  inline  __m256i  mul_sum_i8_pairs_int32x8 (const  __m256i  x , const  __m256i  y ) {
172173#if  __AVXVNNIINT8__ 
173174    const  __m256i  zero  =  _mm256_setzero_si256 ();
0 commit comments