5 files changed: +6 −6 lines changed
lines changed Original file line number Diff line number Diff line change @@ -96,10 +96,6 @@ if (NOT DEFINED GGML_LLAMAFILE)
9696 set (GGML_LLAMAFILE_DEFAULT ON )
9797endif ()
9898
99- if (NOT DEFINED GGML_AMX)
100- set (GGML_AMX ON )
101- endif ()
102-
10399if (NOT DEFINED GGML_CUDA_GRAPHS)
104100 set (GGML_CUDA_GRAPHS_DEFAULT ON )
105101endif ()
Original file line number Diff line number Diff line change @@ -96,6 +96,7 @@ option(GGML_CPU_HBM "ggml: use memkind for CPU HBM" OFF)
9696option (GGML_CPU_AARCH64 "ggml: use runtime weight conversion of Q4_0 to Q4_X_X" ON )
9797
9898option (GGML_AVX "ggml: enable AVX" ${INS_ENB} )
99+ option (GGML_AVX_VNNI "ggml: enable AVX-VNNI" OFF )
99100option (GGML_AVX2 "ggml: enable AVX2" ${INS_ENB} )
100101option (GGML_AVX512 "ggml: enable AVX512" OFF )
101102option (GGML_AVX512_VBMI "ggml: enable AVX512-VBMI" OFF )
Original file line number Diff line number Diff line change @@ -233,6 +233,9 @@ elseif (CMAKE_OSX_ARCHITECTURES STREQUAL "x86_64" OR CMAKE_GENERATOR_PLATFORM_LW
233233 if (GGML_AVX2)
234234 list (APPEND ARCH_FLAGS -mavx2)
235235 endif ()
236+ if (GGML_AVX_VNNI)
237+ list (APPEND ARCH_FLAGS -mavxvnni)
238+ endif ()
236239 if (GGML_AVX512)
237240 list (APPEND ARCH_FLAGS -mavx512f)
238241 list (APPEND ARCH_FLAGS -mavx512dq)
Original file line number Diff line number Diff line change @@ -281,8 +281,8 @@ static int ggml_backend_cpu_x86_score() {
281281 score += ggml_cpu_has_f16c () * 1 <<1 ;
282282 score += ggml_cpu_has_ssse3 () * 1 <<2 ;
283283 score += ggml_cpu_has_sse3 () * 1 <<3 ;
284- score += ggml_cpu_has_avx () * 1 <<5 ;
285284 score += ggml_cpu_has_avx_vnni () * 1 <<4 ;
285+ score += ggml_cpu_has_avx () * 1 <<5 ;
286286 score += ggml_cpu_has_avx2 () * 1 <<6 ;
287287 score += ggml_cpu_has_avx512 () * 1 <<7 ;
288288 // score += ggml_cpu_has_avx512_vbmi() * 1<<8; // not used
Original file line number Diff line number Diff line change @@ -128,7 +128,7 @@ static inline __m512i sum_i16_pairs_int_32x16(const __m512i x) {
128128}
129129
130130static inline __m512i mul_sum_us8_pairs_int32x16 (const __m512i ax , const __m512i sy ) {
131- #if defined(__AVXVNNI__ ) || (defined( __AVX512VNNI__ ) && defined( __AVX512VL__ ) )
131+ #if defined(__AVX512VNNI__ )
132132 const __m512i zero = _mm512_setzero_si512 ();
133133 return _mm512_dpbusd_epi32 (zero , ax , sy );
134134#else
You can’t perform that action at this time.
0 commit comments