Skip to content

Commit c6cfe31

Browse files
committed
add GGML_AVX_VNNI to enable avx-vnni, fix checks
1 parent 6d78e0f commit c6cfe31

File tree

5 files changed

+6
-6
lines changed

5 files changed

+6
-6
lines changed

CMakeLists.txt

Lines changed: 0 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -96,10 +96,6 @@ if (NOT DEFINED GGML_LLAMAFILE)
9696
set(GGML_LLAMAFILE_DEFAULT ON)
9797
endif()
9898

99-
if (NOT DEFINED GGML_AMX)
100-
set(GGML_AMX ON)
101-
endif()
102-
10399
if (NOT DEFINED GGML_CUDA_GRAPHS)
104100
set(GGML_CUDA_GRAPHS_DEFAULT ON)
105101
endif()

ggml/CMakeLists.txt

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -96,6 +96,7 @@ option(GGML_CPU_HBM "ggml: use memkind for CPU HBM" OFF)
9696
option(GGML_CPU_AARCH64 "ggml: use runtime weight conversion of Q4_0 to Q4_X_X" ON)
9797

9898
option(GGML_AVX "ggml: enable AVX" ${INS_ENB})
99+
option(GGML_AVX_VNNI "ggml: enable AVX-VNNI" OFF)
99100
option(GGML_AVX2 "ggml: enable AVX2" ${INS_ENB})
100101
option(GGML_AVX512 "ggml: enable AVX512" OFF)
101102
option(GGML_AVX512_VBMI "ggml: enable AVX512-VBMI" OFF)

ggml/src/ggml-cpu/CMakeLists.txt

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -233,6 +233,9 @@ elseif (CMAKE_OSX_ARCHITECTURES STREQUAL "x86_64" OR CMAKE_GENERATOR_PLATFORM_LW
233233
if (GGML_AVX2)
234234
list(APPEND ARCH_FLAGS -mavx2)
235235
endif()
236+
if (GGML_AVX_VNNI)
237+
list(APPEND ARCH_FLAGS -mavxvnni)
238+
endif()
236239
if (GGML_AVX512)
237240
list(APPEND ARCH_FLAGS -mavx512f)
238241
list(APPEND ARCH_FLAGS -mavx512dq)

ggml/src/ggml-cpu/cpu-feats-x86.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -281,8 +281,8 @@ static int ggml_backend_cpu_x86_score() {
281281
score += ggml_cpu_has_f16c () * 1<<1;
282282
score += ggml_cpu_has_ssse3 () * 1<<2;
283283
score += ggml_cpu_has_sse3 () * 1<<3;
284-
score += ggml_cpu_has_avx () * 1<<5;
285284
score += ggml_cpu_has_avx_vnni () * 1<<4;
285+
score += ggml_cpu_has_avx () * 1<<5;
286286
score += ggml_cpu_has_avx2 () * 1<<6;
287287
score += ggml_cpu_has_avx512 () * 1<<7;
288288
// score += ggml_cpu_has_avx512_vbmi() * 1<<8; // not used

ggml/src/ggml-cpu/ggml-cpu-aarch64.c

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -128,7 +128,7 @@ static inline __m512i sum_i16_pairs_int_32x16(const __m512i x) {
128128
}
129129

130130
static inline __m512i mul_sum_us8_pairs_int32x16(const __m512i ax, const __m512i sy) {
131-
#if defined(__AVXVNNI__) || (defined(__AVX512VNNI__) && defined(__AVX512VL__))
131+
#if defined(__AVX512VNNI__)
132132
const __m512i zero = _mm512_setzero_si512();
133133
return _mm512_dpbusd_epi32(zero, ax, sy);
134134
#else

0 commit comments

Comments
 (0)