From bd9c3195159a575ebf124528f55f9f7a14f043ba Mon Sep 17 00:00:00 2001 From: Milot Mirdita Date: Sat, 11 Jan 2025 15:24:17 +0900 Subject: [PATCH] ggml doesn't use SSE4.2; specify only up to SSE4.1 --- ggml/src/ggml-cpu/CMakeLists.txt | 8 ++++---- ggml/src/ggml-cpu/cpu-feats-x86.cpp | 4 ++-- 2 files changed, 6 insertions(+), 6 deletions(-) diff --git a/ggml/src/ggml-cpu/CMakeLists.txt b/ggml/src/ggml-cpu/CMakeLists.txt index 6b3641c42..b8d1bc06d 100644 --- a/ggml/src/ggml-cpu/CMakeLists.txt +++ b/ggml/src/ggml-cpu/CMakeLists.txt @@ -211,8 +211,8 @@ function(ggml_add_cpu_backend_variant_impl tag_name) list(APPEND ARCH_FLAGS /arch:AVX) list(APPEND ARCH_DEFINITIONS GGML_AVX) else () - list(APPEND ARCH_FLAGS /arch:SSE4.2) - list(APPEND ARCH_DEFINITIONS GGML_SSE42) + list(APPEND ARCH_FLAGS /arch:SSE4.1) + list(APPEND ARCH_DEFINITIONS GGML_SSE41) endif() if (GGML_AVX_VNNI) list(APPEND ARCH_DEFINITIONS __AVXVNNI__ GGML_AVX_VNNI) @@ -221,8 +221,8 @@ function(ggml_add_cpu_backend_variant_impl tag_name) if (GGML_NATIVE) list(APPEND ARCH_FLAGS -march=native) else () - list(APPEND ARCH_FLAGS -msse4.2) - list(APPEND ARCH_DEFINITIONS GGML_SSE42) + list(APPEND ARCH_FLAGS -msse2 -msse3 -mssse3 -msse4.1) + list(APPEND ARCH_DEFINITIONS GGML_SSE41) if (GGML_F16C) list(APPEND ARCH_FLAGS -mf16c) list(APPEND ARCH_DEFINITIONS GGML_F16C) diff --git a/ggml/src/ggml-cpu/cpu-feats-x86.cpp b/ggml/src/ggml-cpu/cpu-feats-x86.cpp index e8133d411..3d3bc088e 100644 --- a/ggml/src/ggml-cpu/cpu-feats-x86.cpp +++ b/ggml/src/ggml-cpu/cpu-feats-x86.cpp @@ -274,8 +274,8 @@ static int ggml_backend_cpu_x86_score() { if (!is.F16C()) { return 0; } score += 1<<1; #endif -#ifdef GGML_SSE42 - if (!is.SSE42()) { return 0; } +#ifdef GGML_SSE41 + if (!is.SSE41()) { return 0; } score += 1<<2; #endif #ifdef GGML_AVX