From bbf30d416df2ff283bd30291e5eb2b676005b469 Mon Sep 17 00:00:00 2001 From: Bas Hulsken Date: Mon, 17 Feb 2025 09:32:21 +0100 Subject: [PATCH] fix: change initialization order of llama-cpp-avx512 to go before avx2 variant (#4837) Changed the initialization order of the avx512 version of llama.cpp; it is now tried before avx2. Signed-off-by: Bas Hulsken --- pkg/model/initializers.go | 14 +++++++------- 1 file changed, 7 insertions(+), 7 deletions(-) diff --git a/pkg/model/initializers.go b/pkg/model/initializers.go index 8cda7fec..1a51eb2a 100644 --- a/pkg/model/initializers.go +++ b/pkg/model/initializers.go @@ -262,18 +262,18 @@ func selectGRPCProcessByHostCapabilities(backend, assetDir string, f16 bool) str } // IF we find any optimized binary, we use that - if xsysinfo.HasCPUCaps(cpuid.AVX2) { - p := backendPath(assetDir, LLamaCPPAVX2) - if _, err := os.Stat(p); err == nil { - log.Info().Msgf("[%s] attempting to load with AVX2 variant", backend) - selectedProcess = p - } - } else if xsysinfo.HasCPUCaps(cpuid.AVX512F) { + if xsysinfo.HasCPUCaps(cpuid.AVX512F) { p := backendPath(assetDir, LLamaCPPAVX512) if _, err := os.Stat(p); err == nil { log.Info().Msgf("[%s] attempting to load with AVX512 variant", backend) selectedProcess = p } + } else if xsysinfo.HasCPUCaps(cpuid.AVX2) { + p := backendPath(assetDir, LLamaCPPAVX2) + if _, err := os.Stat(p); err == nil { + log.Info().Msgf("[%s] attempting to load with AVX2 variant", backend) + selectedProcess = p + } } else if xsysinfo.HasCPUCaps(cpuid.AVX) { p := backendPath(assetDir, LLamaCPPAVX) if _, err := os.Stat(p); err == nil {