cann : add Ascend NPU support (#2336)

* enable Ascend NPU in src/whisper.cpp
* sync test-backend-ops with llama.cpp
Mengqing Cao
2024-08-09 20:21:56 +08:00
committed by GitHub
parent 4b7de08bfd
commit 81c999fe0a
3 changed files with 128 additions and 21 deletions


@@ -29,6 +29,10 @@
 #include "openvino/whisper-openvino-encoder.h"
 #endif
 
+#ifdef GGML_USE_CANN
+#include "ggml-cann.h"
+#endif
+
 #include "ggml.h"
 #include "ggml-alloc.h"
 #include "ggml-backend.h"
@@ -1283,6 +1287,16 @@ static ggml_backend_t whisper_backend_init_gpu(const whisper_context_params & params) {
     }
 #endif
 
+#ifdef GGML_USE_CANN
+    if (params.use_gpu) {
+        WHISPER_LOG_INFO("%s: using CANN backend\n", __func__);
+        result = ggml_backend_cann_init(params.gpu_device);
+        if (!result) {
+            WHISPER_LOG_ERROR("%s: ggml_backend_cann_init() failed\n", __func__);
+        }
+    }
+#endif
+
     return result;
 }
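
For context: this branch runs only when none of the earlier backends (CUDA, Metal, SYCL, Vulkan) was compiled in and taken first, and on failure it logs an error and leaves the result null so the caller can fall back to the CPU backend. A hedged usage sketch of how use_gpu and gpu_device reach this function through the public whisper.h API (the model filename is a placeholder):

```cpp
// Sketch: select NPU device 0 via the public context params.
#include <cstdio>
#include "whisper.h"

int main() {
    whisper_context_params cparams = whisper_context_default_params();
    cparams.use_gpu    = true; // required for the CANN branch above to be taken
    cparams.gpu_device = 0;    // forwarded to ggml_backend_cann_init()

    whisper_context * ctx = whisper_init_from_file_with_params("ggml-base.en.bin", cparams);
    if (ctx == nullptr) {
        std::fprintf(stderr, "failed to initialize whisper context\n");
        return 1;
    }
    whisper_free(ctx);
    return 0;
}
```
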
@@ -1335,6 +1349,10 @@ static ggml_backend_buffer_type_t whisper_default_buffer_type(const whisper_context_params & params) {
     result || (result = ggml_backend_vk_buffer_type(params.gpu_device));
 #endif
 
+#ifdef GGML_USE_CANN
+    result || (result = ggml_backend_cann_buffer_type(params.gpu_device));
+#endif
+
     result || (result = ggml_backend_cpu_buffer_type());
 
     return result;
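
The result || (result = ...) chain reads oddly at first: the assignment is evaluated only while every preceding backend has left result null, so the first compiled-in backend that offers a buffer type wins, with the CPU buffer type as the final fallback. A self-contained sketch of the same short-circuit idiom, with hypothetical pickers standing in for the ggml calls:

```cpp
// Sketch of the first-non-null selection idiom used above.
// pick_accel()/pick_cpu() are hypothetical stand-ins for the ggml calls.
#include <cstdio>

using buft_t = const char *; // stand-in for ggml_backend_buffer_type_t

static buft_t pick_accel() { return nullptr; } // accelerator absent
static buft_t pick_cpu()   { return "cpu"; }   // always-available fallback

int main() {
    buft_t result = nullptr;
    result || (result = pick_accel()); // evaluated: accel absent, result stays null
    result || (result = pick_cpu());   // evaluated: first non-null candidate wins
    std::printf("selected: %s\n", result);
    return 0;
}
```
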
@@ -4337,8 +4355,8 @@ const char * whisper_print_system_info(void) {
     s += "VSX = " + std::to_string(ggml_cpu_has_vsx()) + " | ";
     s += "CUDA = " + std::to_string(ggml_cpu_has_cuda()) + " | ";
     s += "COREML = " + std::to_string(whisper_has_coreml()) + " | ";
-    s += "OPENVINO = " + std::to_string(whisper_has_openvino());
+    s += "OPENVINO = " + std::to_string(whisper_has_openvino()) + " | ";
+    s += "CANN = " + std::to_string(ggml_cpu_has_cann());
 
     return s.c_str();
 }
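
For reference, a minimal way to see the new entry (a sketch, assuming a program linked against whisper): on a CANN-enabled build the printed string ends with "CANN = 1".

```cpp
// Sketch: print the feature string, which now includes the CANN flag.
#include <cstdio>
#include "whisper.h"

int main() {
    std::printf("%s\n", whisper_print_system_info());
    return 0;
}
```
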