chore(model gallery): add qwen_qwq-32b (#4952)

Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
2025-05-29 05:24:15 +00:00 · 2025-03-06 10:28:03 +01:00 · 2025-03-06 10:28:03 +01:00 · 957dcfb6a9
commit 957dcfb6a9
parent 67f7bffd18
1 changed files with 14 additions and 0 deletions
--- a/gallery/index.yaml
+++ b/gallery/index.yaml
@ -4374,6 +4374,20 @@
    - filename: Azura-Qwen2.5-32B.i1-Q4_K_M.gguf
      sha256: a3ec93f192dc4ce062fd176d6615d4da34af81d909b89c372678b779a46b8d3b
      uri: huggingface://mradermacher/Azura-Qwen2.5-32B-i1-GGUF/Azura-Qwen2.5-32B.i1-Q4_K_M.gguf
+- !!merge <<: *qwen25
+  name: "qwen_qwq-32b"
+  urls:
+    - https://huggingface.co/Qwen/QwQ-32B
+    - https://huggingface.co/bartowski/Qwen_QwQ-32B-GGUF
+  description: |
+    QwQ is the reasoning model of the Qwen series. Compared with conventional instruction-tuned models, QwQ, which is capable of thinking and reasoning, can achieve significantly enhanced performance in downstream tasks, especially hard problems. QwQ-32B is the medium-sized reasoning model, which is capable of achieving competitive performance against state-of-the-art reasoning models, e.g., DeepSeek-R1, o1-mini.
+  overrides:
+    parameters:
+      model: Qwen_QwQ-32B-Q4_K_M.gguf
+  files:
+    - filename: Qwen_QwQ-32B-Q4_K_M.gguf
+      sha256: 87cc1894a68008856cde6ff24bfb9b99488a0d18c2e0a2b1ddeabd43cd0498e0
+      uri: huggingface://bartowski/Qwen_QwQ-32B-GGUF/Qwen_QwQ-32B-Q4_K_M.gguf
 - &llama31
  url: "github:mudler/LocalAI/gallery/llama3.1-instruct.yaml@master" ## LLama3.1
  icon: https://avatars.githubusercontent.com/u/153379578