From 369110e6bfe6cceb8e2ffee2883c8fdd0bb5723d Mon Sep 17 00:00:00 2001
From: Ettore Di Giacinto
Date: Tue, 26 Nov 2024 14:51:37 +0100
Subject: [PATCH] chore(model): add rwkv-6-world-7b to the gallery (#4270)

Signed-off-by: Ettore Di Giacinto
---
# Reviewer notes (free-text region between the "---" separator and the diff).
#
# What this patch does:
#   * gallery/index.yaml: inserts one new entry, anchored as &rwkv, directly
#     after the document-start marker and ahead of the existing &qwen25coder
#     entry. The entry's `url` points at gallery/rwkv.yaml@master, its
#     `overrides` set parameters.model to rwkv-6-world-7b-Q4_K_M.gguf, and
#     `files` lists that GGUF with its sha256 and a huggingface:// URI.
#   * gallery/rwkv.yaml: new file (mode 100644) named "rwkv". Its
#     `config_file` literal block carries sampling parameters (top_k,
#     temperature, max_tokens, top_p), context_size, the User/System/Assistant
#     role prefixes, a single stopword, and the chat/completion templates.
#
# NOTE(review): leading whitespace inside the hunks was reconstructed from the
#   YAML structure; in particular `context_size` is placed at the top level of
#   config_file and the stopwords sequence is flush with its key -- verify
#   both against commit 369110e6 before applying.
# NOTE(review): max_tokens and context_size are both 4098; if 4096 was
#   intended, confirm with the author -- left unchanged here.
# NOTE(review): the description says "We are at RWKV-7" although this entry
#   is the RWKV-6 model; presumably copied from upstream text -- confirm.
 gallery/index.yaml | 23 +++++++++++++++++++++++
 gallery/rwkv.yaml  | 23 +++++++++++++++++++++++
 2 files changed, 46 insertions(+)
 create mode 100644 gallery/rwkv.yaml

diff --git a/gallery/index.yaml b/gallery/index.yaml
index 4f95cf4e..bdd952c8 100644
--- a/gallery/index.yaml
+++ b/gallery/index.yaml
@@ -1,4 +1,27 @@
 ---
+- &rwkv
+  url: "github:mudler/LocalAI/gallery/rwkv.yaml@master"
+  name: "rwkv-6-world-7b"
+  license: apache-2.0
+  urls:
+    - https://huggingface.co/RWKV/rwkv-6-world-7b
+    - https://huggingface.co/bartowski/rwkv-6-world-7b-GGUF
+  tags:
+    - llm
+    - rwkv
+    - cpu
+    - gpu
+    - rnn
+  description: |
+    RWKV (pronounced RwaKuv) is an RNN with GPT-level LLM performance, and can also be directly trained like a GPT transformer (parallelizable). We are at RWKV-7.
+    So it's combining the best of RNN and transformer - great performance, fast inference, fast training, saves VRAM, "infinite" ctxlen, and free text embedding. Moreover it's 100% attention-free, and a Linux Foundation AI project. 
+  overrides:
+    parameters:
+      model: rwkv-6-world-7b-Q4_K_M.gguf
+  files:
+    - filename: rwkv-6-world-7b-Q4_K_M.gguf
+      sha256: f74574186fa4584f405e92198605680db6ad00fd77974ffa14bf02073bb90273
+      uri: huggingface://bartowski/rwkv-6-world-7b-GGUF/rwkv-6-world-7b-Q4_K_M.gguf
 - &qwen25coder
   name: "qwen2.5-coder-14b"
   url: "github:mudler/LocalAI/gallery/chatml.yaml@master"
diff --git a/gallery/rwkv.yaml b/gallery/rwkv.yaml
new file mode 100644
index 00000000..41dfcfad
--- /dev/null
+++ b/gallery/rwkv.yaml
@@ -0,0 +1,23 @@
+---
+name: "rwkv"
+
+config_file: |
+  parameters:
+    top_k: 80
+    temperature: 0.9
+    max_tokens: 4098
+    top_p: 0.8
+  context_size: 4098
+
+  roles:
+    user: "User: "
+    system: "System: "
+    assistant: "Assistant: "
+
+  stopwords:
+  - 'Assistant:'
+
+  template:
+    chat: "{{.Input}}\nAssistant: "
+    completion: |
+      {{.Input}}