mirror of
https://github.com/mudler/LocalAI.git
synced 2024-12-18 20:27:57 +00:00
chore(model): add rwkv-6-world-7b to the gallery (#4270)
Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
This commit is contained in:
parent
2b62260b6d
commit
369110e6bf
@ -1,4 +1,27 @@
|
|||||||
---
|
---
|
||||||
|
- &rwkv
|
||||||
|
url: "github:mudler/LocalAI/gallery/rwkv.yaml@master"
|
||||||
|
name: "rwkv-6-world-7b"
|
||||||
|
license: apache-2.0
|
||||||
|
urls:
|
||||||
|
- https://huggingface.co/RWKV/rwkv-6-world-7b
|
||||||
|
- https://huggingface.co/bartowski/rwkv-6-world-7b-GGUF
|
||||||
|
tags:
|
||||||
|
- llm
|
||||||
|
- rwkv
|
||||||
|
- cpu
|
||||||
|
- gpu
|
||||||
|
- rnn
|
||||||
|
description: |
|
||||||
|
RWKV (pronounced RwaKuv) is an RNN with GPT-level LLM performance that can also be trained directly like a GPT transformer (parallelizable). The architecture is currently at RWKV-7.
|
||||||
|
It combines the best of RNNs and transformers: great performance, fast inference, fast training, low VRAM usage, "infinite" context length, and free text embedding. Moreover, it is 100% attention-free and a Linux Foundation AI project.
|
||||||
|
overrides:
|
||||||
|
parameters:
|
||||||
|
model: rwkv-6-world-7b-Q4_K_M.gguf
|
||||||
|
files:
|
||||||
|
- filename: rwkv-6-world-7b-Q4_K_M.gguf
|
||||||
|
sha256: f74574186fa4584f405e92198605680db6ad00fd77974ffa14bf02073bb90273
|
||||||
|
uri: huggingface://bartowski/rwkv-6-world-7b-GGUF/rwkv-6-world-7b-Q4_K_M.gguf
|
||||||
- &qwen25coder
|
- &qwen25coder
|
||||||
name: "qwen2.5-coder-14b"
|
name: "qwen2.5-coder-14b"
|
||||||
url: "github:mudler/LocalAI/gallery/chatml.yaml@master"
|
url: "github:mudler/LocalAI/gallery/chatml.yaml@master"
|
||||||
|
23
gallery/rwkv.yaml
Normal file
23
gallery/rwkv.yaml
Normal file
@ -0,0 +1,23 @@
|
|||||||
|
---
|
||||||
|
name: "rwkv"
|
||||||
|
|
||||||
|
config_file: |
|
||||||
|
parameters:
|
||||||
|
top_k: 80
|
||||||
|
temperature: 0.9
|
||||||
|
max_tokens: 4098
|
||||||
|
top_p: 0.8
|
||||||
|
context_size: 4098
|
||||||
|
|
||||||
|
roles:
|
||||||
|
user: "User: "
|
||||||
|
system: "System: "
|
||||||
|
assistant: "Assistant: "
|
||||||
|
|
||||||
|
stopwords:
|
||||||
|
- 'Assistant:'
|
||||||
|
|
||||||
|
template:
|
||||||
|
chat: "{{.Input}}\nAssistant: "
|
||||||
|
completion: |
|
||||||
|
{{.Input}}
|
Loading…
Reference in New Issue
Block a user