From f505d7ab3f4dabf927413d42691adb37bd46f131 Mon Sep 17 00:00:00 2001
From: Ettore Di Giacinto
Date: Sat, 20 Jul 2024 16:17:34 +0200
Subject: [PATCH] models(gallery): add archangel_sft_pythia2-8b (#2933)

Signed-off-by: Ettore Di Giacinto
---
 gallery/index.yaml  | 27 +++++++++++++++++++++++++++
 gallery/tuluv2.yaml | 43 +++++++++++++++++++++++++++++++++++++++++++
 2 files changed, 70 insertions(+)
 create mode 100644 gallery/tuluv2.yaml

diff --git a/gallery/index.yaml b/gallery/index.yaml
index 63664070..2ef3d46b 100644
--- a/gallery/index.yaml
+++ b/gallery/index.yaml
@@ -24,6 +24,33 @@
     - filename: DeepSeek-Coder-V2-Lite-Instruct-Q4_K_M.gguf
       sha256: 50ec78036433265965ed1afd0667c00c71c12aa70bcf383be462cb8e159db6c0
       uri: huggingface://LoneStriker/DeepSeek-Coder-V2-Lite-Instruct-GGUF/DeepSeek-Coder-V2-Lite-Instruct-Q4_K_M.gguf
+- name: "archangel_sft_pythia2-8b"
+  url: "github:mudler/LocalAI/gallery/tuluv2.yaml@master"
+  icon: https://gist.github.com/assets/29318529/fe2d8391-dbd1-4b7e-9dc4-7cb97e55bc06
+  license: apache-2.0
+  urls:
+    - https://huggingface.co/ContextualAI/archangel_sft_pythia2-8b
+    - https://huggingface.co/RichardErkhov/ContextualAI_-_archangel_sft_pythia2-8b-gguf
+    - https://github.com/ContextualAI/HALOs
+  description: |
+    datasets:
+    - stanfordnlp/SHP
+    - Anthropic/hh-rlhf
+    - OpenAssistant/oasst1
+
+    This repo contains the model checkpoints for:
+    - model family pythia2-8b
+    - optimized with the loss SFT
+    - aligned using the SHP, Anthropic HH and Open Assistant datasets.
+
+    Please refer to our [code repository](https://github.com/ContextualAI/HALOs) or [blog](https://contextual.ai/better-cheaper-faster-llm-alignment-with-kto/) which contains instructions for training your own HALOs and links to our model cards.
+  overrides:
+    parameters:
+      model: archangel_sft_pythia2-8b.Q4_K_M.gguf
+  files:
+    - filename: archangel_sft_pythia2-8b.Q4_K_M.gguf
+      sha256: a47782c55ef2b39b19644213720a599d9849511a73c9ebb0c1de749383c0a0f8
+      uri: huggingface://RichardErkhov/ContextualAI_-_archangel_sft_pythia2-8b-gguf/archangel_sft_pythia2-8b.Q4_K_M.gguf
 - &qwen2
   ## Start QWEN2
   url: "github:mudler/LocalAI/gallery/chatml.yaml@master"
diff --git a/gallery/tuluv2.yaml b/gallery/tuluv2.yaml
new file mode 100644
index 00000000..ca2785a2
--- /dev/null
+++ b/gallery/tuluv2.yaml
@@ -0,0 +1,43 @@
+---
+name: "tuluv2"
+
+config_file: |
+  mmap: true
+  template:
+    chat_message: |
+      <|{{ .RoleName }}|>
+      {{ if .FunctionCall -}}
+      Function call:
+      {{ else if eq .RoleName "tool" -}}
+      Function response:
+      {{ end -}}
+      {{ if .Content -}}
+      {{.Content }}
+      {{ end -}}
+      {{ if .FunctionCall -}}
+      {{toJson .FunctionCall}}
+      {{ end -}}
+    function: |
+      <|{{ .RoleName }}|>
+      {{ if .FunctionCall -}}
+      Function call:
+      {{ else if eq .RoleName "tool" -}}
+      Function response:
+      {{ end -}}
+      {{ if .Content -}}
+      {{.Content }}
+      {{ end -}}
+      {{ if .FunctionCall -}}
+      {{toJson .FunctionCall}}
+      {{ end -}}
+    chat: |
+      {{.Input -}}
+      <|assistant|>
+    completion: |
+      {{.Input}}
+  context_size: 4096
+  f16: true
+  stopwords:
+    - '<|im_end|>'
+    - ''  # NOTE(review): empty stop string; possibly a token lost in transit. Confirm the intended value.
+    - '<|endoftext|>'