models(gallery): add openvino models (#2184)

Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
This commit is contained in:
Ettore Di Giacinto 2024-04-29 18:17:47 +02:00 committed by GitHub
parent ea13863221
commit baff5ff8c2
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
2 changed files with 57 additions and 1 deletions

View File

@ -778,7 +778,51 @@
- filename: "codellama-7b.Q4_0.gguf"
sha256: "33052f6dd41436db2f83bd48017b6fff8ce0184e15a8a227368b4230f1da97b5"
uri: "huggingface://TheBloke/CodeLlama-7B-GGUF/codellama-7b.Q4_0.gguf"
### START OpenVINO
- &openvino
  # Base OpenVINO gallery entry, reused by the entries that follow through
  # `<<: *openvino`. The merge is shallow: a key redefined by a derived entry
  # (for example `overrides`) replaces the value given here as a whole, and
  # every key that is not redefined (`license`, `tags`, ...) is inherited as-is.
  name: "openvino-llama-3-8b-instruct-ov-int8"
  url: "github:mudler/LocalAI/gallery/openvino.yaml@master"
  license: llama3
  urls:
    - https://huggingface.co/fakezeta/llama-3-8b-instruct-ov-int8
  tags:
    - llm
    - openvino
    - gpu
    - llama3
    - cpu
  overrides:
    parameters:
      model: fakezeta/llama-3-8b-instruct-ov-int8
    # Llama 3 end-of-turn / end-of-text markers.
    stopwords:
      - "<|eot_id|>"
      - "<|end_of_text|>"
- <<: *openvino
  name: "openvino-phi3"
  # Set explicitly: the shallow merge would otherwise inherit the anchor's
  # `license: llama3`, which does not apply to a Phi-3 model.
  license: mit
  urls:
    - https://huggingface.co/fakezeta/Phi-3-mini-128k-instruct-ov-int8
  # Redefined in full so the anchor's `llama3` tag is not inherited.
  tags:
    - llm
    - openvino
    - gpu
    - phi3
    - cpu
  # Replaces the anchor's `overrides` entirely (merge keys do not deep-merge).
  overrides:
    context_size: 131072
    parameters:
      model: fakezeta/Phi-3-mini-128k-instruct-ov-int8
    stopwords:
      - "<|end|>"
- <<: *openvino
  name: "openvino-starling-lm-7b-beta-openvino-int8"
  # Set explicitly: the shallow merge would otherwise inherit the anchor's
  # `license: llama3`, which does not apply to this model.
  # NOTE(review): apache-2.0 is taken from the upstream model card - confirm.
  license: apache-2.0
  urls:
    - https://huggingface.co/fakezeta/Starling-LM-7B-beta-openvino-int8
  # Redefined in full so the anchor's `llama3` tag is not inherited.
  # NOTE(review): `mistral` assumes the Mistral-7B base lineage - confirm.
  tags:
    - llm
    - openvino
    - gpu
    - mistral
    - cpu
  # Replaces the anchor's `overrides` entirely (merge keys do not deep-merge),
  # so no stopwords are set at this level.
  overrides:
    context_size: 8192
    parameters:
      model: fakezeta/Starling-LM-7B-beta-openvino-int8
- <<: *openvino
  name: "openvino-wizardlm2"
  # Set explicitly: the shallow merge would otherwise inherit the anchor's
  # `license: llama3`, which does not apply to this model.
  # NOTE(review): apache-2.0 is taken from the upstream model card - confirm.
  license: apache-2.0
  urls:
    - https://huggingface.co/fakezeta/Not-WizardLM-2-7B-ov-int8
  # Redefined in full so the anchor's `llama3` tag is not inherited.
  # NOTE(review): `mistral` assumes the Mistral-7B base lineage - confirm.
  tags:
    - llm
    - openvino
    - gpu
    - mistral
    - cpu
  # Replaces the anchor's `overrides` entirely (merge keys do not deep-merge),
  # so no stopwords are set at this level.
  overrides:
    context_size: 8192
    parameters:
      model: fakezeta/Not-WizardLM-2-7B-ov-int8
### START Embeddings
- &sentencentransformers
description: |

12
gallery/openvino.yaml Normal file
View File

@ -0,0 +1,12 @@
---
# Base model configuration shared by the OpenVINO gallery entries.
name: "openvino"
# `config_file` is a literal block scalar: everything indented below it is
# stored as one string, so comments must stay outside the block or they would
# become part of that string.
config_file: |
  backend: transformers
  context_size: 8192
  type: OVModelForCausalLM
  template:
    use_tokenizer_template: true
  stopwords:
  - "<|eot_id|>"
  - "<|end_of_text|>"