# Embedding model definition.
# The model is exposed under the name "text-embedding-ada-002" while the
# weights referenced under `parameters.model` are all-MiniLM-L6-v2 (q4_0).
backend: bert-embeddings
embeddings: true
f16: true

# NOTE(review): confirm that the bert-embeddings backend actually honors
# f16 / gpu_layers / mmap; if it does not, these keys are inert — TODO verify.
gpu_layers: 90
mmap: true
# Name clients put in the "model" field of a request (see the usage example).
name: text-embedding-ada-002

parameters:
  model: huggingface://mudler/all-MiniLM-L6-v2/ggml-model-q4_0.bin

# Help text kept as a literal block scalar so the multi-line curl example
# retains its line breaks.
usage: |
    You can test this model with curl like this:

    curl http://localhost:8080/embeddings -X POST -H "Content-Type: application/json" -d '{
      "input": "Your text string goes here",
      "model": "text-embedding-ada-002"
    }'