mirror of
https://github.com/mudler/LocalAI.git
synced 2025-01-03 11:24:10 +00:00
62 lines
1.7 KiB
Go
62 lines
1.7 KiB
Go
|
package gpt4all
|
||
|
|
||
|
// This is a wrapper to statisfy the GRPC service interface
|
||
|
// It is meant to be used by the main executable that is the server for the specific backend type (falcon, gpt3, etc)
|
||
|
import (
|
||
|
"fmt"
|
||
|
|
||
|
pb "github.com/go-skynet/LocalAI/pkg/grpc/proto"
|
||
|
gpt4all "github.com/nomic-ai/gpt4all/gpt4all-bindings/golang"
|
||
|
)
|
||
|
|
||
|
type LLM struct {
|
||
|
gpt4all *gpt4all.Model
|
||
|
}
|
||
|
|
||
|
func (llm *LLM) Load(opts *pb.ModelOptions) error {
|
||
|
model, err := gpt4all.New(opts.Model,
|
||
|
gpt4all.SetThreads(int(opts.Threads)),
|
||
|
gpt4all.SetLibrarySearchPath(opts.LibrarySearchPath))
|
||
|
llm.gpt4all = model
|
||
|
return err
|
||
|
}
|
||
|
|
||
|
func buildPredictOptions(opts *pb.PredictOptions) []gpt4all.PredictOption {
|
||
|
predictOptions := []gpt4all.PredictOption{
|
||
|
gpt4all.SetTemperature(float64(opts.Temperature)),
|
||
|
gpt4all.SetTopP(float64(opts.TopP)),
|
||
|
gpt4all.SetTopK(int(opts.TopK)),
|
||
|
gpt4all.SetTokens(int(opts.Tokens)),
|
||
|
}
|
||
|
|
||
|
if opts.Batch != 0 {
|
||
|
predictOptions = append(predictOptions, gpt4all.SetBatch(int(opts.Batch)))
|
||
|
}
|
||
|
return predictOptions
|
||
|
}
|
||
|
|
||
|
func (llm *LLM) Predict(opts *pb.PredictOptions) (string, error) {
|
||
|
return llm.gpt4all.Predict(opts.Prompt, buildPredictOptions(opts)...)
|
||
|
}
|
||
|
|
||
|
func (llm *LLM) PredictStream(opts *pb.PredictOptions, results chan string) {
|
||
|
predictOptions := buildPredictOptions(opts)
|
||
|
|
||
|
go func() {
|
||
|
llm.gpt4all.SetTokenCallback(func(token string) bool {
|
||
|
results <- token
|
||
|
return true
|
||
|
})
|
||
|
_, err := llm.gpt4all.Predict(opts.Prompt, predictOptions...)
|
||
|
if err != nil {
|
||
|
fmt.Println("err: ", err)
|
||
|
}
|
||
|
llm.gpt4all.SetTokenCallback(nil)
|
||
|
close(results)
|
||
|
}()
|
||
|
}
|
||
|
|
||
|
func (llm *LLM) Embeddings(opts *pb.PredictOptions) ([]float32, error) {
|
||
|
return []float32{}, fmt.Errorf("not implemented")
|
||
|
}
|