mirror of
https://github.com/mudler/LocalAI.git
synced 2025-01-11 07:23:09 +00:00
ad0e30bca5
* refactor: move backends into the backends directory Signed-off-by: Ettore Di Giacinto <mudler@localai.io> * refactor: move main close to implementation for every backend Signed-off-by: Ettore Di Giacinto <mudler@localai.io> --------- Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
43 lines
1.0 KiB
Go
43 lines
1.0 KiB
Go
package transformers
|
|
|
|
// This is a wrapper to satisfy the gRPC service interface
|
|
// It is meant to be used by the main executable that is the server for the specific backend type (falcon, gpt3, etc)
|
|
import (
|
|
"fmt"
|
|
|
|
"github.com/go-skynet/LocalAI/pkg/grpc/base"
|
|
pb "github.com/go-skynet/LocalAI/pkg/grpc/proto"
|
|
|
|
transformers "github.com/go-skynet/go-ggml-transformers.cpp"
|
|
)
|
|
|
|
type GPTNeoX struct {
|
|
base.SingleThread
|
|
|
|
gptneox *transformers.GPTNeoX
|
|
}
|
|
|
|
func (llm *GPTNeoX) Load(opts *pb.ModelOptions) error {
|
|
model, err := transformers.NewGPTNeoX(opts.ModelFile)
|
|
llm.gptneox = model
|
|
return err
|
|
}
|
|
|
|
func (llm *GPTNeoX) Predict(opts *pb.PredictOptions) (string, error) {
|
|
return llm.gptneox.Predict(opts.Prompt, buildPredictOptions(opts)...)
|
|
}
|
|
|
|
// fallback to Predict
|
|
func (llm *GPTNeoX) PredictStream(opts *pb.PredictOptions, results chan string) error {
|
|
go func() {
|
|
res, err := llm.gptneox.Predict(opts.Prompt, buildPredictOptions(opts)...)
|
|
|
|
if err != nil {
|
|
fmt.Println("err: ", err)
|
|
}
|
|
results <- res
|
|
close(results)
|
|
}()
|
|
return nil
|
|
}
|