mirror of
https://github.com/mudler/LocalAI.git
synced 2025-01-11 23:42:48 +00:00
54 lines
1.3 KiB
Go
54 lines
1.3 KiB
Go
package transformers
|
|
|
|
// This is a wrapper to satisfy the gRPC service interface.
|
|
// It is meant to be used by the main executable that is the server for the specific backend type (falcon, gpt3, etc)
|
|
import (
|
|
"fmt"
|
|
|
|
"github.com/go-skynet/LocalAI/pkg/grpc/base"
|
|
pb "github.com/go-skynet/LocalAI/pkg/grpc/proto"
|
|
"github.com/rs/zerolog/log"
|
|
|
|
transformers "github.com/go-skynet/go-ggml-transformers.cpp"
|
|
)
|
|
|
|
type GPT2 struct {
|
|
base.Base
|
|
|
|
gpt2 *transformers.GPT2
|
|
}
|
|
|
|
func (llm *GPT2) Load(opts *pb.ModelOptions) error {
|
|
if llm.Base.State != pb.StatusResponse_UNINITIALIZED {
|
|
log.Warn().Msgf("gpt2 backend loading %s while already in state %s!", opts.Model, llm.Base.State.String())
|
|
}
|
|
|
|
llm.Base.Lock()
|
|
defer llm.Base.Unlock()
|
|
model, err := transformers.New(opts.ModelFile)
|
|
llm.gpt2 = model
|
|
return err
|
|
}
|
|
|
|
func (llm *GPT2) Predict(opts *pb.PredictOptions) (string, error) {
|
|
llm.Base.Lock()
|
|
defer llm.Base.Unlock()
|
|
return llm.gpt2.Predict(opts.Prompt, buildPredictOptions(opts)...)
|
|
}
|
|
|
|
// fallback to Predict
|
|
func (llm *GPT2) PredictStream(opts *pb.PredictOptions, results chan string) error {
|
|
llm.Base.Lock()
|
|
go func() {
|
|
res, err := llm.gpt2.Predict(opts.Prompt, buildPredictOptions(opts)...)
|
|
|
|
if err != nil {
|
|
fmt.Println("err: ", err)
|
|
}
|
|
results <- res
|
|
close(results)
|
|
llm.Base.Unlock()
|
|
}()
|
|
return nil
|
|
}
|