mirror of
https://github.com/mudler/LocalAI.git
synced 2025-01-13 00:10:14 +00:00
72 lines
1.7 KiB
Go
72 lines
1.7 KiB
Go
package rwkv
|
|
|
|
// This is a wrapper to satisfy the GRPC service interface
|
|
// It is meant to be used by the main executable that is the server for the specific backend type (falcon, gpt3, etc)
|
|
import (
|
|
"fmt"
|
|
"path/filepath"
|
|
|
|
"github.com/donomii/go-rwkv.cpp"
|
|
"github.com/go-skynet/LocalAI/pkg/grpc/base"
|
|
pb "github.com/go-skynet/LocalAI/pkg/grpc/proto"
|
|
)
|
|
|
|
// tokenizerSuffix is appended to the model file's base name in Load to build
// the second path handed to rwkv.LoadFiles (presumably the tokenizer
// definition that sits next to the model file).
const tokenizerSuffix = ".tokenizer.json"
|
|
|
|
type LLM struct {
|
|
base.Base
|
|
|
|
rwkv *rwkv.RwkvState
|
|
}
|
|
|
|
func (llm *LLM) Load(opts *pb.ModelOptions) error {
|
|
modelPath := filepath.Dir(opts.ModelFile)
|
|
modelFile := filepath.Base(opts.ModelFile)
|
|
model := rwkv.LoadFiles(opts.ModelFile, filepath.Join(modelPath, modelFile+tokenizerSuffix), uint32(opts.GetThreads()))
|
|
|
|
if model == nil {
|
|
return fmt.Errorf("could not load model")
|
|
}
|
|
llm.rwkv = model
|
|
return nil
|
|
}
|
|
|
|
func (llm *LLM) Predict(opts *pb.PredictOptions) (string, error) {
|
|
|
|
stopWord := "\n"
|
|
if len(opts.StopPrompts) > 0 {
|
|
stopWord = opts.StopPrompts[0]
|
|
}
|
|
|
|
if err := llm.rwkv.ProcessInput(opts.Prompt); err != nil {
|
|
return "", err
|
|
}
|
|
|
|
response := llm.rwkv.GenerateResponse(int(opts.Tokens), stopWord, float32(opts.Temperature), float32(opts.TopP), nil)
|
|
|
|
return response, nil
|
|
}
|
|
|
|
func (llm *LLM) PredictStream(opts *pb.PredictOptions, results chan string) error {
|
|
go func() {
|
|
|
|
stopWord := "\n"
|
|
if len(opts.StopPrompts) > 0 {
|
|
stopWord = opts.StopPrompts[0]
|
|
}
|
|
|
|
if err := llm.rwkv.ProcessInput(opts.Prompt); err != nil {
|
|
fmt.Println("Error processing input: ", err)
|
|
return
|
|
}
|
|
|
|
llm.rwkv.GenerateResponse(int(opts.Tokens), stopWord, float32(opts.Temperature), float32(opts.TopP), func(s string) bool {
|
|
results <- s
|
|
return true
|
|
})
|
|
close(results)
|
|
}()
|
|
|
|
return nil
|
|
}
|