2023-07-15 01:19:43 +02:00
|
|
|
package grpc
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"fmt"
|
|
|
|
"io"
|
2023-08-19 01:49:33 +02:00
|
|
|
"sync"
|
2023-07-15 01:19:43 +02:00
|
|
|
"time"
|
|
|
|
|
2024-02-20 20:21:19 -05:00
|
|
|
"github.com/go-skynet/LocalAI/core/schema"
|
2023-07-15 01:19:43 +02:00
|
|
|
pb "github.com/go-skynet/LocalAI/pkg/grpc/proto"
|
|
|
|
"google.golang.org/grpc"
|
|
|
|
"google.golang.org/grpc/credentials/insecure"
|
|
|
|
)
|
|
|
|
|
|
|
|
type Client struct {
|
2023-11-16 22:20:16 +01:00
|
|
|
address string
|
|
|
|
busy bool
|
|
|
|
parallel bool
|
2023-08-19 01:49:33 +02:00
|
|
|
sync.Mutex
|
2023-11-16 22:20:16 +01:00
|
|
|
opMutex sync.Mutex
|
2023-11-26 18:36:23 +01:00
|
|
|
wd WatchDog
|
2023-07-15 01:19:43 +02:00
|
|
|
}
|
|
|
|
|
2023-11-26 18:36:23 +01:00
|
|
|
// WatchDog is notified by Client around backend calls: Mark is invoked with
// the backend address before the call is issued and UnMark once the call has
// returned. What an implementation does with these notifications is not
// defined here.
type WatchDog interface {
	// Mark signals that a call to the backend at address is starting.
	Mark(address string)
	// UnMark signals that the call to the backend at address has finished.
	UnMark(address string)
}
|
|
|
|
|
2023-08-19 01:49:33 +02:00
|
|
|
func (c *Client) IsBusy() bool {
|
|
|
|
c.Lock()
|
|
|
|
defer c.Unlock()
|
|
|
|
return c.busy
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *Client) setBusy(v bool) {
|
|
|
|
c.Lock()
|
|
|
|
c.busy = v
|
|
|
|
c.Unlock()
|
|
|
|
}
|
|
|
|
|
2024-01-08 00:37:02 +01:00
|
|
|
func (c *Client) HealthCheck(ctx context.Context) (bool, error) {
|
2023-11-16 22:20:16 +01:00
|
|
|
if !c.parallel {
|
|
|
|
c.opMutex.Lock()
|
|
|
|
defer c.opMutex.Unlock()
|
|
|
|
}
|
2023-08-19 01:49:33 +02:00
|
|
|
c.setBusy(true)
|
|
|
|
defer c.setBusy(false)
|
2023-07-15 01:19:43 +02:00
|
|
|
conn, err := grpc.Dial(c.address, grpc.WithTransportCredentials(insecure.NewCredentials()))
|
|
|
|
if err != nil {
|
2024-01-08 00:37:02 +01:00
|
|
|
return false, err
|
2023-07-15 01:19:43 +02:00
|
|
|
}
|
|
|
|
defer conn.Close()
|
2023-07-15 01:19:43 +02:00
|
|
|
client := pb.NewBackendClient(conn)
|
2023-07-15 01:19:43 +02:00
|
|
|
|
|
|
|
// The healthcheck call shouldn't take long time
|
|
|
|
ctx, cancel := context.WithTimeout(ctx, 10*time.Second)
|
|
|
|
defer cancel()
|
|
|
|
|
|
|
|
res, err := client.Health(ctx, &pb.HealthMessage{})
|
|
|
|
if err != nil {
|
2024-01-08 00:37:02 +01:00
|
|
|
return false, err
|
2023-07-15 01:19:43 +02:00
|
|
|
}
|
|
|
|
|
2023-07-27 18:41:04 +02:00
|
|
|
if string(res.Message) == "OK" {
|
2024-01-08 00:37:02 +01:00
|
|
|
return true, nil
|
2023-07-15 01:19:43 +02:00
|
|
|
}
|
2024-01-08 00:37:02 +01:00
|
|
|
|
|
|
|
return false, fmt.Errorf("health check failed: %s", res.Message)
|
2023-07-15 01:19:43 +02:00
|
|
|
}
|
|
|
|
|
2023-07-15 01:19:43 +02:00
|
|
|
func (c *Client) Embeddings(ctx context.Context, in *pb.PredictOptions, opts ...grpc.CallOption) (*pb.EmbeddingResult, error) {
|
2023-11-16 22:20:16 +01:00
|
|
|
if !c.parallel {
|
|
|
|
c.opMutex.Lock()
|
|
|
|
defer c.opMutex.Unlock()
|
|
|
|
}
|
2023-08-19 01:49:33 +02:00
|
|
|
c.setBusy(true)
|
|
|
|
defer c.setBusy(false)
|
2023-11-26 18:36:23 +01:00
|
|
|
if c.wd != nil {
|
|
|
|
c.wd.Mark(c.address)
|
|
|
|
defer c.wd.UnMark(c.address)
|
|
|
|
}
|
2023-07-15 01:19:43 +02:00
|
|
|
conn, err := grpc.Dial(c.address, grpc.WithTransportCredentials(insecure.NewCredentials()))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer conn.Close()
|
2023-07-15 01:19:43 +02:00
|
|
|
client := pb.NewBackendClient(conn)
|
2023-07-15 01:19:43 +02:00
|
|
|
|
|
|
|
return client.Embedding(ctx, in, opts...)
|
|
|
|
}
|
|
|
|
|
2023-07-15 01:19:43 +02:00
|
|
|
func (c *Client) Predict(ctx context.Context, in *pb.PredictOptions, opts ...grpc.CallOption) (*pb.Reply, error) {
|
2023-11-16 22:20:16 +01:00
|
|
|
if !c.parallel {
|
|
|
|
c.opMutex.Lock()
|
|
|
|
defer c.opMutex.Unlock()
|
|
|
|
}
|
2023-08-19 01:49:33 +02:00
|
|
|
c.setBusy(true)
|
|
|
|
defer c.setBusy(false)
|
2023-11-26 18:36:23 +01:00
|
|
|
if c.wd != nil {
|
|
|
|
c.wd.Mark(c.address)
|
|
|
|
defer c.wd.UnMark(c.address)
|
|
|
|
}
|
2023-07-15 01:19:43 +02:00
|
|
|
conn, err := grpc.Dial(c.address, grpc.WithTransportCredentials(insecure.NewCredentials()))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer conn.Close()
|
2023-07-15 01:19:43 +02:00
|
|
|
client := pb.NewBackendClient(conn)
|
2023-07-15 01:19:43 +02:00
|
|
|
|
|
|
|
return client.Predict(ctx, in, opts...)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *Client) LoadModel(ctx context.Context, in *pb.ModelOptions, opts ...grpc.CallOption) (*pb.Result, error) {
|
2023-11-16 22:20:16 +01:00
|
|
|
if !c.parallel {
|
|
|
|
c.opMutex.Lock()
|
|
|
|
defer c.opMutex.Unlock()
|
|
|
|
}
|
2023-08-19 01:49:33 +02:00
|
|
|
c.setBusy(true)
|
|
|
|
defer c.setBusy(false)
|
2023-11-26 18:36:23 +01:00
|
|
|
if c.wd != nil {
|
|
|
|
c.wd.Mark(c.address)
|
|
|
|
defer c.wd.UnMark(c.address)
|
|
|
|
}
|
2023-07-15 01:19:43 +02:00
|
|
|
conn, err := grpc.Dial(c.address, grpc.WithTransportCredentials(insecure.NewCredentials()))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer conn.Close()
|
2023-07-15 01:19:43 +02:00
|
|
|
client := pb.NewBackendClient(conn)
|
2023-07-15 01:19:43 +02:00
|
|
|
return client.LoadModel(ctx, in, opts...)
|
|
|
|
}
|
|
|
|
|
2023-07-27 18:41:04 +02:00
|
|
|
func (c *Client) PredictStream(ctx context.Context, in *pb.PredictOptions, f func(s []byte), opts ...grpc.CallOption) error {
|
2023-11-16 22:20:16 +01:00
|
|
|
if !c.parallel {
|
|
|
|
c.opMutex.Lock()
|
|
|
|
defer c.opMutex.Unlock()
|
|
|
|
}
|
2023-08-19 01:49:33 +02:00
|
|
|
c.setBusy(true)
|
|
|
|
defer c.setBusy(false)
|
2023-11-26 18:36:23 +01:00
|
|
|
if c.wd != nil {
|
|
|
|
c.wd.Mark(c.address)
|
|
|
|
defer c.wd.UnMark(c.address)
|
|
|
|
}
|
2023-07-15 01:19:43 +02:00
|
|
|
conn, err := grpc.Dial(c.address, grpc.WithTransportCredentials(insecure.NewCredentials()))
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
defer conn.Close()
|
2023-07-15 01:19:43 +02:00
|
|
|
client := pb.NewBackendClient(conn)
|
2023-07-15 01:19:43 +02:00
|
|
|
|
|
|
|
stream, err := client.PredictStream(ctx, in, opts...)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
for {
|
|
|
|
feature, err := stream.Recv()
|
|
|
|
if err == io.EOF {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
if err != nil {
|
|
|
|
fmt.Println("Error", err)
|
|
|
|
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
f(feature.GetMessage())
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
2023-07-15 01:19:43 +02:00
|
|
|
|
|
|
|
func (c *Client) GenerateImage(ctx context.Context, in *pb.GenerateImageRequest, opts ...grpc.CallOption) (*pb.Result, error) {
|
2023-11-16 22:20:16 +01:00
|
|
|
if !c.parallel {
|
|
|
|
c.opMutex.Lock()
|
|
|
|
defer c.opMutex.Unlock()
|
|
|
|
}
|
2023-08-19 01:49:33 +02:00
|
|
|
c.setBusy(true)
|
|
|
|
defer c.setBusy(false)
|
2023-11-26 18:36:23 +01:00
|
|
|
if c.wd != nil {
|
|
|
|
c.wd.Mark(c.address)
|
|
|
|
defer c.wd.UnMark(c.address)
|
|
|
|
}
|
2023-07-15 01:19:43 +02:00
|
|
|
conn, err := grpc.Dial(c.address, grpc.WithTransportCredentials(insecure.NewCredentials()))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer conn.Close()
|
|
|
|
client := pb.NewBackendClient(conn)
|
|
|
|
return client.GenerateImage(ctx, in, opts...)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *Client) TTS(ctx context.Context, in *pb.TTSRequest, opts ...grpc.CallOption) (*pb.Result, error) {
|
2023-11-16 22:20:16 +01:00
|
|
|
if !c.parallel {
|
|
|
|
c.opMutex.Lock()
|
|
|
|
defer c.opMutex.Unlock()
|
|
|
|
}
|
2023-08-19 01:49:33 +02:00
|
|
|
c.setBusy(true)
|
|
|
|
defer c.setBusy(false)
|
2023-11-26 18:36:23 +01:00
|
|
|
if c.wd != nil {
|
|
|
|
c.wd.Mark(c.address)
|
|
|
|
defer c.wd.UnMark(c.address)
|
|
|
|
}
|
2023-07-15 01:19:43 +02:00
|
|
|
conn, err := grpc.Dial(c.address, grpc.WithTransportCredentials(insecure.NewCredentials()))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer conn.Close()
|
|
|
|
client := pb.NewBackendClient(conn)
|
|
|
|
return client.TTS(ctx, in, opts...)
|
|
|
|
}
|
|
|
|
|
2024-01-05 12:04:46 -05:00
|
|
|
func (c *Client) AudioTranscription(ctx context.Context, in *pb.TranscriptRequest, opts ...grpc.CallOption) (*schema.Result, error) {
|
2023-11-16 22:20:16 +01:00
|
|
|
if !c.parallel {
|
|
|
|
c.opMutex.Lock()
|
|
|
|
defer c.opMutex.Unlock()
|
|
|
|
}
|
2023-08-19 01:49:33 +02:00
|
|
|
c.setBusy(true)
|
|
|
|
defer c.setBusy(false)
|
2023-11-26 18:36:23 +01:00
|
|
|
if c.wd != nil {
|
|
|
|
c.wd.Mark(c.address)
|
|
|
|
defer c.wd.UnMark(c.address)
|
|
|
|
}
|
2023-07-15 01:19:43 +02:00
|
|
|
conn, err := grpc.Dial(c.address, grpc.WithTransportCredentials(insecure.NewCredentials()))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer conn.Close()
|
|
|
|
client := pb.NewBackendClient(conn)
|
|
|
|
res, err := client.AudioTranscription(ctx, in, opts...)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2024-01-05 12:04:46 -05:00
|
|
|
tresult := &schema.Result{}
|
2023-07-15 01:19:43 +02:00
|
|
|
for _, s := range res.Segments {
|
|
|
|
tks := []int{}
|
|
|
|
for _, t := range s.Tokens {
|
|
|
|
tks = append(tks, int(t))
|
|
|
|
}
|
|
|
|
tresult.Segments = append(tresult.Segments,
|
2024-01-05 12:04:46 -05:00
|
|
|
schema.Segment{
|
2023-07-15 01:19:43 +02:00
|
|
|
Text: s.Text,
|
|
|
|
Id: int(s.Id),
|
|
|
|
Start: time.Duration(s.Start),
|
|
|
|
End: time.Duration(s.End),
|
|
|
|
Tokens: tks,
|
|
|
|
})
|
|
|
|
}
|
|
|
|
tresult.Text = res.Text
|
|
|
|
return tresult, err
|
|
|
|
}
|
2023-08-18 15:23:14 -04:00
|
|
|
|
|
|
|
func (c *Client) TokenizeString(ctx context.Context, in *pb.PredictOptions, opts ...grpc.CallOption) (*pb.TokenizationResponse, error) {
|
2023-11-16 22:20:16 +01:00
|
|
|
if !c.parallel {
|
|
|
|
c.opMutex.Lock()
|
|
|
|
defer c.opMutex.Unlock()
|
|
|
|
}
|
2023-08-19 01:49:33 +02:00
|
|
|
c.setBusy(true)
|
|
|
|
defer c.setBusy(false)
|
2023-11-26 18:36:23 +01:00
|
|
|
if c.wd != nil {
|
|
|
|
c.wd.Mark(c.address)
|
|
|
|
defer c.wd.UnMark(c.address)
|
|
|
|
}
|
2023-08-18 15:23:14 -04:00
|
|
|
conn, err := grpc.Dial(c.address, grpc.WithTransportCredentials(insecure.NewCredentials()))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer conn.Close()
|
|
|
|
client := pb.NewBackendClient(conn)
|
|
|
|
|
|
|
|
res, err := client.TokenizeString(ctx, in, opts...)
|
|
|
|
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
return res, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *Client) Status(ctx context.Context) (*pb.StatusResponse, error) {
|
2023-11-16 22:20:16 +01:00
|
|
|
if !c.parallel {
|
|
|
|
c.opMutex.Lock()
|
|
|
|
defer c.opMutex.Unlock()
|
|
|
|
}
|
2023-08-19 01:49:33 +02:00
|
|
|
c.setBusy(true)
|
|
|
|
defer c.setBusy(false)
|
2023-08-18 15:23:14 -04:00
|
|
|
conn, err := grpc.Dial(c.address, grpc.WithTransportCredentials(insecure.NewCredentials()))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer conn.Close()
|
|
|
|
client := pb.NewBackendClient(conn)
|
|
|
|
return client.Status(ctx, &pb.HealthMessage{})
|
|
|
|
}
|