mirror of
https://github.com/mudler/LocalAI.git
synced 2025-04-25 13:29:58 +00:00
* chore: drop double call to stop all backends, refactors Signed-off-by: Ettore Di Giacinto <mudler@localai.io> * fix: do lock when cycling to models to delete Signed-off-by: Ettore Di Giacinto <mudler@localai.io> --------- Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
159 lines
3.8 KiB
Go
159 lines
3.8 KiB
Go
package model
|
|
|
|
import (
|
|
"errors"
|
|
"fmt"
|
|
"os"
|
|
"os/signal"
|
|
"path/filepath"
|
|
"strconv"
|
|
"strings"
|
|
"syscall"
|
|
"time"
|
|
|
|
"github.com/hpcloud/tail"
|
|
process "github.com/mudler/go-processmanager"
|
|
"github.com/rs/zerolog/log"
|
|
)
|
|
|
|
// forceBackendShutdown is true when the LOCALAI_FORCE_BACKEND_SHUTDOWN
// environment variable is exactly "true" at package initialization.
// deleteProcess consults it to decide whether to stop waiting for a busy
// backend once its retry counter exceeds 10.
var forceBackendShutdown = os.Getenv("LOCALAI_FORCE_BACKEND_SHUTDOWN") == "true"
|
|
|
|
func (ml *ModelLoader) deleteProcess(s string) error {
|
|
model, ok := ml.models[s]
|
|
if !ok {
|
|
log.Debug().Msgf("Model %s not found", s)
|
|
return fmt.Errorf("model %s not found", s)
|
|
}
|
|
|
|
defer delete(ml.models, s)
|
|
|
|
retries := 1
|
|
for model.GRPC(false, ml.wd).IsBusy() {
|
|
log.Debug().Msgf("%s busy. Waiting.", s)
|
|
dur := time.Duration(retries*2) * time.Second
|
|
if dur > retryTimeout {
|
|
dur = retryTimeout
|
|
}
|
|
time.Sleep(dur)
|
|
retries++
|
|
|
|
if retries > 10 && forceBackendShutdown {
|
|
log.Warn().Msgf("Model %s is still busy after %d retries. Forcing shutdown.", s, retries)
|
|
break
|
|
}
|
|
}
|
|
|
|
log.Debug().Msgf("Deleting process %s", s)
|
|
|
|
process := model.Process()
|
|
if process == nil {
|
|
log.Error().Msgf("No process for %s", s)
|
|
// Nothing to do as there is no process
|
|
return nil
|
|
}
|
|
|
|
err := process.Stop()
|
|
if err != nil {
|
|
log.Error().Err(err).Msgf("(deleteProcess) error while deleting process %s", s)
|
|
}
|
|
|
|
return err
|
|
}
|
|
|
|
func (ml *ModelLoader) StopGRPC(filter GRPCProcessFilter) error {
|
|
var err error = nil
|
|
ml.mu.Lock()
|
|
defer ml.mu.Unlock()
|
|
|
|
for k, m := range ml.models {
|
|
if filter(k, m.Process()) {
|
|
e := ml.deleteProcess(k)
|
|
err = errors.Join(err, e)
|
|
}
|
|
}
|
|
return err
|
|
}
|
|
|
|
func (ml *ModelLoader) StopAllGRPC() error {
|
|
return ml.StopGRPC(all)
|
|
}
|
|
|
|
func (ml *ModelLoader) GetGRPCPID(id string) (int, error) {
|
|
ml.mu.Lock()
|
|
defer ml.mu.Unlock()
|
|
p, exists := ml.models[id]
|
|
if !exists {
|
|
return -1, fmt.Errorf("no grpc backend found for %s", id)
|
|
}
|
|
if p.Process() == nil {
|
|
return -1, fmt.Errorf("no grpc backend found for %s", id)
|
|
}
|
|
return strconv.Atoi(p.Process().PID)
|
|
}
|
|
|
|
func (ml *ModelLoader) startProcess(grpcProcess, id string, serverAddress string, args ...string) (*process.Process, error) {
|
|
// Make sure the process is executable
|
|
if err := os.Chmod(grpcProcess, 0700); err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
log.Debug().Msgf("Loading GRPC Process: %s", grpcProcess)
|
|
|
|
log.Debug().Msgf("GRPC Service for %s will be running at: '%s'", id, serverAddress)
|
|
|
|
workDir, err := filepath.Abs(filepath.Dir(grpcProcess))
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
grpcControlProcess := process.New(
|
|
process.WithTemporaryStateDir(),
|
|
process.WithName(filepath.Base(grpcProcess)),
|
|
process.WithArgs(append(args, []string{"--addr", serverAddress}...)...),
|
|
process.WithEnvironment(os.Environ()...),
|
|
process.WithWorkDir(workDir),
|
|
)
|
|
|
|
if ml.wd != nil {
|
|
ml.wd.Add(serverAddress, grpcControlProcess)
|
|
ml.wd.AddAddressModelMap(serverAddress, id)
|
|
}
|
|
|
|
if err := grpcControlProcess.Run(); err != nil {
|
|
return grpcControlProcess, err
|
|
}
|
|
|
|
log.Debug().Msgf("GRPC Service state dir: %s", grpcControlProcess.StateDir())
|
|
// clean up process
|
|
go func() {
|
|
c := make(chan os.Signal, 1)
|
|
signal.Notify(c, os.Interrupt, syscall.SIGTERM)
|
|
<-c
|
|
err := grpcControlProcess.Stop()
|
|
if err != nil {
|
|
log.Error().Err(err).Msg("error while shutting down grpc process")
|
|
}
|
|
}()
|
|
|
|
go func() {
|
|
t, err := tail.TailFile(grpcControlProcess.StderrPath(), tail.Config{Follow: true})
|
|
if err != nil {
|
|
log.Debug().Msgf("Could not tail stderr")
|
|
}
|
|
for line := range t.Lines {
|
|
log.Debug().Msgf("GRPC(%s): stderr %s", strings.Join([]string{id, serverAddress}, "-"), line.Text)
|
|
}
|
|
}()
|
|
go func() {
|
|
t, err := tail.TailFile(grpcControlProcess.StdoutPath(), tail.Config{Follow: true})
|
|
if err != nil {
|
|
log.Debug().Msgf("Could not tail stdout")
|
|
}
|
|
for line := range t.Lines {
|
|
log.Debug().Msgf("GRPC(%s): stdout %s", strings.Join([]string{id, serverAddress}, "-"), line.Text)
|
|
}
|
|
}()
|
|
|
|
return grpcControlProcess, nil
|
|
}
|