2023-03-18 23:59:06 +01:00
package main
import (
2023-10-14 12:27:35 +02:00
"context"
2023-10-12 10:45:34 +02:00
"encoding/json"
2023-10-14 12:27:35 +02:00
"errors"
2023-10-12 10:45:34 +02:00
"fmt"
2023-03-18 23:59:06 +01:00
"os"
2023-07-15 01:19:43 +02:00
"os/signal"
2023-05-03 23:03:31 +02:00
"path/filepath"
2023-07-20 22:10:12 +02:00
"strings"
2023-07-15 01:19:43 +02:00
"syscall"
2023-11-26 18:36:23 +01:00
"time"
2023-05-03 23:03:31 +02:00
2023-04-19 18:43:10 +02:00
api "github.com/go-skynet/LocalAI/api"
2023-10-14 12:27:35 +02:00
"github.com/go-skynet/LocalAI/api/backend"
2023-10-15 09:17:41 +02:00
config "github.com/go-skynet/LocalAI/api/config"
2023-07-15 01:19:43 +02:00
"github.com/go-skynet/LocalAI/api/options"
2023-06-26 15:12:43 +02:00
"github.com/go-skynet/LocalAI/internal"
2023-11-16 08:20:05 +01:00
"github.com/go-skynet/LocalAI/metrics"
2023-10-12 10:45:34 +02:00
"github.com/go-skynet/LocalAI/pkg/gallery"
2023-04-19 18:43:10 +02:00
model "github.com/go-skynet/LocalAI/pkg/model"
2023-04-20 18:33:02 +02:00
"github.com/rs/zerolog"
"github.com/rs/zerolog/log"
2023-10-12 10:45:34 +02:00
progressbar "github.com/schollz/progressbar/v3"
2023-03-18 23:59:06 +01:00
"github.com/urfave/cli/v2"
)
2023-04-19 18:43:10 +02:00
func main ( ) {
2023-04-20 18:33:02 +02:00
log . Logger = log . Output ( zerolog . ConsoleWriter { Out : os . Stderr } )
2023-07-15 01:19:43 +02:00
// clean up process
go func ( ) {
c := make ( chan os . Signal , 1 ) // we need to reserve to buffer size 1, so the notifier are not blocked
signal . Notify ( c , os . Interrupt , syscall . SIGTERM )
<- c
os . Exit ( 1 )
} ( )
2023-04-20 18:33:02 +02:00
2023-04-19 18:43:10 +02:00
path , err := os . Getwd ( )
2023-03-18 23:59:06 +01:00
if err != nil {
2023-04-20 18:33:02 +02:00
log . Error ( ) . Msgf ( "error: %s" , err . Error ( ) )
2023-04-19 18:43:10 +02:00
os . Exit ( 1 )
2023-03-18 23:59:06 +01:00
}
app := & cli . App {
2023-06-26 15:12:43 +02:00
Name : "LocalAI" ,
Version : internal . PrintableVersion ( ) ,
Usage : "OpenAI compatible API for running LLaMA/GPT models locally on CPU with consumer grade hardware." ,
2023-04-19 18:43:10 +02:00
Flags : [ ] cli . Flag {
& cli . BoolFlag {
Name : "f16" ,
EnvVars : [ ] string { "F16" } ,
} ,
2023-07-20 22:10:12 +02:00
& cli . BoolFlag {
Name : "autoload-galleries" ,
EnvVars : [ ] string { "AUTOLOAD_GALLERIES" } ,
} ,
2023-04-20 18:33:02 +02:00
& cli . BoolFlag {
Name : "debug" ,
EnvVars : [ ] string { "DEBUG" } ,
} ,
2023-08-19 01:49:33 +02:00
& cli . BoolFlag {
Name : "single-active-backend" ,
EnvVars : [ ] string { "SINGLE_ACTIVE_BACKEND" } ,
Usage : "Allow only one backend to be running." ,
} ,
2023-11-16 08:20:05 +01:00
& cli . BoolFlag {
Name : "parallel-requests" ,
EnvVars : [ ] string { "PARALLEL_REQUESTS" } ,
Usage : "Enable backends to handle multiple requests in parallel. This is for backends that supports multiple requests in parallel, like llama.cpp or vllm" ,
} ,
2023-05-21 14:38:25 +02:00
& cli . BoolFlag {
Name : "cors" ,
EnvVars : [ ] string { "CORS" } ,
} ,
& cli . StringFlag {
Name : "cors-allow-origins" ,
EnvVars : [ ] string { "CORS_ALLOW_ORIGINS" } ,
} ,
2023-04-19 18:43:10 +02:00
& cli . IntFlag {
2023-06-03 14:25:30 +02:00
Name : "threads" ,
Usage : "Number of threads used for parallel computation. Usage of the number of physical cores in the system is suggested." ,
EnvVars : [ ] string { "THREADS" } ,
Value : 4 ,
2023-03-18 23:59:06 +01:00
} ,
& cli . StringFlag {
2023-06-03 14:25:30 +02:00
Name : "models-path" ,
Usage : "Path containing models used for inferencing" ,
EnvVars : [ ] string { "MODELS_PATH" } ,
Value : filepath . Join ( path , "models" ) ,
2023-03-18 23:59:06 +01:00
} ,
2023-06-24 08:18:17 +02:00
& cli . StringFlag {
Name : "galleries" ,
Usage : "JSON list of galleries" ,
EnvVars : [ ] string { "GALLERIES" } ,
} ,
2023-05-27 09:26:33 +02:00
& cli . StringFlag {
2023-06-03 14:25:30 +02:00
Name : "preload-models" ,
Usage : "A List of models to apply in JSON at start" ,
EnvVars : [ ] string { "PRELOAD_MODELS" } ,
2023-05-27 09:26:33 +02:00
} ,
& cli . StringFlag {
2023-06-03 14:25:30 +02:00
Name : "preload-models-config" ,
Usage : "A List of models to apply at startup. Path to a YAML config file" ,
EnvVars : [ ] string { "PRELOAD_MODELS_CONFIG" } ,
2023-05-27 09:26:33 +02:00
} ,
2023-04-27 06:18:18 +02:00
& cli . StringFlag {
2023-06-03 14:25:30 +02:00
Name : "config-file" ,
Usage : "Config file" ,
EnvVars : [ ] string { "CONFIG_FILE" } ,
2023-04-27 06:18:18 +02:00
} ,
2023-03-18 23:59:06 +01:00
& cli . StringFlag {
2023-06-03 14:25:30 +02:00
Name : "address" ,
Usage : "Bind address for the API server." ,
EnvVars : [ ] string { "ADDRESS" } ,
Value : ":8080" ,
2023-04-19 18:43:10 +02:00
} ,
2023-05-16 19:32:53 +02:00
& cli . StringFlag {
2023-06-03 14:25:30 +02:00
Name : "image-path" ,
Usage : "Image directory" ,
EnvVars : [ ] string { "IMAGE_PATH" } ,
2023-06-22 17:53:10 +02:00
Value : "/tmp/generated/images" ,
} ,
& cli . StringFlag {
Name : "audio-path" ,
Usage : "audio directory" ,
EnvVars : [ ] string { "AUDIO_PATH" } ,
Value : "/tmp/generated/audio" ,
2023-05-16 19:32:53 +02:00
} ,
2023-06-01 23:38:52 +02:00
& cli . StringFlag {
2023-06-03 14:25:30 +02:00
Name : "backend-assets-path" ,
Usage : "Path used to extract libraries that are required by some of the backends in runtime." ,
EnvVars : [ ] string { "BACKEND_ASSETS_PATH" } ,
Value : "/tmp/localai/backend_data" ,
2023-06-01 23:38:52 +02:00
} ,
2023-07-20 22:10:12 +02:00
& cli . StringSliceFlag {
Name : "external-grpc-backends" ,
Usage : "A list of external grpc backends" ,
EnvVars : [ ] string { "EXTERNAL_GRPC_BACKENDS" } ,
} ,
2023-04-19 18:43:10 +02:00
& cli . IntFlag {
2023-06-03 14:25:30 +02:00
Name : "context-size" ,
Usage : "Default context size of the model" ,
EnvVars : [ ] string { "CONTEXT_SIZE" } ,
Value : 512 ,
2023-04-19 18:43:10 +02:00
} ,
2023-05-12 10:04:20 +02:00
& cli . IntFlag {
2023-06-03 14:25:30 +02:00
Name : "upload-limit" ,
Usage : "Default upload-limit. MB" ,
EnvVars : [ ] string { "UPLOAD_LIMIT" } ,
Value : 15 ,
2023-05-12 10:04:20 +02:00
} ,
2023-08-09 17:06:21 -05:00
& cli . StringSliceFlag {
Name : "api-keys" ,
Usage : "List of API Keys to enable API authentication. When this is set, all the requests must be authenticated with one of these API keys." ,
EnvVars : [ ] string { "API_KEY" } ,
} ,
2023-11-26 18:36:23 +01:00
& cli . BoolFlag {
Name : "enable-watchdog-idle" ,
Usage : "Enable watchdog for stopping idle backends. This will stop the backends if are in idle state for too long." ,
EnvVars : [ ] string { "WATCHDOG_IDLE" } ,
Value : false ,
} ,
& cli . BoolFlag {
Name : "enable-watchdog-busy" ,
Usage : "Enable watchdog for stopping busy backends that exceed a defined threshold." ,
EnvVars : [ ] string { "WATCHDOG_BUSY" } ,
Value : false ,
} ,
& cli . StringFlag {
Name : "watchdog-busy-timeout" ,
Usage : "Watchdog timeout. This will restart the backend if it crashes." ,
EnvVars : [ ] string { "WATCHDOG_BUSY_TIMEOUT" } ,
Value : "5m" ,
} ,
& cli . StringFlag {
Name : "watchdog-idle-timeout" ,
Usage : "Watchdog idle timeout. This will restart the backend if it crashes." ,
EnvVars : [ ] string { "WATCHDOG_IDLE_TIMEOUT" } ,
Value : "15m" ,
} ,
2023-08-18 15:23:14 -04:00
& cli . BoolFlag {
Name : "preload-backend-only" ,
Usage : "If set, the api is NOT launched, and only the preloaded models / backends are started. This is intended for multi-node setups." ,
EnvVars : [ ] string { "PRELOAD_BACKEND_ONLY" } ,
Value : false ,
} ,
2023-04-19 18:43:10 +02:00
} ,
Description : `
LocalAI is a drop - in replacement OpenAI API which runs inference locally .
2023-03-18 23:59:06 +01:00
2023-04-19 18:43:10 +02:00
Some of the models compatible are :
- Vicuna
- Koala
- GPT4ALL
- GPT4ALL - J
2023-04-21 00:06:55 +02:00
- Cerebras
2023-04-19 18:43:10 +02:00
- Alpaca
2023-04-21 00:06:55 +02:00
- StableLM ( ggml quantized )
2023-03-18 23:59:06 +01:00
2023-07-02 11:15:05 +02:00
For a list of compatible model , check out : https : //localai.io/model-compatibility/index.html
2023-03-18 23:59:06 +01:00
` ,
2023-04-19 18:43:10 +02:00
UsageText : ` local-ai [options] ` ,
2023-07-02 11:15:05 +02:00
Copyright : "Ettore Di Giacinto" ,
2023-03-18 23:59:06 +01:00
Action : func ( ctx * cli . Context ) error {
2023-07-20 22:10:12 +02:00
opts := [ ] options . AppOption {
2023-07-15 01:19:43 +02:00
options . WithConfigFile ( ctx . String ( "config-file" ) ) ,
options . WithJSONStringPreload ( ctx . String ( "preload-models" ) ) ,
options . WithYAMLConfigPreload ( ctx . String ( "preload-models-config" ) ) ,
options . WithModelLoader ( model . NewModelLoader ( ctx . String ( "models-path" ) ) ) ,
options . WithContextSize ( ctx . Int ( "context-size" ) ) ,
options . WithDebug ( ctx . Bool ( "debug" ) ) ,
options . WithImageDir ( ctx . String ( "image-path" ) ) ,
options . WithAudioDir ( ctx . String ( "audio-path" ) ) ,
options . WithF16 ( ctx . Bool ( "f16" ) ) ,
options . WithStringGalleries ( ctx . String ( "galleries" ) ) ,
options . WithDisableMessage ( false ) ,
options . WithCors ( ctx . Bool ( "cors" ) ) ,
options . WithCorsAllowOrigins ( ctx . String ( "cors-allow-origins" ) ) ,
options . WithThreads ( ctx . Int ( "threads" ) ) ,
options . WithBackendAssets ( backendAssets ) ,
options . WithBackendAssetsOutput ( ctx . String ( "backend-assets-path" ) ) ,
2023-07-20 22:10:12 +02:00
options . WithUploadLimitMB ( ctx . Int ( "upload-limit" ) ) ,
2023-08-09 17:06:21 -05:00
options . WithApiKeys ( ctx . StringSlice ( "api-keys" ) ) ,
2023-07-20 22:10:12 +02:00
}
2023-11-26 18:36:23 +01:00
idleWatchDog := ctx . Bool ( "enable-watchdog-idle" )
busyWatchDog := ctx . Bool ( "enable-watchdog-busy" )
if idleWatchDog || busyWatchDog {
opts = append ( opts , options . EnableWatchDog )
if idleWatchDog {
opts = append ( opts , options . EnableWatchDogIdleCheck )
dur , err := time . ParseDuration ( ctx . String ( "watchdog-idle-timeout" ) )
if err != nil {
return err
}
opts = append ( opts , options . SetWatchDogIdleTimeout ( dur ) )
}
if busyWatchDog {
opts = append ( opts , options . EnableWatchDogBusyCheck )
dur , err := time . ParseDuration ( ctx . String ( "watchdog-busy-timeout" ) )
if err != nil {
return err
}
opts = append ( opts , options . SetWatchDogBusyTimeout ( dur ) )
}
}
2023-11-16 08:20:05 +01:00
if ctx . Bool ( "parallel-requests" ) {
opts = append ( opts , options . EnableParallelBackendRequests )
}
2023-08-19 01:49:33 +02:00
if ctx . Bool ( "single-active-backend" ) {
opts = append ( opts , options . EnableSingleBackend )
}
2023-07-20 22:10:12 +02:00
externalgRPC := ctx . StringSlice ( "external-grpc-backends" )
// split ":" to get backend name and the uri
for _ , v := range externalgRPC {
backend := v [ : strings . IndexByte ( v , ':' ) ]
uri := v [ strings . IndexByte ( v , ':' ) + 1 : ]
opts = append ( opts , options . WithExternalBackend ( backend , uri ) )
}
if ctx . Bool ( "autoload-galleries" ) {
opts = append ( opts , options . EnableGalleriesAutoload )
}
2023-08-18 15:23:14 -04:00
if ctx . Bool ( "preload-backend-only" ) {
_ , _ , err := api . Startup ( opts ... )
return err
}
2023-10-17 18:22:53 +02:00
metrics , err := metrics . SetupMetrics ( )
if err != nil {
return err
}
opts = append ( opts , options . WithMetrics ( metrics ) )
2023-07-20 22:10:12 +02:00
app , err := api . App ( opts ... )
2023-05-30 12:00:30 +02:00
if err != nil {
return err
}
return app . Listen ( ctx . String ( "address" ) )
2023-03-18 23:59:06 +01:00
} ,
2023-10-12 10:45:34 +02:00
Commands : [ ] * cli . Command {
{
Name : "models" ,
Usage : "List or install models" ,
Subcommands : [ ] * cli . Command {
{
Name : "list" ,
Usage : "List the models avaiable in your galleries" ,
Action : func ( ctx * cli . Context ) error {
var galleries [ ] gallery . Gallery
if err := json . Unmarshal ( [ ] byte ( ctx . String ( "galleries" ) ) , & galleries ) ; err != nil {
log . Error ( ) . Msgf ( "unable to load galleries: %s" , err . Error ( ) )
}
models , err := gallery . AvailableGalleryModels ( galleries , ctx . String ( "models-path" ) )
if err != nil {
return err
}
for _ , model := range models {
if model . Installed {
fmt . Printf ( " * %s@%s (installed)\n" , model . Gallery . Name , model . Name )
} else {
fmt . Printf ( " - %s@%s\n" , model . Gallery . Name , model . Name )
}
}
return nil
} ,
} ,
{
Name : "install" ,
Usage : "Install a model from the gallery" ,
Action : func ( ctx * cli . Context ) error {
modelName := ctx . Args ( ) . First ( )
var galleries [ ] gallery . Gallery
if err := json . Unmarshal ( [ ] byte ( ctx . String ( "galleries" ) ) , & galleries ) ; err != nil {
log . Error ( ) . Msgf ( "unable to load galleries: %s" , err . Error ( ) )
}
progressBar := progressbar . NewOptions (
1000 ,
progressbar . OptionSetDescription ( fmt . Sprintf ( "downloading model %s" , modelName ) ) ,
progressbar . OptionShowBytes ( false ) ,
progressbar . OptionClearOnFinish ( ) ,
)
progressCallback := func ( fileName string , current string , total string , percentage float64 ) {
progressBar . Set ( int ( percentage * 10 ) )
}
err = gallery . InstallModelFromGallery ( galleries , modelName , ctx . String ( "models-path" ) , gallery . GalleryModel { } , progressCallback )
if err != nil {
return err
}
return nil
} ,
} ,
} ,
} ,
2023-10-14 12:27:35 +02:00
{
Name : "tts" ,
Usage : "Convert text to speech" ,
Flags : [ ] cli . Flag {
& cli . StringFlag {
Name : "backend" ,
Value : "piper" ,
Aliases : [ ] string { "b" } ,
Usage : "Backend to run the TTS model" ,
} ,
& cli . StringFlag {
Name : "model" ,
Aliases : [ ] string { "m" } ,
Usage : "Model name to run the TTS" ,
Required : true ,
} ,
& cli . StringFlag {
Name : "output-file" ,
Aliases : [ ] string { "o" } ,
Usage : "The path to write the output wav file" ,
} ,
} ,
Action : func ( ctx * cli . Context ) error {
modelOption := ctx . String ( "model" )
if modelOption == "" {
return errors . New ( "--model parameter is required" )
}
backendOption := ctx . String ( "backend" )
if backendOption == "" {
backendOption = "piper"
}
outputFile := ctx . String ( "output-file" )
outputDir := ctx . String ( "backend-assets-path" )
if outputFile != "" {
outputDir = filepath . Dir ( outputFile )
}
text := strings . Join ( ctx . Args ( ) . Slice ( ) , " " )
opts := & options . Option {
Loader : model . NewModelLoader ( ctx . String ( "models-path" ) ) ,
Context : context . Background ( ) ,
AudioDir : outputDir ,
AssetsDestination : ctx . String ( "backend-assets-path" ) ,
}
defer opts . Loader . StopAllGRPC ( )
filePath , _ , err := backend . ModelTTS ( backendOption , text , modelOption , opts . Loader , opts )
if err != nil {
return err
}
if outputFile != "" {
if err := os . Rename ( filePath , outputFile ) ; err != nil {
return err
}
fmt . Printf ( "Generate file %s\n" , outputFile )
} else {
fmt . Printf ( "Generate file %s\n" , filePath )
}
return nil
} ,
} ,
2023-10-15 09:17:41 +02:00
{
Name : "transcript" ,
Usage : "Convert audio to text" ,
Flags : [ ] cli . Flag {
& cli . StringFlag {
Name : "backend" ,
Value : "whisper" ,
Aliases : [ ] string { "b" } ,
Usage : "Backend to run the transcription model" ,
} ,
& cli . StringFlag {
Name : "model" ,
Aliases : [ ] string { "m" } ,
Usage : "Model name to run the transcription" ,
} ,
& cli . StringFlag {
Name : "language" ,
Aliases : [ ] string { "l" } ,
Usage : "Language of the audio file" ,
} ,
& cli . IntFlag {
Name : "threads" ,
Aliases : [ ] string { "t" } ,
Usage : "Threads to use" ,
Value : 1 ,
} ,
& cli . StringFlag {
Name : "output-file" ,
Aliases : [ ] string { "o" } ,
Usage : "The path to write the output wav file" ,
} ,
} ,
Action : func ( ctx * cli . Context ) error {
modelOption := ctx . String ( "model" )
filename := ctx . Args ( ) . First ( )
language := ctx . String ( "language" )
threads := ctx . Int ( "threads" )
opts := & options . Option {
Loader : model . NewModelLoader ( ctx . String ( "models-path" ) ) ,
Context : context . Background ( ) ,
AssetsDestination : ctx . String ( "backend-assets-path" ) ,
}
cl := config . NewConfigLoader ( )
if err := cl . LoadConfigs ( ctx . String ( "models-path" ) ) ; err != nil {
return err
}
c , exists := cl . GetConfig ( modelOption )
if ! exists {
return errors . New ( "model not found" )
}
c . Threads = threads
defer opts . Loader . StopAllGRPC ( )
tr , err := backend . ModelTranscription ( filename , language , opts . Loader , c , opts )
if err != nil {
return err
}
for _ , segment := range tr . Segments {
fmt . Println ( segment . Start . String ( ) , "-" , segment . Text )
}
return nil
} ,
} ,
2023-10-12 10:45:34 +02:00
} ,
2023-03-18 23:59:06 +01:00
}
2023-04-19 18:43:10 +02:00
err = app . Run ( os . Args )
2023-03-18 23:59:06 +01:00
if err != nil {
2023-04-20 18:33:02 +02:00
log . Error ( ) . Msgf ( "error: %s" , err . Error ( ) )
2023-03-18 23:59:06 +01:00
os . Exit ( 1 )
}
}