2024-04-18 22:43:12 +02:00
package functions
import (
"encoding/json"
2024-07-18 17:52:22 +02:00
"errors"
"io"
2024-04-18 22:43:12 +02:00
"regexp"
2024-05-28 21:06:09 +02:00
"strings"
2024-04-18 22:43:12 +02:00
2024-07-26 20:11:29 +02:00
"github.com/mudler/LocalAI/pkg/functions/grammars"
2024-06-23 01:24:36 -07:00
"github.com/mudler/LocalAI/pkg/utils"
2024-04-18 22:43:12 +02:00
"github.com/rs/zerolog/log"
)
2024-05-22 00:14:16 +02:00
// GrammarConfig groups the settings that control how the grammar used to
// constrain the LLM output is generated.
type GrammarConfig struct {
	// ParallelCalls lets the LLM return multiple function calls in the same response.
	ParallelCalls bool ` yaml:"parallel_calls" `

	// DisableParallelNewLines is forwarded to the grammar generator as
	// grammars.DisableParallelNewLines (see GrammarOptions).
	DisableParallelNewLines bool ` yaml:"disable_parallel_new_lines" `

	// MixedMode lets the LLM return plain strings and not only JSON objects.
	// This keeps the model from being constrained to JSON, so it can also
	// send messages back to the user.
	MixedMode bool ` yaml:"mixed_mode" `

	// NoMixedFreeString disables the mixed mode for free strings.
	// When set, the LLM returns either a JSON object or a free string, but
	// not a mix of both.
	// When unset (default), the LLM can return a JSON object surrounded by
	// free strings (e.g. `this is the JSON result: { "bar": "baz" } for your question`).
	// At least one JSON object is still required, but the output is not strict.
	NoMixedFreeString bool ` yaml:"no_mixed_free_string" `

	// NoGrammar disables the grammar parsing and parses the responses
	// directly from the LLM.
	NoGrammar bool ` yaml:"disable" `

	// Prefix is a string attached to the grammar when it is generated
	// (passed to grammars.SetPrefix when non-empty).
	// This is useful when models prepend a tag before returning JSON.
	Prefix string ` yaml:"prefix" `

	// ExpectStringsAfterJSON enables a mixed string suffix.
	ExpectStringsAfterJSON bool ` yaml:"expect_strings_after_json" `

	// PropOrder selects the order in which properties are printed.
	// For instance `name,arguments` prints { "name": "foo", "arguments": { "bar": "baz" } }
	// instead of { "arguments": { "bar": "baz" }, "name": "foo" }.
	PropOrder string ` yaml:"properties_order" `

	// SchemaType forces the grammar to use a specific schema type.
	// Available: json, llama3.1
	SchemaType string ` yaml:"schema_type" `
}
2024-05-15 20:03:18 +02:00
// FunctionsConfig is the configuration for the tool/function call.
// It includes setting to map the function name and arguments from the response
// and, for instance, also if processing the requests with BNF grammars.
2024-04-18 22:43:12 +02:00
type FunctionsConfig struct {
2024-05-15 20:03:18 +02:00
// DisableNoAction disables the "no action" tool
// By default we inject a tool that does nothing and is used to return an answer from the LLM
DisableNoAction bool ` yaml:"disable_no_action" `
2024-05-22 00:14:16 +02:00
// Grammar is the configuration for the grammar
GrammarConfig GrammarConfig ` yaml:"grammar" `
2024-05-15 20:03:18 +02:00
// NoActionFunctionName is the name of the function that does nothing. It defaults to "answer"
NoActionFunctionName string ` yaml:"no_action_function_name" `
// NoActionDescriptionName is the name of the function that returns the description of the no action function
2024-04-18 22:43:12 +02:00
NoActionDescriptionName string ` yaml:"no_action_description_name" `
2024-05-12 01:13:22 +02:00
2024-05-15 20:03:18 +02:00
// ResponseRegex is a named regex to extract the function name and arguments from the response
2024-05-31 22:52:02 +02:00
ResponseRegex [ ] string ` yaml:"response_regex" `
2024-05-15 20:03:18 +02:00
// JSONRegexMatch is a regex to extract the JSON object from the response
2024-05-19 18:24:49 +02:00
JSONRegexMatch [ ] string ` yaml:"json_regex_match" `
2024-05-14 09:39:20 +02:00
2024-05-22 00:14:16 +02:00
// ReplaceFunctionResults allow to replace strings in the results before parsing them
ReplaceFunctionResults [ ] ReplaceResult ` yaml:"replace_function_results" `
2024-05-15 20:03:18 +02:00
2024-05-22 00:14:16 +02:00
// ReplaceLLMResult allow to replace strings in the results before parsing them
ReplaceLLMResult [ ] ReplaceResult ` yaml:"replace_llm_results" `
2024-05-15 20:03:18 +02:00
2024-05-28 21:06:09 +02:00
// CaptureLLMResult is a regex to extract a string from the LLM response
// that is used as return string when using tools.
// This is useful for e.g. if the LLM outputs a reasoning and we want to get the reasoning as a string back
CaptureLLMResult [ ] string ` yaml:"capture_llm_results" `
2024-05-12 01:13:22 +02:00
// FunctionName enable the LLM to return { "name": "function_name", "arguments": { "arg1": "value1", "arg2": "value2" } }
// instead of { "function": "function_name", "arguments": { "arg1": "value1", "arg2": "value2" } }.
// This might be useful for certain models trained with the function name as the first token.
2024-07-18 17:52:22 +02:00
FunctionNameKey string ` yaml:"function_name_key" `
FunctionArgumentsKey string ` yaml:"function_arguments_key" `
2024-04-18 22:43:12 +02:00
}
2024-05-20 08:31:06 +02:00
// ReplaceResult is a single substitution rule read from the configuration.
type ReplaceResult struct {
	// Key is the pattern to look for. The functions applying the rule
	// (CleanupLLMResult, ParseFunctionCall) compile it as a regular expression.
	Key string ` yaml:"key" `

	// Value is the replacement text substituted for every match of Key.
	Value string ` yaml:"value" `
}
2024-04-18 22:43:12 +02:00
// FuncCallResults is one function call extracted from an LLM response.
type FuncCallResults struct {
	// Name is the name of the function to call.
	Name string

	// Arguments holds the call arguments as a string. ParseFunctionCall fills
	// it with either the JSON encoding of the parsed arguments or the raw
	// text captured by a response regex.
	Arguments string
}
2024-07-26 20:11:29 +02:00
func ( g FunctionsConfig ) GrammarOptions ( ) [ ] func ( o * grammars . GrammarOption ) {
opts := [ ] func ( o * grammars . GrammarOption ) { }
if g . GrammarConfig . MixedMode {
opts = append ( opts , grammars . EnableMaybeString )
}
if g . GrammarConfig . ParallelCalls {
opts = append ( opts , grammars . EnableMaybeArray )
2024-05-22 00:14:16 +02:00
}
2024-07-26 20:11:29 +02:00
if g . GrammarConfig . DisableParallelNewLines {
opts = append ( opts , grammars . DisableParallelNewLines )
2024-05-22 00:14:16 +02:00
}
2024-07-26 20:11:29 +02:00
if g . GrammarConfig . Prefix != "" {
opts = append ( opts , grammars . SetPrefix ( g . GrammarConfig . Prefix ) )
2024-05-23 19:16:08 +02:00
}
2024-07-26 20:11:29 +02:00
if g . GrammarConfig . NoMixedFreeString {
opts = append ( opts , grammars . NoMixedFreeString )
2024-05-22 00:14:16 +02:00
}
2024-07-26 20:11:29 +02:00
if g . GrammarConfig . ExpectStringsAfterJSON {
opts = append ( opts , grammars . ExpectStringsAfterJSON )
2024-05-22 00:14:16 +02:00
}
2024-07-26 20:11:29 +02:00
if g . GrammarConfig . SchemaType != "" {
opts = append ( opts , grammars . WithSchemaType ( grammars . NewType ( g . GrammarConfig . SchemaType ) ) )
}
if g . FunctionNameKey != "" {
opts = append ( opts , grammars . WithFunctionName ( g . FunctionNameKey ) )
2024-05-31 09:36:27 +02:00
}
2024-06-26 14:59:02 +02:00
2024-07-26 20:11:29 +02:00
opts = append ( opts , grammars . SetPropOrder ( g . GrammarConfig . PropOrder ) )
2024-05-22 00:14:16 +02:00
return opts
}
func CleanupLLMResult ( llmresult string , functionConfig FunctionsConfig ) string {
2024-05-15 20:03:18 +02:00
log . Debug ( ) . Msgf ( "LLM result: %s" , llmresult )
2024-05-22 00:14:16 +02:00
for _ , item := range functionConfig . ReplaceLLMResult {
2024-05-20 08:31:06 +02:00
k , v := item . Key , item . Value
2024-05-15 20:03:18 +02:00
log . Debug ( ) . Msgf ( "Replacing %s with %s" , k , v )
2024-05-18 16:29:10 -07:00
re := regexp . MustCompile ( k )
llmresult = re . ReplaceAllString ( llmresult , v )
2024-05-15 20:03:18 +02:00
}
log . Debug ( ) . Msgf ( "LLM result(processed): %s" , llmresult )
2024-05-22 00:14:16 +02:00
return llmresult
}
2024-05-28 21:06:09 +02:00
func ParseTextContent ( llmresult string , functionConfig FunctionsConfig ) string {
2024-05-31 09:36:27 +02:00
log . Debug ( ) . Msgf ( "ParseTextContent: %s" , llmresult )
log . Debug ( ) . Msgf ( "CaptureLLMResult: %s" , functionConfig . CaptureLLMResult )
2024-05-28 21:06:09 +02:00
for _ , r := range functionConfig . CaptureLLMResult {
// We use a regex to extract the JSON object from the response
var respRegex = regexp . MustCompile ( r )
match := respRegex . FindStringSubmatch ( llmresult )
if len ( match ) >= 1 {
m := strings . TrimSpace ( match [ 1 ] )
return m
}
}
return ""
}
2024-07-18 17:52:22 +02:00
// ParseJSON scans s for JSON objects and returns every object it manages to
// decode, tolerating garbage in between them. For example
//
//	{ "foo": "bar" } invalid { "baz": "qux" }
//
// yields
//
//	[ { "foo": "bar" }, { "baz": "qux" } ]
//
// Decoding restarts from a shifted position after each value: past the value
// on success, or past the offset reported by the decoder on a syntax or type
// error. Any other decoding error stops the scan and is returned together
// with the objects collected so far.
//
// Credits to Michael Yang (https://github.com/mxyng) for the original
// implementation; this is a slightly reworked version.
func ParseJSON(s string) ([]map[string]any, error) {
	var parsed []map[string]any

	for pos := 0; pos < len(s); {
		dec := json.NewDecoder(strings.NewReader(s[pos:]))

		var current map[string]any
		err := dec.Decode(&current)

		// Happy path: keep the object and resume right after it.
		if err == nil {
			parsed = append(parsed, current)
			pos += int(dec.InputOffset())
			continue
		}

		// Nothing but whitespace is left.
		if errors.Is(err, io.EOF) {
			return parsed, nil
		}

		var (
			syntaxErr *json.SyntaxError
			typeErr   *json.UnmarshalTypeError
		)
		if errors.As(err, &syntaxErr) {
			// Step over the offending input and retry from there.
			pos += int(syntaxErr.Offset)
		} else if errors.As(err, &typeErr) {
			// Valid JSON that is not an object: resume from the reported offset.
			pos += int(typeErr.Offset)
		} else {
			return parsed, err
		}
	}

	return parsed, nil
}
2024-05-22 00:14:16 +02:00
func ParseFunctionCall ( llmresult string , functionConfig FunctionsConfig ) [ ] FuncCallResults {
log . Debug ( ) . Msgf ( "LLM result: %s" , llmresult )
for _ , item := range functionConfig . ReplaceFunctionResults {
k , v := item . Key , item . Value
log . Debug ( ) . Msgf ( "Replacing %s with %s" , k , v )
re := regexp . MustCompile ( k )
llmresult = re . ReplaceAllString ( llmresult , v )
}
log . Debug ( ) . Msgf ( "LLM result(function cleanup): %s" , llmresult )
2024-07-18 17:52:22 +02:00
functionNameKey := defaultFunctionNameKey
functionArgumentsKey := defaultFunctionArgumentsKey
if functionConfig . FunctionNameKey != "" {
functionNameKey = functionConfig . FunctionNameKey
}
if functionConfig . FunctionArgumentsKey != "" {
functionArgumentsKey = functionConfig . FunctionArgumentsKey
2024-05-12 01:13:22 +02:00
}
2024-04-18 22:43:12 +02:00
results := [ ] FuncCallResults { }
2024-05-28 21:06:09 +02:00
llmResults := [ ] string { }
2024-04-18 22:43:12 +02:00
2024-05-28 21:06:09 +02:00
returnResult := func ( results [ ] string ) ( result [ ] FuncCallResults , e error ) {
2024-05-14 09:39:20 +02:00
// As we have to change the result before processing, we can't stream the answer token-by-token (yet?)
2024-05-18 09:35:28 +02:00
result = make ( [ ] FuncCallResults , 0 )
2024-04-18 22:43:12 +02:00
2024-05-28 21:06:09 +02:00
for _ , s := range results {
2024-07-18 17:52:22 +02:00
var ss [ ] map [ string ] any
2024-04-18 22:43:12 +02:00
2024-05-28 21:06:09 +02:00
s = utils . EscapeNewLines ( s )
2024-07-18 17:52:22 +02:00
ss , err := ParseJSON ( s )
//err := json.Unmarshal([]byte(s), &ss)
2024-05-28 21:06:09 +02:00
if err != nil {
2024-07-18 17:52:22 +02:00
log . Debug ( ) . Err ( err ) . Str ( "escapedLLMResult" , s ) . Msg ( "unable to unmarshal llm result in a single object or an array of JSON objects" )
2024-04-18 22:43:12 +02:00
}
2024-05-18 09:35:28 +02:00
2024-05-28 21:06:09 +02:00
log . Debug ( ) . Msgf ( "Function return: %s %+v" , s , ss )
for _ , s := range ss {
// The grammar defines the function name as "function", while OpenAI returns "name"
func_name , ok := s [ functionNameKey ]
if ! ok {
continue
//return result, fmt.Errorf("unable to find function name in result")
}
// Similarly, while here arguments is a map[string]interface{}, OpenAI actually want a stringified object
2024-07-18 17:52:22 +02:00
args , ok := s [ functionArgumentsKey ] // arguments needs to be a string, but we return an object from the grammar result (TODO: fix)
2024-05-28 21:06:09 +02:00
if ! ok {
continue
//return result, fmt.Errorf("unable to find arguments in result")
}
d , _ := json . Marshal ( args )
funcName , ok := func_name . ( string )
if ! ok {
continue
//return result, fmt.Errorf("unable to cast function name to string")
}
result = append ( result , FuncCallResults { Name : funcName , Arguments : string ( d ) } )
}
2024-04-18 22:43:12 +02:00
}
2024-05-18 09:35:28 +02:00
return result , nil
}
// the response is a string that we have to parse
result := make ( map [ string ] string )
2024-05-19 18:24:49 +02:00
if len ( functionConfig . JSONRegexMatch ) != 0 {
for _ , r := range functionConfig . JSONRegexMatch {
// We use a regex to extract the JSON object from the response
var respRegex = regexp . MustCompile ( r )
2024-05-28 21:06:09 +02:00
match := respRegex . FindAllStringSubmatch ( llmresult , - 1 )
var allMatches [ ] string
for _ , m := range match {
if len ( m ) > 1 {
// we match the first group
allMatches = append ( allMatches , m [ 1 ] )
}
}
if len ( allMatches ) > 0 {
llmResults = append ( llmResults , allMatches ... )
2024-05-19 18:24:49 +02:00
break
}
}
}
2024-05-31 22:52:02 +02:00
if len ( functionConfig . ResponseRegex ) > 0 {
2024-05-18 09:35:28 +02:00
// We use named regexes here to extract the function name and arguments
// obviously, this expects the LLM to be stable and return correctly formatted JSON
// TODO: optimize this and pre-compile it
2024-05-31 22:52:02 +02:00
for _ , r := range functionConfig . ResponseRegex {
var respRegex = regexp . MustCompile ( r )
matches := respRegex . FindAllStringSubmatch ( llmresult , - 1 )
for _ , match := range matches {
for i , name := range respRegex . SubexpNames ( ) {
if i != 0 && name != "" && len ( match ) > i {
result [ name ] = match [ i ]
}
2024-05-28 21:06:09 +02:00
}
2024-05-18 09:35:28 +02:00
2024-05-31 22:52:02 +02:00
functionName := result [ functionNameKey ]
if functionName == "" {
return results
}
2024-07-18 17:52:22 +02:00
results = append ( results , FuncCallResults { Name : result [ functionNameKey ] , Arguments : result [ functionArgumentsKey ] } )
2024-05-28 21:06:09 +02:00
}
2024-04-18 22:43:12 +02:00
}
2024-05-18 09:35:28 +02:00
} else {
2024-05-28 21:06:09 +02:00
if len ( llmResults ) == 0 {
llmResults = append ( llmResults , llmresult )
}
results , _ = returnResult ( llmResults )
2024-04-18 22:43:12 +02:00
}
return results
}