lollms-webui/lollms_webui.py

1228 lines
61 KiB
Python
Raw Normal View History

2024-01-01 03:18:49 +00:00
"""
File: lollms_web_ui.py
Author: ParisNeo
Description: Singleton class for the LoLLMS web UI.
This class provides a singleton instance of the LoLLMS web UI, allowing access to its functionality and data across multiple endpoints.
"""
2024-01-04 02:57:42 +00:00
from lollms.server.elf_server import LOLLMSElfServer
2024-01-05 02:40:55 +00:00
from datetime import datetime
from lollms.databases.discussions_database import DiscussionsDB, Discussion
2024-01-05 02:40:55 +00:00
from pathlib import Path
from lollms.config import InstallOption
from lollms.types import MSG_TYPE, SENDER_TYPES
from lollms.extension import LOLLMSExtension, ExtensionBuilder
from lollms.personality import AIPersonality, PersonalityBuilder
from lollms.binding import LOLLMSConfig, BindingBuilder, LLMBinding, ModelBuilder, BindingType
from lollms.paths import LollmsPaths
from lollms.helpers import ASCIIColors, trace_exception
from lollms.com import NotificationType, NotificationDisplayType, LoLLMsCom
from lollms.app import LollmsApplication
2024-02-18 23:23:15 +00:00
from lollms.utilities import File64BitsManager, PromptReshaper, PackageManager, find_first_available_file_index, run_async, is_asyncio_loop_running, yes_or_no_input
from lollms.generation import RECEPTION_MANAGER, ROLE_CHANGE_DECISION, ROLE_CHANGE_OURTPUT
2024-01-21 04:35:29 +00:00
import git
2024-01-07 14:27:14 +00:00
import asyncio
2024-01-07 21:34:33 +00:00
import os
2024-01-29 21:21:45 +00:00
2024-01-05 02:40:55 +00:00
from safe_store import TextVectorizer, VectorizationMethod, VisualizationMethod
import threading
from tqdm import tqdm
import traceback
import sys
import gc
import ctypes
from functools import partial
import json
import shutil
import re
import string
import requests
from datetime import datetime
from typing import List, Tuple
import time
import numpy as np
from lollms.utilities import find_first_available_file_index, convert_language_name
if not PackageManager.check_package_installed("requests"):
PackageManager.install_package("requests")
if not PackageManager.check_package_installed("bs4"):
PackageManager.install_package("beautifulsoup4")
import requests
from bs4 import BeautifulSoup
def terminate_thread(thread):
if thread:
if not thread.is_alive():
ASCIIColors.yellow("Thread not alive")
return
thread_id = thread.ident
exc = ctypes.py_object(SystemExit)
res = ctypes.pythonapi.PyThreadState_SetAsyncExc(thread_id, exc)
if res > 1:
ctypes.pythonapi.PyThreadState_SetAsyncExc(thread_id, None)
del thread
gc.collect()
raise SystemError("Failed to terminate the thread.")
else:
ASCIIColors.yellow("Canceled successfully")# The current version of the webui
2024-02-15 00:02:40 +00:00
2024-02-23 20:20:37 +00:00
lollms_webui_version="9.5 (Alpha)"
2024-01-01 03:18:49 +00:00
2024-01-04 02:57:42 +00:00
class LOLLMSWebUI(LOLLMSElfServer):
2024-01-05 02:40:55 +00:00
__instance = None
@staticmethod
def build_instance(
config: LOLLMSConfig,
lollms_paths: LollmsPaths,
load_binding=True,
load_model=True,
load_voice_service=True,
load_sd_service=True,
try_select_binding=False,
try_select_model=False,
callback=None,
2024-01-15 19:38:54 +00:00
args=None,
2024-01-16 23:06:38 +00:00
sio = None
2024-01-05 02:40:55 +00:00
):
if LOLLMSWebUI.__instance is None:
LOLLMSWebUI(
config,
lollms_paths,
load_binding=load_binding,
load_model=load_model,
load_sd_service=load_sd_service,
load_voice_service=load_voice_service,
try_select_binding=try_select_binding,
try_select_model=try_select_model,
callback=callback,
2024-01-15 19:38:54 +00:00
args=args,
2024-01-16 23:06:38 +00:00
sio=sio
2024-01-05 02:40:55 +00:00
)
return LOLLMSWebUI.__instance
2024-01-01 03:18:49 +00:00
def __init__(
self,
config: LOLLMSConfig,
lollms_paths: LollmsPaths,
load_binding=True,
load_model=True,
2024-01-04 02:57:42 +00:00
load_voice_service=True,
load_sd_service=True,
2024-01-01 03:18:49 +00:00
try_select_binding=False,
try_select_model=False,
callback=None,
2024-01-15 19:38:54 +00:00
args=None,
2024-01-16 23:06:38 +00:00
sio=None
2024-01-01 03:18:49 +00:00
) -> None:
super().__init__(
config,
lollms_paths,
load_binding=load_binding,
load_model=load_model,
try_select_binding=try_select_binding,
try_select_model=try_select_model,
callback=callback,
2024-01-16 23:06:38 +00:00
sio=sio
2024-01-01 03:18:49 +00:00
)
2024-01-10 20:22:17 +00:00
self.app_name:str = "LOLLMSWebUI"
self.version:str = lollms_webui_version
2024-01-15 19:38:54 +00:00
self.args = args
2024-01-01 03:18:49 +00:00
2024-01-05 02:40:55 +00:00
self.busy = False
self.nb_received_tokens = 0
self.config_file_path = config.file_path
self.cancel_gen = False
2024-01-11 17:00:11 +00:00
if self.config.auto_update:
if self.check_update_():
ASCIIColors.info("New version found. Updating!")
self.run_update_script()
2024-01-05 02:40:55 +00:00
# Keeping track of current discussion and message
self._current_user_message_id = 0
self._current_ai_message_id = 0
self._message_id = 0
2024-02-18 23:23:15 +00:00
# migrate old databases to new ones:
databases_path = self.lollms_paths.personal_path/"databases"
if databases_path.exists() and len([f for f in databases_path.iterdir() if f.suffix==".db"])>0:
if yes_or_no_input("Old databases have been spotted on your system. Do you want me to migrate them to the new format?"):
databases_found = False
for database_path in databases_path.iterdir():
if database_path.suffix==".db":
ASCIIColors.red(f"Found old discussion database format : {database_path}")
ASCIIColors.red(f"Migrating to new format... ",end="")
new_db_path = self.lollms_paths.personal_discussions_path/database_path.stem
new_db_path.mkdir(exist_ok=True, parents=True)
try:
shutil.copy(database_path,new_db_path/"database.db")
ASCIIColors.green("ok")
databases_found = True
except Exception as ex:
ASCIIColors.warning(ex)
if databases_found:
ASCIIColors.green(f"Databases are migrated from {databases_path} to the new {self.lollms_paths.personal_discussions_path} path")
if yes_or_no_input("Databases are migrated to the new format. Do you want me to delete the previous version?"):
for database_path in databases_path.iterdir():
if database_path.suffix==".db":
ASCIIColors.red(f"Deleting {database_path}")
database_path.unlink()
if config["discussion_db_name"].endswith(".db"):
config["discussion_db_name"]=config["discussion_db_name"].replace(".db","")
config.save_config()
self.discussion_db_name = config["discussion_db_name"]
# Create database object
self.db = DiscussionsDB(self.lollms_paths, self.discussion_db_name)
2024-01-05 02:40:55 +00:00
# If the database is empty, populate it with tables
ASCIIColors.info("Checking discussions database... ",end="")
self.db.create_tables()
self.db.add_missing_columns()
ASCIIColors.success("ok")
# prepare vectorization
2024-02-26 21:59:03 +00:00
if self.config.data_vectorization_activate and self.config.activate_skills_lib:
2024-01-05 02:40:55 +00:00
try:
ASCIIColors.yellow("Loading long term memory")
2024-02-18 23:23:15 +00:00
folder = self.lollms_paths.personal_discussions_path/"vectorized_dbs"
2024-01-05 02:40:55 +00:00
folder.mkdir(parents=True, exist_ok=True)
self.build_long_term_skills_memory()
ASCIIColors.yellow("Ready")
except Exception as ex:
trace_exception(ex)
self.long_term_memory = None
else:
self.long_term_memory = None
# This is used to keep track of messages
self.download_infos={}
# Define a WebSocket event handler
2024-01-16 23:06:38 +00:00
@sio.event
async def connect(sid, environ):
self.session.add_client(sid, sid, self.db.load_last_discussion(), self.db)
2024-01-16 23:06:38 +00:00
await self.sio.emit('connected', to=sid)
ASCIIColors.success(f'Client {sid} connected')
2024-01-16 23:06:38 +00:00
@sio.event
def disconnect(sid):
try:
self.session.add_client(sid, sid, self.db.load_last_discussion(), self.db)
if self.session.get_client(sid).processing:
self.session.get_client(sid).schedule_for_deletion=True
else:
self.session.remove_client(sid, sid)
except Exception as ex:
pass
ASCIIColors.error(f'Client {sid} disconnected')
# generation status
self.generating=False
ASCIIColors.blue(f"Your personal data is stored here :",end="")
ASCIIColors.green(f"{self.lollms_paths.personal_path}")
2024-02-19 21:40:28 +00:00
self.start_servers()
2024-02-18 23:23:15 +00:00
def get_uploads_path(self, client_id):
return self.session.get_client(client_id).discussion_path # self.db.discussion_db_path/f'{["discussion"].discussion_id}'
2024-01-01 03:18:49 +00:00
# Other methods and properties of the LoLLMSWebUI singleton class
def check_module_update_(self, repo_path, branch_name="main"):
try:
# Open the repository
ASCIIColors.yellow(f"Checking for updates from {repo_path}")
repo = git.Repo(repo_path)
# Fetch updates from the remote for the specified branch
repo.remotes.origin.fetch(refspec=f"refs/heads/{branch_name}:refs/remotes/origin/{branch_name}")
# Compare the local and remote commit IDs for the specified branch
local_commit = repo.head.commit
remote_commit = repo.remotes.origin.refs[branch_name].commit
# Check if the local branch is behind the remote branch
is_behind = repo.is_ancestor(local_commit, remote_commit) and local_commit!= remote_commit
ASCIIColors.yellow(f"update availability: {is_behind}")
# Return True if the local branch is behind the remote branch
return is_behind
except Exception as e:
# Handle any errors that may occur during the fetch process
# trace_exception(e)
return False
def check_update_(self, branch_name="main"):
try:
# Open the repository
repo_path = str(Path(__file__).parent)
if self.check_module_update_(repo_path, branch_name):
return True
repo_path = str(Path(__file__).parent/"lollms_core")
if self.check_module_update_(repo_path, branch_name):
return True
repo_path = str(Path(__file__).parent/"utilities/safe_store")
if self.check_module_update_(repo_path, branch_name):
return True
return False
except Exception as e:
# Handle any errors that may occur during the fetch process
# trace_exception(e)
return False
def run_update_script(self, args=None):
update_script = Path(__file__).parent/"update_script.py"
# Convert Namespace object to a dictionary
if args:
args_dict = vars(args)
else:
args_dict = {}
# Filter out any key-value pairs where the value is None
valid_args = {key: value for key, value in args_dict.items() if value is not None}
# Save the arguments to a temporary file
temp_file = Path(__file__).parent/"temp_args.txt"
with open(temp_file, "w") as file:
# Convert the valid_args dictionary to a string in the format "key1 value1 key2 value2 ..."
arg_string = " ".join([f"--{key} {value}" for key, value in valid_args.items()])
file.write(arg_string)
os.system(f"python {update_script}")
sys.exit(0)
2024-01-07 21:34:33 +00:00
def run_restart_script(self, args):
restart_script = Path(__file__).parent/"restart_script.py"
# Convert Namespace object to a dictionary
args_dict = vars(args)
2024-01-07 21:34:33 +00:00
# Filter out any key-value pairs where the value is None
valid_args = {key: value for key, value in args_dict.items() if value is not None}
# Save the arguments to a temporary file
temp_file = Path(__file__).parent/"temp_args.txt"
with open(temp_file, "w") as file:
# Convert the valid_args dictionary to a string in the format "key1 value1 key2 value2 ..."
arg_string = " ".join([f"--{key} {value}" for key, value in valid_args.items()])
file.write(arg_string)
os.system(f"python {restart_script}")
sys.exit(0)
2024-01-10 20:22:17 +00:00
def audio_callback(self, text):
if self.summoned:
client_id = 0
self.cancel_gen = False
client = self.session.get_client(client_id)
client.generated_text=""
client.cancel_generation=False
client.continuing=False
client.first_chunk=True
if not self.model:
ASCIIColors.error("Model not selected. Please select a model")
self.error("Model not selected. Please select a model", client_id=client_id)
return
if not self.busy:
if client.discussion is None:
if self.db.does_last_discussion_have_messages():
client.discussion = self.db.create_discussion()
else:
client.discussion = self.db.load_last_discussion()
prompt = text
ump = self.config.discussion_prompt_separator +self.config.user_name.strip() if self.config.use_user_name_in_discussions else self.personality.user_message_prefix
message = client.discussion.add_message(
message_type = MSG_TYPE.MSG_TYPE_FULL.value,
sender_type = SENDER_TYPES.SENDER_TYPES_USER.value,
sender = ump.replace(self.config.discussion_prompt_separator,"").replace(":",""),
content=prompt,
metadata=None,
parent_message_id=self.message_id
)
ASCIIColors.green("Starting message generation by "+self.personality.name)
client.generation_thread = threading.Thread(target=self.start_message_generation, args=(message, message.id, client_id))
client.generation_thread.start()
2024-01-16 23:06:38 +00:00
self.sio.sleep(0.01)
ASCIIColors.info("Started generation task")
self.busy=True
#tpe = threading.Thread(target=self.start_message_generation, args=(message, message_id, client_id))
#tpe.start()
else:
self.error("I am busy. Come back later.", client_id=client_id)
else:
2024-02-10 11:12:44 +00:00
if "lollms" in text.lower():
self.summoned = True
def scrape_and_save(self, url, file_path):
# Send a GET request to the URL
response = requests.get(url)
# Parse the HTML content using BeautifulSoup
soup = BeautifulSoup(response.content, 'html.parser')
# Find all the text content in the webpage
text_content = soup.get_text()
# Remove extra returns and spaces
text_content = ' '.join(text_content.split())
# Save the text content as a text file
with open(file_path, 'w', encoding="utf-8") as file:
file.write(text_content)
self.info(f"Webpage content saved to {file_path}")
def rebuild_personalities(self, reload_all=False):
if reload_all:
self.mounted_personalities=[]
loaded = self.mounted_personalities
2024-03-01 00:34:54 +00:00
loaded_names = [f"{p.category}/{p.personality_folder_name}:{p.selected_language}" if p.selected_language else f"{p.category}/{p.personality_folder_name}" for p in loaded if p is not None]
mounted_personalities=[]
ASCIIColors.success(f" ╔══════════════════════════════════════════════════╗ ")
ASCIIColors.success(f" ║ Building mounted Personalities ║ ")
ASCIIColors.success(f" ╚══════════════════════════════════════════════════╝ ")
to_remove=[]
for i,personality in enumerate(self.config['personalities']):
if i==self.config["active_personality_id"]:
ASCIIColors.red("*", end="")
ASCIIColors.green(f" {personality}")
else:
ASCIIColors.yellow(f" {personality}")
if personality in loaded_names:
mounted_personalities.append(loaded[loaded_names.index(personality)])
else:
personality_path = f"{personality}" if not ":" in personality else f"{personality.split(':')[0]}"
try:
personality = AIPersonality(personality_path,
self.lollms_paths,
self.config,
model=self.model,
app=self,
selected_language=personality.split(":")[1] if ":" in personality else None,
run_scripts=True)
2024-02-11 17:29:24 +00:00
mounted_personalities.append(personality)
if self.config.enable_voice_service and self.config.auto_read and len(personality.audio_samples)>0:
try:
2024-01-10 20:22:17 +00:00
from lollms.services.xtts.lollms_xtts import LollmsXTTS
if self.tts is None:
2024-01-28 22:37:57 +00:00
self.tts = LollmsXTTS(self, voice_samples_path=Path(__file__).parent.parent/"voices", xtts_base_url= self.config.xtts_base_url)
except:
self.warning(f"Personality {personality.name} request using custom voice but couldn't load XTTS")
except Exception as ex:
ASCIIColors.error(f"Personality file not found or is corrupted ({personality_path}).\nReturned the following exception:{ex}\nPlease verify that the personality you have selected exists or select another personality. Some updates may lead to change in personality name or category, so check the personality selection in settings to be sure.")
ASCIIColors.info("Trying to force reinstall")
if self.config["debug"]:
print(ex)
try:
personality = AIPersonality(
personality_path,
self.lollms_paths,
self.config,
self.model,
app = self,
run_scripts=True,
selected_language=personality.split(":")[1] if ":" in personality else None,
installation_option=InstallOption.FORCE_INSTALL)
mounted_personalities.append(personality)
if personality.processor:
personality.processor.mounted()
except Exception as ex:
ASCIIColors.error(f"Couldn't load personality at {personality_path}")
trace_exception(ex)
ASCIIColors.info(f"Unmounting personality")
to_remove.append(i)
personality = AIPersonality(None,
self.lollms_paths,
self.config,
self.model,
app=self,
run_scripts=True,
installation_option=InstallOption.FORCE_INSTALL)
mounted_personalities.append(personality)
if personality.processor:
personality.processor.mounted()
ASCIIColors.info("Reverted to default personality")
if self.config["active_personality_id"]>=0 and self.config["active_personality_id"]<len(self.config["personalities"]):
ASCIIColors.success(f'selected model : {self.config["personalities"][self.config["active_personality_id"]]}')
else:
ASCIIColors.warning('An error was encountered while trying to mount personality')
ASCIIColors.success(f" ╔══════════════════════════════════════════════════╗ ")
ASCIIColors.success(f" ║ Done ║ ")
ASCIIColors.success(f" ╚══════════════════════════════════════════════════╝ ")
# Sort the indices in descending order to ensure correct removal
to_remove.sort(reverse=True)
# Remove elements from the list based on the indices
for index in to_remove:
if 0 <= index < len(mounted_personalities):
mounted_personalities.pop(index)
self.config["personalities"].pop(index)
ASCIIColors.info(f"removed personality {personality_path}")
if self.config["active_personality_id"]>=len(self.config["personalities"]):
self.config["active_personality_id"]=0
return mounted_personalities
def rebuild_extensions(self, reload_all=False):
if reload_all:
self.mounted_extensions=[]
loaded = self.mounted_extensions
loaded_names = [f"{p.category}/{p.extension_folder_name}" for p in loaded]
mounted_extensions=[]
ASCIIColors.success(f" ╔══════════════════════════════════════════════════╗ ")
ASCIIColors.success(f" ║ Building mounted Extensions ║ ")
ASCIIColors.success(f" ╚══════════════════════════════════════════════════╝ ")
to_remove=[]
for i,extension in enumerate(self.config['extensions']):
ASCIIColors.yellow(f" {extension}")
if extension in loaded_names:
mounted_extensions.append(loaded[loaded_names.index(extension)])
else:
extension_path = self.lollms_paths.extensions_zoo_path/f"{extension}"
try:
extension = ExtensionBuilder().build_extension(extension_path,self.lollms_paths, self)
mounted_extensions.append(extension)
except Exception as ex:
ASCIIColors.error(f"Extension file not found or is corrupted ({extension_path}).\nReturned the following exception:{ex}\nPlease verify that the personality you have selected exists or select another personality. Some updates may lead to change in personality name or category, so check the personality selection in settings to be sure.")
trace_exception(ex)
ASCIIColors.info("Trying to force reinstall")
if self.config["debug"]:
print(ex)
ASCIIColors.success(f" ╔══════════════════════════════════════════════════╗ ")
ASCIIColors.success(f" ║ Done ║ ")
ASCIIColors.success(f" ╚══════════════════════════════════════════════════╝ ")
# Sort the indices in descending order to ensure correct removal
to_remove.sort(reverse=True)
# Remove elements from the list based on the indices
for index in to_remove:
if 0 <= index < len(mounted_extensions):
mounted_extensions.pop(index)
self.config["extensions"].pop(index)
ASCIIColors.info(f"removed personality {extension_path}")
return mounted_extensions
# ================================== LOLLMSApp
#properties
@property
def message_id(self):
return self._message_id
@message_id.setter
def message_id(self, id):
self._message_id=id
@property
def current_user_message_id(self):
return self._current_user_message_id
@current_user_message_id.setter
def current_user_message_id(self, id):
self._current_user_message_id=id
self._message_id = id
@property
def current_ai_message_id(self):
return self._current_ai_message_id
@current_ai_message_id.setter
def current_ai_message_id(self, id):
self._current_ai_message_id=id
self._message_id = id
def download_file(self, url, installation_path, callback=None):
"""
Downloads a file from a URL, reports the download progress using a callback function, and displays a progress bar.
Args:
url (str): The URL of the file to download.
installation_path (str): The path where the file should be saved.
callback (function, optional): A callback function to be called during the download
with the progress percentage as an argument. Defaults to None.
"""
try:
response = requests.get(url, stream=True)
# Get the file size from the response headers
total_size = int(response.headers.get('content-length', 0))
with open(installation_path, 'wb') as file:
downloaded_size = 0
with tqdm(total=total_size, unit='B', unit_scale=True, ncols=80) as progress_bar:
for chunk in response.iter_content(chunk_size=8192):
if chunk:
file.write(chunk)
downloaded_size += len(chunk)
if callback is not None:
callback(downloaded_size, total_size)
progress_bar.update(len(chunk))
if callback is not None:
callback(total_size, total_size)
print("File downloaded successfully")
except Exception as e:
print("Couldn't download file:", str(e))
def clean_string(self, input_string):
# Remove extra spaces by replacing multiple spaces with a single space
#cleaned_string = re.sub(r'\s+', ' ', input_string)
# Remove extra line breaks by replacing multiple consecutive line breaks with a single line break
cleaned_string = re.sub(r'\n\s*\n', '\n', input_string)
# Create a string containing all punctuation characters
punctuation_chars = string.punctuation
# Define a regular expression pattern to match and remove non-alphanumeric characters
#pattern = f'[^a-zA-Z0-9\s{re.escape(punctuation_chars)}]' # This pattern matches any character that is not a letter, digit, space, or punctuation
pattern = f'[^a-zA-Z0-9\u00C0-\u017F\s{re.escape(punctuation_chars)}]'
# Use re.sub to replace the matched characters with an empty string
cleaned_string = re.sub(pattern, '', cleaned_string)
return cleaned_string
def make_discussion_title(self, discussion, client_id=None):
"""
Builds a title for a discussion
"""
# Get the list of messages
messages = discussion.get_messages()
discussion_messages = "!@>instruction: Create a short title to this discussion\n"
discussion_title = "\n!@>Discussion title:"
available_space = self.config.ctx_size - 150 - len(self.model.tokenize(discussion_messages))- len(self.model.tokenize(discussion_title))
# Initialize a list to store the full messages
full_message_list = []
# Accumulate messages until the cumulative number of tokens exceeds available_space
tokens_accumulated = 0
# Accumulate messages starting from message_index
for message in messages:
# Check if the message content is not empty and visible to the AI
if message.content != '' and (
message.message_type <= MSG_TYPE.MSG_TYPE_FULL_INVISIBLE_TO_USER.value and message.message_type != MSG_TYPE.MSG_TYPE_FULL_INVISIBLE_TO_AI.value):
# Tokenize the message content
message_tokenized = self.model.tokenize(
"\n" + self.config.discussion_prompt_separator + message.sender + ": " + message.content.strip())
# Check if adding the message will exceed the available space
if tokens_accumulated + len(message_tokenized) > available_space:
break
# Add the tokenized message to the full_message_list
full_message_list.insert(0, message_tokenized)
# Update the cumulative number of tokens
tokens_accumulated += len(message_tokenized)
# Build the final discussion messages by detokenizing the full_message_list
for message_tokens in full_message_list:
discussion_messages += self.model.detokenize(message_tokens)
discussion_messages += discussion_title
title = [""]
def receive(
chunk:str,
message_type:MSG_TYPE
):
if chunk:
title[0] += chunk
antiprompt = self.personality.detect_antiprompt(title[0])
if antiprompt:
ASCIIColors.warning(f"\nDetected hallucination with antiprompt: {antiprompt}")
title[0] = self.remove_text_from_string(title[0],antiprompt)
return False
else:
return True
self._generate(discussion_messages, 150, client_id, receive)
ASCIIColors.info(title[0])
return title[0]
def recover_discussion(self,client_id, message_index=-1):
messages = self.session.get_client(client_id).discussion.get_messages()
discussion=""
for msg in messages:
if message_index!=-1 and msg>message_index:
break
discussion += "\n" + self.config.discussion_prompt_separator + msg.sender + ": " + msg.content.strip()
return discussion
def get_discussion_to(self, client_id, message_id=-1):
messages = self.session.get_client(client_id).discussion.get_messages()
full_message_list = []
ump = self.config.discussion_prompt_separator +self.config.user_name.strip() if self.config.use_user_name_in_discussions else self.personality.user_message_prefix
for message in messages:
if message["id"]<= message_id or message_id==-1:
if message["type"]!=MSG_TYPE.MSG_TYPE_FULL_INVISIBLE_TO_USER:
if message["sender"]==self.personality.name:
full_message_list.append(self.personality.ai_message_prefix+message["content"])
else:
full_message_list.append(ump + message["content"])
link_text = "\n"# self.personality.link_text
if len(full_message_list) > self.config["nb_messages_to_remember"]:
discussion_messages = self.personality.personality_conditioning+ link_text.join(full_message_list[-self.config["nb_messages_to_remember"]:])
else:
discussion_messages = self.personality.personality_conditioning+ link_text.join(full_message_list)
return discussion_messages # Removes the last return
def notify(
self,
content,
notification_type:NotificationType=NotificationType.NOTIF_SUCCESS,
duration:int=4,
client_id=None,
display_type:NotificationDisplayType=NotificationDisplayType.TOAST,
2024-01-24 19:34:23 +00:00
verbose:bool|None=None,
):
2024-01-24 19:34:23 +00:00
if verbose is None:
verbose = self.verbose
2024-01-16 23:06:38 +00:00
run_async(partial(self.sio.emit,'notification', {
'content': content,
2024-01-07 10:45:10 +00:00
'notification_type': notification_type.value,
"duration": duration,
'display_type':display_type.value
}, to=client_id
)
)
if verbose:
if notification_type==NotificationType.NOTIF_SUCCESS:
ASCIIColors.success(content)
elif notification_type==NotificationType.NOTIF_INFO:
ASCIIColors.info(content)
elif notification_type==NotificationType.NOTIF_WARNING:
ASCIIColors.warning(content)
else:
ASCIIColors.red(content)
def new_message(self,
client_id,
sender=None,
content="",
parameters=None,
metadata=None,
ui=None,
message_type:MSG_TYPE=MSG_TYPE.MSG_TYPE_FULL,
sender_type:SENDER_TYPES=SENDER_TYPES.SENDER_TYPES_AI,
open=False
):
client = self.session.get_client(client_id)
2024-02-08 23:44:38 +00:00
self.close_message(client_id)
mtdt = metadata if metadata is None or type(metadata) == str else json.dumps(metadata, indent=4)
if sender==None:
sender= self.personality.name
msg = client.discussion.add_message(
message_type = message_type.value,
sender_type = sender_type.value,
sender = sender,
content = content,
metadata = mtdt,
ui = ui,
rank = 0,
parent_message_id = client.discussion.current_message.id,
binding = self.config["binding_name"],
model = self.config["model_name"],
personality = self.config["personalities"][self.config["active_personality_id"]],
) # first the content is empty, but we'll fill it at the end
2024-01-08 00:38:42 +00:00
run_async(partial(
2024-01-16 23:06:38 +00:00
self.sio.emit,'new_message',
2024-01-08 00:38:42 +00:00
{
"sender": sender,
"message_type": message_type.value,
"sender_type": SENDER_TYPES.SENDER_TYPES_AI.value,
"content": content,
"parameters": parameters,
"metadata": metadata,
"ui": ui,
"id": msg.id,
"parent_message_id": msg.parent_message_id,
'binding': self.config["binding_name"],
'model' : self.config["model_name"],
'personality': self.config["personalities"][self.config["active_personality_id"]],
'created_at': client.discussion.current_message.created_at,
'finished_generating_at': client.discussion.current_message.finished_generating_at,
2024-01-08 00:38:42 +00:00
'open': open
}, to=client_id
)
2024-01-07 14:27:14 +00:00
)
2024-01-08 00:38:42 +00:00
def update_message(self, client_id, chunk,
parameters=None,
metadata=[],
ui=None,
msg_type:MSG_TYPE=None
):
client = self.session.get_client(client_id)
client.discussion.current_message.finished_generating_at=datetime.now().strftime('%Y-%m-%d %H:%M:%S')
mtdt = json.dumps(metadata, indent=4) if metadata is not None and type(metadata)== list else metadata
if self.nb_received_tokens==1:
2024-01-09 00:15:51 +00:00
run_async(
2024-01-16 23:06:38 +00:00
partial(self.sio.emit,'update_message', {
2024-01-07 14:27:14 +00:00
"sender": self.personality.name,
'id':client.discussion.current_message.id,
'content': "✍ warming up ...",
2024-01-07 14:27:14 +00:00
'ui': ui,
'discussion_id':client.discussion.discussion_id,
2024-01-07 14:27:14 +00:00
'message_type': MSG_TYPE.MSG_TYPE_STEP_END.value,
'finished_generating_at': client.discussion.current_message.finished_generating_at,
2024-01-07 14:27:14 +00:00
'parameters':parameters,
'metadata':metadata
}, to=client_id
)
)
2024-01-09 00:15:51 +00:00
run_async(
2024-01-16 23:06:38 +00:00
partial(self.sio.emit,'update_message', {
"sender": self.personality.name,
'id':client.discussion.current_message.id,
'content': chunk,
'ui': ui,
'discussion_id':client.discussion.discussion_id,
2024-01-07 14:27:14 +00:00
'message_type': msg_type.value if msg_type is not None else MSG_TYPE.MSG_TYPE_CHUNK.value if self.nb_received_tokens>1 else MSG_TYPE.MSG_TYPE_FULL.value,
'finished_generating_at': client.discussion.current_message.finished_generating_at,
'parameters':parameters,
'metadata':metadata
2024-01-07 10:45:10 +00:00
}, to=client_id
)
2024-01-07 14:27:14 +00:00
)
if msg_type != MSG_TYPE.MSG_TYPE_INFO:
client.discussion.update_message(client.generated_text, new_metadata=mtdt, new_ui=ui)
def close_message(self, client_id):
client = self.session.get_client(client_id)
if not client.discussion:
return
#fix halucination
client.generated_text=client.generated_text.split("!@>")[0]
# Send final message
client.discussion.current_message.finished_generating_at=datetime.now().strftime('%Y-%m-%d %H:%M:%S')
2024-01-09 00:15:51 +00:00
run_async(
2024-01-16 23:06:38 +00:00
partial(self.sio.emit,'close_message', {
2024-01-07 14:27:14 +00:00
"sender": self.personality.name,
"id": client.discussion.current_message.id,
"content":client.generated_text,
2024-01-07 14:27:14 +00:00
'binding': self.config["binding_name"],
'model' : self.config["model_name"],
'personality':self.config["personalities"][self.config["active_personality_id"]],
'created_at': client.discussion.current_message.created_at,
'finished_generating_at': client.discussion.current_message.finished_generating_at,
2024-01-07 14:27:14 +00:00
}, to=client_id
)
)
def process_chunk(
self,
chunk:str,
message_type:MSG_TYPE,
parameters:dict=None,
metadata:list=None,
client_id:int=0,
personality:AIPersonality=None
):
"""
Processes a chunk of generated text
"""
client = self.session.get_client(client_id)
if chunk is None:
return True
if not client_id in list(self.session.clients.keys()):
self.error("Connection lost", client_id=client_id)
return
if message_type == MSG_TYPE.MSG_TYPE_STEP:
ASCIIColors.info("--> Step:"+chunk)
if message_type == MSG_TYPE.MSG_TYPE_STEP_START:
ASCIIColors.info("--> Step started:"+chunk)
if message_type == MSG_TYPE.MSG_TYPE_STEP_END:
if parameters['status']:
ASCIIColors.success("--> Step ended:"+chunk)
else:
ASCIIColors.error("--> Step ended:"+chunk)
if message_type == MSG_TYPE.MSG_TYPE_EXCEPTION:
self.error(chunk, client_id=client_id)
ASCIIColors.error("--> Exception from personality:"+chunk)
if message_type == MSG_TYPE.MSG_TYPE_WARNING:
self.warning(chunk,client_id=client_id)
ASCIIColors.error("--> Exception from personality:"+chunk)
if message_type == MSG_TYPE.MSG_TYPE_INFO:
self.info(chunk, client_id=client_id)
ASCIIColors.info("--> Info:"+chunk)
if message_type == MSG_TYPE.MSG_TYPE_UI:
self.update_message(client_id, "", parameters, metadata, chunk, MSG_TYPE.MSG_TYPE_UI)
if message_type == MSG_TYPE.MSG_TYPE_NEW_MESSAGE:
self.nb_received_tokens = 0
self.start_time = datetime.now()
2024-01-09 23:08:41 +00:00
self.new_message(
2024-01-07 14:27:14 +00:00
client_id,
self.personality.name if personality is None else personality.name,
chunk if parameters["type"]!=MSG_TYPE.MSG_TYPE_UI.value else '',
metadata = [{
"title":chunk,
"content":parameters["metadata"]
}
] if parameters["type"]==MSG_TYPE.MSG_TYPE_JSON_INFOS.value else None,
ui= chunk if parameters["type"]==MSG_TYPE.MSG_TYPE_UI.value else None,
2024-01-09 23:08:41 +00:00
message_type= MSG_TYPE(parameters["type"])
2024-01-07 14:27:14 +00:00
)
elif message_type == MSG_TYPE.MSG_TYPE_FINISHED_MESSAGE:
self.close_message(client_id)
elif message_type == MSG_TYPE.MSG_TYPE_CHUNK:
2024-01-21 04:35:29 +00:00
if self.nb_received_tokens==0:
self.start_time = datetime.now()
2024-02-11 17:29:24 +00:00
try:
self.update_message(client_id, "✍ warming up ...", msg_type=MSG_TYPE.MSG_TYPE_STEP_END, parameters= {'status':True})
self.update_message(client_id, "Generating ...", msg_type=MSG_TYPE.MSG_TYPE_STEP_START)
except Exception as ex:
ASCIIColors.warning("Couldn't send status update to client")
dt =(datetime.now() - self.start_time).seconds
if dt==0:
dt=1
spd = self.nb_received_tokens/dt
ASCIIColors.green(f"Received {self.nb_received_tokens} tokens (speed: {spd:.2f}t/s) ",end="\r",flush=True)
sys.stdout = sys.__stdout__
sys.stdout.flush()
if chunk:
2024-01-21 04:35:29 +00:00
client.generated_text += chunk
antiprompt = self.personality.detect_antiprompt(client.generated_text)
if antiprompt:
ASCIIColors.warning(f"\nDetected hallucination with antiprompt: {antiprompt}")
client.generated_text = self.remove_text_from_string(client.generated_text,antiprompt)
self.update_message(client_id, client.generated_text, parameters, metadata, None, MSG_TYPE.MSG_TYPE_FULL)
return False
else:
self.nb_received_tokens += 1
if client.continuing and client.first_chunk:
self.update_message(client_id, client.generated_text, parameters, metadata)
else:
self.update_message(client_id, chunk, parameters, metadata, msg_type=MSG_TYPE.MSG_TYPE_CHUNK)
client.first_chunk=False
# if stop generation is detected then stop
if not self.cancel_gen:
return True
else:
self.cancel_gen = False
ASCIIColors.warning("Generation canceled")
return False
# Stream the generated text to the main process
elif message_type == MSG_TYPE.MSG_TYPE_FULL:
client.generated_text = chunk
self.nb_received_tokens += 1
dt =(datetime.now() - self.start_time).seconds
if dt==0:
dt=1
spd = self.nb_received_tokens/dt
ASCIIColors.green(f"Received {self.nb_received_tokens} tokens (speed: {spd:.2f}t/s) ",end="\r",flush=True)
antiprompt = self.personality.detect_antiprompt(client.generated_text)
if antiprompt:
ASCIIColors.warning(f"\nDetected hallucination with antiprompt: {antiprompt}")
client.generated_text = self.remove_text_from_string(client.generated_text,antiprompt)
self.update_message(client_id, client.generated_text, parameters, metadata, None, MSG_TYPE.MSG_TYPE_FULL)
return False
self.update_message(client_id, chunk, parameters, metadata, ui=None, msg_type=message_type)
return True
# Stream the generated text to the frontend
else:
self.update_message(client_id, chunk, parameters, metadata, ui=None, msg_type=message_type)
return True
2024-01-10 20:22:17 +00:00
def generate(self, full_prompt, prompt, context_details, n_predict, client_id, callback=None):
if self.personality.processor is not None:
ASCIIColors.info("Running workflow")
try:
self.personality.callback = callback
2024-02-26 07:56:42 +00:00
self.personality.processor.run_workflow(prompt, full_prompt, callback, context_details)
except Exception as ex:
trace_exception(ex)
# Catch the exception and get the traceback as a list of strings
traceback_lines = traceback.format_exception(type(ex), ex, ex.__traceback__)
# Join the traceback lines into a single string
traceback_text = ''.join(traceback_lines)
ASCIIColors.error(f"Workflow run failed.\nError:{ex}")
ASCIIColors.error(traceback_text)
if callback:
callback(f"Workflow run failed\nError:{ex}", MSG_TYPE.MSG_TYPE_EXCEPTION)
print("Finished executing the workflow")
return
self._generate(full_prompt, n_predict, client_id, callback)
ASCIIColors.success("\nFinished executing the generation")
def _generate(self, prompt, n_predict, client_id, callback=None):
self.nb_received_tokens = 0
self.start_time = datetime.now()
if self.model is not None:
if self.model.binding_type==BindingType.TEXT_IMAGE and len(self.personality.image_files)>0:
ASCIIColors.info(f"warmup for generating up to {n_predict} tokens")
if self.config["override_personality_model_parameters"]:
output = self.model.generate_with_images(
prompt,
self.personality.image_files,
callback=callback,
n_predict=n_predict,
temperature=self.config['temperature'],
top_k=self.config['top_k'],
top_p=self.config['top_p'],
repeat_penalty=self.config['repeat_penalty'],
repeat_last_n = self.config['repeat_last_n'],
seed=self.config['seed'],
n_threads=self.config['n_threads']
)
else:
output = self.model.generate_with_images(
prompt,
self.personality.image_files,
callback=callback,
n_predict=min(n_predict,self.personality.model_n_predicts),
temperature=self.personality.model_temperature,
top_k=self.personality.model_top_k,
top_p=self.personality.model_top_p,
repeat_penalty=self.personality.model_repeat_penalty,
repeat_last_n = self.personality.model_repeat_last_n,
seed=self.config['seed'],
n_threads=self.config['n_threads']
)
else:
ASCIIColors.info(f"warmup for generating up to {n_predict} tokens")
if self.config["override_personality_model_parameters"]:
output = self.model.generate(
prompt,
callback=callback,
n_predict=n_predict,
temperature=self.config['temperature'],
top_k=self.config['top_k'],
top_p=self.config['top_p'],
repeat_penalty=self.config['repeat_penalty'],
repeat_last_n = self.config['repeat_last_n'],
seed=self.config['seed'],
n_threads=self.config['n_threads']
)
else:
output = self.model.generate(
prompt,
callback=callback,
n_predict=min(n_predict,self.personality.model_n_predicts),
temperature=self.personality.model_temperature,
top_k=self.personality.model_top_k,
top_p=self.personality.model_top_p,
repeat_penalty=self.personality.model_repeat_penalty,
repeat_last_n = self.personality.model_repeat_last_n,
seed=self.config['seed'],
n_threads=self.config['n_threads']
)
else:
print("No model is installed or selected. Please make sure to install a model and select it inside your configuration before attempting to communicate with the model.")
print("To do this: Install the model to your models/<binding name> folder.")
print("Then set your model information in your local configuration file that you can find in configs/local_config.yaml")
print("You can also use the ui to set your model in the settings page.")
output = ""
return output
def start_message_generation(self, message, message_id, client_id, is_continue=False, generation_type=None):
client = self.session.get_client(client_id)
if self.personality is None:
self.warning("Select a personality")
return
ASCIIColors.info(f"Text generation requested by client: {client_id}")
# send the message to the bot
print(f"Received message : {message.content}")
if client.discussion:
try:
2024-02-11 01:09:31 +00:00
if not self.model:
self.error("No model selected. Please make sure you select a model before starting generation", client_id=client_id)
return
# First we need to send the new message ID to the client
if is_continue:
client.discussion.load_message(message_id)
client.generated_text = message.content
2024-02-11 01:09:31 +00:00
else:
self.new_message(client_id, self.personality.name, "")
self.update_message(client_id, "✍ warming up ...", msg_type=MSG_TYPE.MSG_TYPE_STEP_START)
# prepare query and reception
self.discussion_messages, self.current_message, tokens, context_details, internet_search_infos = self.prepare_query(client_id, message_id, is_continue, n_tokens=self.config.min_n_predict, generation_type=generation_type)
self.prepare_reception(client_id)
self.generating = True
client.processing=True
2024-02-11 01:09:31 +00:00
try:
self.generate(
self.discussion_messages,
self.current_message,
context_details=context_details,
n_predict = self.config.ctx_size-len(tokens)-1,
client_id=client_id,
callback=partial(self.process_chunk,client_id = client_id)
)
if self.config.enable_voice_service and self.config.auto_read and len(self.personality.audio_samples)>0:
try:
self.process_chunk("Generating voice output",MSG_TYPE.MSG_TYPE_STEP_START,client_id=client_id)
from lollms.services.xtts.lollms_xtts import LollmsXTTS
if self.tts is None:
self.tts = LollmsXTTS(self, voice_samples_path=Path(__file__).parent.parent/"voices", xtts_base_url= self.config.xtts_base_url)
language = convert_language_name(self.personality.language)
self.tts.set_speaker_folder(Path(self.personality.audio_samples[0]).parent)
fn = self.personality.name.lower().replace(' ',"_").replace('.','')
fn = f"{fn}_{message_id}.wav"
url = f"audio/{fn}"
self.tts.tts_to_file(client.generated_text, Path(self.personality.audio_samples[0]).name, f"{fn}", language=language)
2024-02-11 01:09:31 +00:00
fl = f"\n".join([
f"<audio controls>",
f' <source src="{url}" type="audio/wav">',
f' Your browser does not support the audio element.',
f'</audio>'
])
self.process_chunk("Generating voice output", MSG_TYPE.MSG_TYPE_STEP_END, {'status':True},client_id=client_id)
self.process_chunk(fl,MSG_TYPE.MSG_TYPE_UI, client_id=client_id)
2024-02-11 01:09:31 +00:00
"""
self.info("Creating audio output",10)
self.personality.step_start("Creating audio output")
if not PackageManager.check_package_installed("tortoise"):
PackageManager.install_package("tortoise-tts")
from tortoise import utils, api
import sounddevice as sd
if self.tts is None:
self.tts = api.TextToSpeech( kv_cache=True, half=True)
reference_clips = [utils.audio.load_audio(str(p), 22050) for p in self.personality.audio_samples]
tk = self.model.tokenize(client.generated_text)
2024-02-11 01:09:31 +00:00
if len(tk)>100:
chunk_size = 100
for i in range(0, len(tk), chunk_size):
chunk = self.model.detokenize(tk[i:i+chunk_size])
if i==0:
pcm_audio = self.tts.tts_with_preset(chunk, voice_samples=reference_clips, preset='fast').numpy().flatten()
else:
pcm_audio = np.concatenate([pcm_audio, self.tts.tts_with_preset(chunk, voice_samples=reference_clips, preset='ultra_fast').numpy().flatten()])
else:
pcm_audio = self.tts.tts_with_preset(client.generated_text, voice_samples=reference_clips, preset='fast').numpy().flatten()
2024-02-11 01:09:31 +00:00
sd.play(pcm_audio, 22050)
self.personality.step_end("Creating audio output")
"""
except Exception as ex:
ASCIIColors.error("Couldn't read")
trace_exception(ex)
print()
ASCIIColors.success("## Done Generation ##")
print()
except Exception as ex:
trace_exception(ex)
print()
ASCIIColors.error("## Generation Error ##")
print()
self.cancel_gen = False
# Send final message
if self.config.activate_internet_search:
from lollms.internet import get_favicon_url, get_root_url
sources_text = '<div class="mt-4 flex flex-wrap items-center gap-x-2 gap-y-1.5 text-sm ">'
sources_text += '<div class="text-gray-400 mr-10px">Sources:</div>'
for source in internet_search_infos:
url = source["url"]
title = source["title"]
brief = source["brief"]
favicon_url = get_favicon_url(url)
if favicon_url is None:
favicon_url ="/personalities/internet/loi/assets/logo.png"
root_url = get_root_url(url)
sources_text += "\n".join([
f'<a class="relative flex items-center gap-2 whitespace-nowrap rounded-lg border bg-white px-2 py-1.5 leading-none hover:border-gray-300 dark:border-gray-800 dark:bg-gray-900 dark:hover:border-gray-700" target="_blank" href="{url}" title="{brief}">',
f' <img class="h-3.5 w-3.5 rounded" src="{favicon_url}">',
f' <div>{root_url}</div>',
f'</a>',
])
sources_text += '</div>'
client.generated_text=client.generated_text.split("!@>")[0] + "\n" + sources_text
self.personality.full(client.generated_text)
except Exception as ex:
trace_exception(ex)
self.close_message(client_id)
2024-02-10 20:35:27 +00:00
self.update_message(client_id, "Generating ...", msg_type=MSG_TYPE.MSG_TYPE_STEP_END)
2024-02-10 10:33:09 +00:00
client.processing=False
if client.schedule_for_deletion:
self.session.remove_client(client.client_id, client.client_id)
ASCIIColors.success(f" ╔══════════════════════════════════════════════════╗ ")
ASCIIColors.success(f" ║ Done ║ ")
ASCIIColors.success(f" ╚══════════════════════════════════════════════════╝ ")
if self.config.auto_title:
d = client.discussion
ttl = d.title()
if ttl is None or ttl=="" or ttl=="untitled":
title = self.make_discussion_title(d, client_id=client_id)
d.rename(title)
2024-01-08 00:38:42 +00:00
asyncio.run(
2024-01-16 23:06:38 +00:00
self.sio.emit('disucssion_renamed',{
2024-01-27 18:44:58 +00:00
'status': True,
'discussion_id':d.discussion_id,
'title':title
}, to=client_id)
2024-01-07 14:27:14 +00:00
)
self.busy=False
else:
ump = self.config.discussion_prompt_separator +self.config.user_name.strip() if self.config.use_user_name_in_discussions else self.personality.user_message_prefix
self.cancel_gen = False
#No discussion available
ASCIIColors.warning("No discussion selected!!!")
self.error("No discussion selected!!!", client_id=client_id)
print()
self.busy=False
2024-01-07 21:34:33 +00:00
return ""