mirror of
https://github.com/ParisNeo/lollms-webui.git
synced 2025-01-05 12:04:08 +00:00
configuration is now percistant
This commit is contained in:
parent
8f93b856c1
commit
cc24c28188
129
app.py
129
app.py
@ -32,14 +32,15 @@ from pathlib import Path
|
|||||||
import gc
|
import gc
|
||||||
app = Flask("GPT4All-WebUI", static_url_path="/static", static_folder="static")
|
app = Flask("GPT4All-WebUI", static_url_path="/static", static_folder="static")
|
||||||
import time
|
import time
|
||||||
|
from config import load_config
|
||||||
|
|
||||||
class Gpt4AllWebUI:
|
class Gpt4AllWebUI:
|
||||||
|
|
||||||
def __init__(self, _app, args) -> None:
|
def __init__(self, _app, config:dict) -> None:
|
||||||
self.args = args
|
self.config = config
|
||||||
self.current_discussion = None
|
self.current_discussion = None
|
||||||
self.app = _app
|
self.app = _app
|
||||||
self.db_path = args.db_path
|
self.db_path = config["db_path"]
|
||||||
self.db = DiscussionsDB(self.db_path)
|
self.db = DiscussionsDB(self.db_path)
|
||||||
# If the database is empty, populate it with tables
|
# If the database is empty, populate it with tables
|
||||||
self.db.populate()
|
self.db.populate()
|
||||||
@ -92,7 +93,7 @@ class Gpt4AllWebUI:
|
|||||||
)
|
)
|
||||||
|
|
||||||
self.add_endpoint(
|
self.add_endpoint(
|
||||||
"/get_args", "get_args", self.get_args, methods=["GET"]
|
"/get_config", "get_config", self.get_config, methods=["GET"]
|
||||||
)
|
)
|
||||||
|
|
||||||
self.add_endpoint(
|
self.add_endpoint(
|
||||||
@ -128,9 +129,9 @@ class Gpt4AllWebUI:
|
|||||||
|
|
||||||
def create_chatbot(self):
|
def create_chatbot(self):
|
||||||
return Model(
|
return Model(
|
||||||
ggml_model=f"./models/{self.args.model}",
|
ggml_model=f"./models/{self.config['model']}",
|
||||||
n_ctx=self.args.ctx_size,
|
n_ctx=self.config['ctx_size'],
|
||||||
seed=self.args.seed,
|
seed=self.config['seed'],
|
||||||
)
|
)
|
||||||
|
|
||||||
def condition_chatbot(self, conditionning_message = """
|
def condition_chatbot(self, conditionning_message = """
|
||||||
@ -151,23 +152,6 @@ GPT4All:Welcome! I'm here to assist you with anything you need. What can I do fo
|
|||||||
self.full_message_list.append(conditionning_message)
|
self.full_message_list.append(conditionning_message)
|
||||||
|
|
||||||
|
|
||||||
# self.prepare_query(conditionning_message)
|
|
||||||
# self.chatbot_bindings.generate(
|
|
||||||
# conditionning_message,
|
|
||||||
# new_text_callback=self.new_text_callback,
|
|
||||||
|
|
||||||
# n_predict=len(conditionning_message),
|
|
||||||
# temp=self.args.temp,
|
|
||||||
# top_k=self.args.top_k,
|
|
||||||
# top_p=self.args.top_p,
|
|
||||||
# repeat_penalty=self.args.repeat_penalty,
|
|
||||||
# repeat_last_n = self.args.repeat_last_n,
|
|
||||||
# seed=self.args.seed,
|
|
||||||
# n_threads=8
|
|
||||||
# )
|
|
||||||
# print(f"Bot said:{self.bot_says}")
|
|
||||||
|
|
||||||
|
|
||||||
def prepare_query(self):
|
def prepare_query(self):
|
||||||
self.bot_says = ""
|
self.bot_says = ""
|
||||||
self.full_text = ""
|
self.full_text = ""
|
||||||
@ -229,13 +213,13 @@ GPT4All:Welcome! I'm here to assist you with anything you need. What can I do fo
|
|||||||
self.chatbot_bindings.generate(
|
self.chatbot_bindings.generate(
|
||||||
self.prompt_message,#self.full_message,#self.current_message,
|
self.prompt_message,#self.full_message,#self.current_message,
|
||||||
new_text_callback=self.new_text_callback,
|
new_text_callback=self.new_text_callback,
|
||||||
n_predict=len(self.current_message)+self.args.n_predict,
|
n_predict=len(self.current_message)+self.config['n_predict'],
|
||||||
temp=self.args.temp,
|
temp=self.config['temp'],
|
||||||
top_k=self.args.top_k,
|
top_k=self.config['top_k'],
|
||||||
top_p=self.args.top_p,
|
top_p=self.config['top_p'],
|
||||||
repeat_penalty=self.args.repeat_penalty,
|
repeat_penalty=self.config['repeat_penalty'],
|
||||||
repeat_last_n = self.args.repeat_last_n,
|
repeat_last_n = self.config['repeat_last_n'],
|
||||||
#seed=self.args.seed,
|
#seed=self.config['seed'],
|
||||||
n_threads=8
|
n_threads=8
|
||||||
)
|
)
|
||||||
self.generating=False
|
self.generating=False
|
||||||
@ -327,11 +311,11 @@ GPT4All:Welcome! I'm here to assist you with anything you need. What can I do fo
|
|||||||
self.prompt_message,#full_message,
|
self.prompt_message,#full_message,
|
||||||
new_text_callback=self.new_text_callback,
|
new_text_callback=self.new_text_callback,
|
||||||
n_predict=0,#len(full_message),
|
n_predict=0,#len(full_message),
|
||||||
temp=self.args.temp,
|
temp=self.config['temp'],
|
||||||
top_k=self.args.top_k,
|
top_k=self.config['top_k'],
|
||||||
top_p=self.args.top_p,
|
top_p=self.config['top_p'],
|
||||||
repeat_penalty= self.args.repeat_penalty,
|
repeat_penalty= self.config['repeat_penalty'],
|
||||||
repeat_last_n = self.args.repeat_last_n,
|
repeat_last_n = self.config['repeat_last_n'],
|
||||||
n_threads=8
|
n_threads=8
|
||||||
)
|
)
|
||||||
|
|
||||||
@ -390,33 +374,33 @@ GPT4All:Welcome! I'm here to assist you with anything you need. What can I do fo
|
|||||||
def update_model_params(self):
|
def update_model_params(self):
|
||||||
data = request.get_json()
|
data = request.get_json()
|
||||||
model = str(data["model"])
|
model = str(data["model"])
|
||||||
if self.args.model != model:
|
if self.config['model'] != model:
|
||||||
print("New model selected")
|
print("New model selected")
|
||||||
self.args.model = model
|
self.config['model'] = model
|
||||||
self.prepare_a_new_chatbot()
|
self.prepare_a_new_chatbot()
|
||||||
|
|
||||||
self.args.n_predict = int(data["nPredict"])
|
self.config['n_predict'] = int(data["nPredict"])
|
||||||
self.args.seed = int(data["seed"])
|
self.config['seed'] = int(data["seed"])
|
||||||
|
|
||||||
self.args.temp = float(data["temp"])
|
self.config['temp'] = float(data["temp"])
|
||||||
self.args.top_k = int(data["topK"])
|
self.config['top_k'] = int(data["topK"])
|
||||||
self.args.top_p = float(data["topP"])
|
self.config['top_p'] = float(data["topP"])
|
||||||
self.args.repeat_penalty = int(data["repeatPenalty"])
|
self.config['repeat_penalty'] = float(data["repeatPenalty"])
|
||||||
self.args.repeat_last_n = int(data["repeatLastN"])
|
self.config['repeat_last_n'] = int(data["repeatLastN"])
|
||||||
|
|
||||||
print("Parameters changed to:")
|
print("Parameters changed to:")
|
||||||
print(f"\tTemperature:{self.args.temp}")
|
print(f"\tTemperature:{self.config['temp']}")
|
||||||
print(f"\tNPredict:{self.args.n_predict}")
|
print(f"\tNPredict:{self.config['n_predict']}")
|
||||||
print(f"\tSeed:{self.args.seed}")
|
print(f"\tSeed:{self.config['seed']}")
|
||||||
print(f"\top_k:{self.args.top_k}")
|
print(f"\top_k:{self.config['top_k']}")
|
||||||
print(f"\top_p:{self.args.top_p}")
|
print(f"\top_p:{self.config['top_p']}")
|
||||||
print(f"\trepeat_penalty:{self.args.repeat_penalty}")
|
print(f"\trepeat_penalty:{self.config['repeat_penalty']}")
|
||||||
print(f"\trepeat_last_n:{self.args.repeat_last_n}")
|
print(f"\trepeat_last_n:{self.config['repeat_last_n']}")
|
||||||
return jsonify({"status":"ok"})
|
return jsonify({"status":"ok"})
|
||||||
|
|
||||||
|
|
||||||
def get_args(self):
|
def get_config(self):
|
||||||
return jsonify(self.args)
|
return jsonify(self.config)
|
||||||
|
|
||||||
def help(self):
|
def help(self):
|
||||||
return render_template("help.html")
|
return render_template("help.html")
|
||||||
@ -432,40 +416,40 @@ GPT4All:Welcome! I'm here to assist you with anything you need. What can I do fo
|
|||||||
if __name__ == "__main__":
|
if __name__ == "__main__":
|
||||||
parser = argparse.ArgumentParser(description="Start the chatbot Flask app.")
|
parser = argparse.ArgumentParser(description="Start the chatbot Flask app.")
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"-s", "--seed", type=int, default=0, help="Force using a specific model."
|
"-s", "--seed", type=int, default=None, help="Force using a specific model."
|
||||||
)
|
)
|
||||||
|
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"-m", "--model", type=str, default="gpt4all-lora-quantized-ggml.bin", help="Force using a specific model."
|
"-m", "--model", type=str, default=None, help="Force using a specific model."
|
||||||
)
|
)
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"--temp", type=float, default=0.1, help="Temperature parameter for the model."
|
"--temp", type=float, default=None, help="Temperature parameter for the model."
|
||||||
)
|
)
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"--n_predict",
|
"--n_predict",
|
||||||
type=int,
|
type=int,
|
||||||
default=256,
|
default=None,
|
||||||
help="Number of tokens to predict at each step.",
|
help="Number of tokens to predict at each step.",
|
||||||
)
|
)
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"--top_k", type=int, default=40, help="Value for the top-k sampling."
|
"--top_k", type=int, default=None, help="Value for the top-k sampling."
|
||||||
)
|
)
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"--top_p", type=float, default=0.95, help="Value for the top-p sampling."
|
"--top_p", type=float, default=None, help="Value for the top-p sampling."
|
||||||
)
|
)
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"--repeat_penalty", type=float, default=1.3, help="Penalty for repeated tokens."
|
"--repeat_penalty", type=float, default=None, help="Penalty for repeated tokens."
|
||||||
)
|
)
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"--repeat_last_n",
|
"--repeat_last_n",
|
||||||
type=int,
|
type=int,
|
||||||
default=64,
|
default=None,
|
||||||
help="Number of previous tokens to consider for the repeat penalty.",
|
help="Number of previous tokens to consider for the repeat penalty.",
|
||||||
)
|
)
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"--ctx_size",
|
"--ctx_size",
|
||||||
type=int,
|
type=int,
|
||||||
default=512,#2048,
|
default=None,#2048,
|
||||||
help="Size of the context window for the model.",
|
help="Size of the context window for the model.",
|
||||||
)
|
)
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
@ -477,19 +461,26 @@ if __name__ == "__main__":
|
|||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"--host", type=str, default="localhost", help="the hostname to listen on"
|
"--host", type=str, default="localhost", help="the hostname to listen on"
|
||||||
)
|
)
|
||||||
parser.add_argument("--port", type=int, default=9600, help="the port to listen on")
|
parser.add_argument("--port", type=int, default=None, help="the port to listen on")
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"--db_path", type=str, default="database.db", help="Database path"
|
"--db_path", type=str, default=None, help="Database path"
|
||||||
)
|
)
|
||||||
parser.set_defaults(debug=False)
|
parser.set_defaults(debug=False)
|
||||||
args = parser.parse_args()
|
args = parser.parse_args()
|
||||||
|
config_file_path = "configs/default.yaml"
|
||||||
|
config = load_config(config_file_path)
|
||||||
|
|
||||||
|
# Override values in config with command-line arguments
|
||||||
|
for arg_name, arg_value in vars(args).items():
|
||||||
|
if arg_value is not None:
|
||||||
|
config[arg_name] = arg_value
|
||||||
|
|
||||||
executor = ThreadPoolExecutor(max_workers=2)
|
executor = ThreadPoolExecutor(max_workers=2)
|
||||||
app.config['executor'] = executor
|
app.config['executor'] = executor
|
||||||
|
|
||||||
bot = Gpt4AllWebUI(app, args)
|
bot = Gpt4AllWebUI(app, config)
|
||||||
|
|
||||||
if args.debug:
|
if config["debug"]:
|
||||||
app.run(debug=True, host=args.host, port=args.port)
|
app.run(debug=True, host=config["host"], port=config["port"])
|
||||||
else:
|
else:
|
||||||
app.run(host=args.host, port=args.port)
|
app.run(host=config["host"], port=config["port"])
|
||||||
|
22
config.py
Normal file
22
config.py
Normal file
@ -0,0 +1,22 @@
|
|||||||
|
######
|
||||||
|
# Project : GPT4ALL-UI
|
||||||
|
# File : config.py
|
||||||
|
# Author : ParisNeo with the help of the community
|
||||||
|
# Supported by Nomic-AI
|
||||||
|
# Licence : Apache 2.0
|
||||||
|
# Description :
|
||||||
|
# A front end Flask application for llamacpp models.
|
||||||
|
# The official GPT4All Web ui
|
||||||
|
# Made by the community for the community
|
||||||
|
######
|
||||||
|
import yaml
|
||||||
|
|
||||||
|
def load_config(file_path):
|
||||||
|
with open(file_path, 'r') as stream:
|
||||||
|
config = yaml.safe_load(stream)
|
||||||
|
return config
|
||||||
|
|
||||||
|
|
||||||
|
def save_config(config, filepath):
|
||||||
|
with open(filepath, "w") as f:
|
||||||
|
yaml.dump(config, f)
|
13
configs/default.yaml
Normal file
13
configs/default.yaml
Normal file
@ -0,0 +1,13 @@
|
|||||||
|
seed: 0
|
||||||
|
model: "gpt4all-lora-quantized-ggml.bin"
|
||||||
|
temp: 0.1
|
||||||
|
n_predict: 256
|
||||||
|
top_k: 40
|
||||||
|
top_p: 0.95
|
||||||
|
repeat_penalty: 1.3
|
||||||
|
repeat_last_n: 64
|
||||||
|
ctx_size: 512
|
||||||
|
debug: false
|
||||||
|
host: "localhost"
|
||||||
|
port: 9600
|
||||||
|
db_path: "database.db"
|
@ -2,3 +2,4 @@ flask
|
|||||||
nomic
|
nomic
|
||||||
pytest
|
pytest
|
||||||
pyllamacpp
|
pyllamacpp
|
||||||
|
pyyaml
|
@ -69,7 +69,7 @@
|
|||||||
</form>
|
</form>
|
||||||
</div>
|
</div>
|
||||||
<div class="tab-pane" id="settings" style="display: none;">
|
<div class="tab-pane" id="settings" style="display: none;">
|
||||||
<div class="h-96 overflow-y-auto">
|
<div class="h-full overflow-y-auto">
|
||||||
<form id="model-params-form" class="bg-gray-700 shadow-md rounded px-8 py-8 pt-6 pb-8 mb-4 text-white">
|
<form id="model-params-form" class="bg-gray-700 shadow-md rounded px-8 py-8 pt-6 pb-8 mb-4 text-white">
|
||||||
<div class="mb-4">
|
<div class="mb-4">
|
||||||
<label class="block font-bold mb-2" for="model">Model</label>
|
<label class="block font-bold mb-2" for="model">Model</label>
|
||||||
@ -81,28 +81,27 @@
|
|||||||
<input class="bg-gray-700 shadow appearance-none border rounded w-full py-2 px-3 leading-tight focus:outline-none focus:shadow-outline" id="seed" type="text" name="seed" value="0">
|
<input class="bg-gray-700 shadow appearance-none border rounded w-full py-2 px-3 leading-tight focus:outline-none focus:shadow-outline" id="seed" type="text" name="seed" value="0">
|
||||||
</div>
|
</div>
|
||||||
<div class="mb-4">
|
<div class="mb-4">
|
||||||
<label class="block font-bold mb-2" for="temp">Temperature</label>
|
<label class="block font-bold mb-2" for="temp" id="temperature-value">Temperature (0.1)</label>
|
||||||
<input class="w-full slider-value" id="temp" type="range" min="0" max="1" step="0.1" value="0.1" name="temp">
|
<input class="w-full slider-value" id="temp" type="range" min="0" max="1" step="0.1" value="0.1" name="temp">
|
||||||
<p id="slider-value">0.1</p>
|
|
||||||
</div>
|
</div>
|
||||||
<div class="mb-4">
|
<div class="mb-4">
|
||||||
<label class="block font-bold mb-2" for="n-predict">N Predict</label>
|
<label class="block font-bold mb-2" for="n-predict" id="n-predict-value">N Predict (256)</label>
|
||||||
<input class="w-full slider-value" id="n-predict" type="range" min="0" max="2048" step="1" value="256" name="n-predict">
|
<input class="w-full slider-value" id="n-predict" type="range" min="0" max="2048" step="1" value="256" name="n-predict">
|
||||||
</div>
|
</div>
|
||||||
<div class="mb-4">
|
<div class="mb-4">
|
||||||
<label class="block font-bold mb-2" for="top-k">Top K</label>
|
<label class="block font-bold mb-2" for="top-k" id="top-k-value">Top K</label>
|
||||||
<input class="w-full slider-value" id="top-k" type="range" min="0" max="100" step="1" value="40" name="top-k">
|
<input class="w-full slider-value" id="top-k" type="range" min="0" max="100" step="1" value="40" name="top-k">
|
||||||
</div>
|
</div>
|
||||||
<div class="mb-4">
|
<div class="mb-4">
|
||||||
<label class="block font-bold mb-2" for="top-p">Top P</label>
|
<label class="block font-bold mb-2" for="top-p" id="top-p-value">Top P</label>
|
||||||
<input class="w-full slider-value" id="top-p" type="range" min="0" max="100" step="1" value="40" name="top-p">
|
<input class="w-full slider-value" id="top-p" type="range" min="0" max="100" step="1" value="40" name="top-p">
|
||||||
</div>
|
</div>
|
||||||
<div class="mb-4">
|
<div class="mb-4">
|
||||||
<label class="block font-bold mb-2" for="repeat-penalty">Repeat penalty</label>
|
<label class="block font-bold mb-2" for="repeat-penalty" id="repeat-penalty-value">Repeat penalty</label>
|
||||||
<input class="w-full slider-value" id="repeat-penalty" type="range" min="0" max="100" step="1" value="40" name="repeat-penalty">
|
<input class="w-full slider-value" id="repeat-penalty" type="range" min="0" max="2" step="0.1" value="1.3" name="repeat-penalty">
|
||||||
</div>
|
</div>
|
||||||
<div class="mb-4">
|
<div class="mb-4">
|
||||||
<label class="block font-bold mb-2" for="repeat-last-n">Repeat penalty</label>
|
<label class="block font-bold mb-2" for="repeat-last-n" id="repeat-last-n-value">Repeat last N</label>
|
||||||
<input class="w-full slider-value" id="repeat-last-n" type="range" min="0" max="100" step="1" value="40" name="repeat-last-n">
|
<input class="w-full slider-value" id="repeat-last-n" type="range" min="0" max="100" step="1" value="40" name="repeat-last-n">
|
||||||
</div>
|
</div>
|
||||||
<div class="mb-4">
|
<div class="mb-4">
|
||||||
|
Loading…
Reference in New Issue
Block a user