From d93b670cd6112df87754b18b65a34f76d77be5d0 Mon Sep 17 00:00:00 2001
From: Saifeddine ALOUI <aloui.seifeddine@gmail.com>
Date: Thu, 4 Jul 2024 17:11:54 +0200
Subject: [PATCH] added better handling

---
 lollms/app.py         | 8 +++++---
 lollms/personality.py | 6 +++---
 2 files changed, 8 insertions(+), 6 deletions(-)
diff --git a/lollms/app.py b/lollms/app.py
index ee88e1f..9454930 100644
--- a/lollms/app.py
+++ b/lollms/app.py
@@ -1038,7 +1038,8 @@ class LollmsApplication(LoLLMsCom):
                         query = current_message.content
                     if documentation=="":
                         documentation=f"{self.separator_template}".join([
-                            f"{self.separator_template}{self.start_header_id_template}important information{self.end_header_id_template}Utilize Documentation Data: Always refer to the provided documentation to answer user questions accurately.",
+                            f"{self.separator_template}{self.start_header_id_template}important information{self.end_header_id_template}",
+                            "Always refer to the provided documentation to answer user questions accurately.",
                             "Absence of Information: If the required information is not available in the documentation, inform the user that the requested information is not present in the documentation section.",
                             "Strict Adherence to Documentation: It is strictly prohibited to provide answers without concrete evidence from the documentation.",
                             "Cite Your Sources: After providing an answer, include the full path to the document where the information was found.",
@@ -1246,7 +1247,7 @@ class LollmsApplication(LoLLMsCom):
         total_tokens = n_cond_tk + n_isearch_tk + n_doc_tk + n_history_tk + n_user_description_tk + n_positive_boost + n_negative_boost + n_fun_mode
 
         # Calculate the available space for the messages
-        available_space = min(self.config.ctx_size - n_tokens - total_tokens, self.config.max_n_predict)
+        available_space = self.config.ctx_size - n_tokens - total_tokens
 
         # if self.config.debug:
         #     self.info(f"Tokens summary:\nConditionning:{n_cond_tk}\nn_isearch_tk:{n_isearch_tk}\ndoc:{n_doc_tk}\nhistory:{n_history_tk}\nuser description:{n_user_description_tk}\nAvailable space:{available_space}",10)
@@ -1371,7 +1372,8 @@ class LollmsApplication(LoLLMsCom):
             "current_language":self.config.current_language,
             "fun_mode":fun_mode,
             "ai_prefix":ai_prefix,
-            "extra":""
+            "extra":"",
+            "available_space":available_space
         }    
         if self.config.debug:
             ASCIIColors.highlight(documentation,"source_document_title", ASCIIColors.color_yellow, ASCIIColors.color_red, False)
diff --git a/lollms/personality.py b/lollms/personality.py
index 52a9d93..78be997 100644
--- a/lollms/personality.py
+++ b/lollms/personality.py
@@ -693,7 +693,7 @@ class AIPersonality:
 
         if max_generation_size is None:
             prompt_size = self.model.tokenize(prompt)
-            max_generation_size = self.model.config.ctx_size - len(prompt_size)
+            max_generation_size = min(self.model.config.ctx_size - len(prompt_size),self.config.max_n_predict)
 
         pr = PromptReshaper(prompt)
         prompt = pr.build(placeholders,
@@ -703,7 +703,7 @@ class AIPersonality:
                         sacrifice
                         )
         ntk = len(self.model.tokenize(prompt))
-        max_generation_size = min(self.model.config.ctx_size - ntk, max_generation_size)
+        max_generation_size = min(min(self.model.config.ctx_size - ntk, max_generation_size), self.config.max_n_predict)
         # TODO : add show progress
 
         gen = self.generate(prompt, max_generation_size, temperature = temperature, top_k = top_k, top_p=top_p, repeat_penalty=repeat_penalty, repeat_last_n=repeat_last_n, callback=callback, show_progress=show_progress).strip().replace("</s>", "").replace("<s>", "")
@@ -774,7 +774,7 @@ class AIPersonality:
             self.print_prompt("gen",prompt)
         self.model.generate(
                                 prompt,
-                                max_size if max_size else (self.config.ctx_size-len(self.model.tokenize(prompt))),
+                                max_size if max_size else min(self.config.ctx_size-len(self.model.tokenize(prompt)), self.config.max_n_predict),
                                 partial(self.process, callback=callback, show_progress=show_progress),
                                 temperature=self.model_temperature if temperature is None else temperature,
                                 top_k=self.model_top_k if top_k is None else top_k,