From fe562543b4e6811f98bc42e58aa06c46dd441c46 Mon Sep 17 00:00:00 2001
From: Saifeddine ALOUI <aloui.seifeddine@gmail.com>
Date: Fri, 13 Sep 2024 01:19:02 +0200
Subject: [PATCH] upgraded elevenlabs settings

---
 configs/config.yaml                           |  2 +-
 .../personal/configs/lollms_elf_config.yaml   |  2 +-
 .../personal/configs/lollms_elf_config.yaml   |  2 +-
 .../configs/lollms_elf_local_config.yaml      |  2 +-
 .../eleven_labs_tts/lollms_eleven_labs_tts.py | 58 +++++++++++++++++--
 5 files changed, 56 insertions(+), 10 deletions(-)

diff --git a/configs/config.yaml b/configs/config.yaml
index fcb8f5e..b618038 100644
--- a/configs/config.yaml
+++ b/configs/config.yaml
@@ -164,7 +164,7 @@ openai_tts_voice: "alloy"
 
 
 elevenlabs_tts_key: ""
-elevenlabs_tts_model_id: "eleven_monolingual_v2"
+elevenlabs_tts_model_id: "eleven_turbo_v2_5"
 elevenlabs_tts_voice_stability: 0.5
 elevenlabs_tts_voice_boost: 0.5
 elevenlabs_tts_voice_id: EXAVITQu4vr4xnSDxMaL
diff --git a/elf_docker_cfg/personal/configs/lollms_elf_config.yaml b/elf_docker_cfg/personal/configs/lollms_elf_config.yaml
index 0c751e1..87c2b66 100644
--- a/elf_docker_cfg/personal/configs/lollms_elf_config.yaml
+++ b/elf_docker_cfg/personal/configs/lollms_elf_config.yaml
@@ -163,7 +163,7 @@ openai_tts_voice: "alloy"
 
 
 elevenlabs_tts_key: ""
-elevenlabs_tts_model_id: "eleven_monolingual_v2"
+elevenlabs_tts_model_id: "eleven_turbo_v2_5"
 elevenlabs_tts_voice_stability: 0.5
 elevenlabs_tts_voice_boost: 0.5
 elevenlabs_tts_voice_id: EXAVITQu4vr4xnSDxMaL
diff --git a/elf_test_cfg/personal/configs/lollms_elf_config.yaml b/elf_test_cfg/personal/configs/lollms_elf_config.yaml
index 0c751e1..87c2b66 100644
--- a/elf_test_cfg/personal/configs/lollms_elf_config.yaml
+++ b/elf_test_cfg/personal/configs/lollms_elf_config.yaml
@@ -163,7 +163,7 @@ openai_tts_voice: "alloy"
 
 
 elevenlabs_tts_key: ""
-elevenlabs_tts_model_id: "eleven_monolingual_v2"
+elevenlabs_tts_model_id: "eleven_turbo_v2_5"
 elevenlabs_tts_voice_stability: 0.5
 elevenlabs_tts_voice_boost: 0.5
 elevenlabs_tts_voice_id: EXAVITQu4vr4xnSDxMaL
diff --git a/elf_test_cfg/personal/configs/lollms_elf_local_config.yaml b/elf_test_cfg/personal/configs/lollms_elf_local_config.yaml
index 0c751e1..87c2b66 100644
--- a/elf_test_cfg/personal/configs/lollms_elf_local_config.yaml
+++ b/elf_test_cfg/personal/configs/lollms_elf_local_config.yaml
@@ -163,7 +163,7 @@ openai_tts_voice: "alloy"
 
 
 elevenlabs_tts_key: ""
-elevenlabs_tts_model_id: "eleven_monolingual_v2"
+elevenlabs_tts_model_id: "eleven_turbo_v2_5"
 elevenlabs_tts_voice_stability: 0.5
 elevenlabs_tts_voice_boost: 0.5
 elevenlabs_tts_voice_id: EXAVITQu4vr4xnSDxMaL
diff --git a/lollms/services/tts/eleven_labs_tts/lollms_eleven_labs_tts.py b/lollms/services/tts/eleven_labs_tts/lollms_eleven_labs_tts.py
index c88b2f8..e546a2e 100644
--- a/lollms/services/tts/eleven_labs_tts/lollms_eleven_labs_tts.py
+++ b/lollms/services/tts/eleven_labs_tts/lollms_eleven_labs_tts.py
@@ -30,17 +30,17 @@ def get_Whisper(lollms_paths:LollmsPaths):
 class LollmsElevenLabsTTS(LollmsTTS):
     def __init__(
                     self, 
-                    app:LollmsApplication,
-                    model_id: str = "eleven_monolingual_v2",
-                    voice_id: str = "EXAVITQu4vr4xnSDxMaL",
+                    app: LollmsApplication,
+                    model_id: str = "eleven_turbo_v2_5",
+                    voice_name: str = "Sarah",
                     api_key: str = "",
                     output_path: Path | str = None,
                     stability: float = 0.5,
                     similarity_boost: float = 0.5,
                     streaming: bool = False
                     ):
-        super().__init__("elevenlabs_tts", app, model_id, voice_id, api_key, output_path)
-        self.voice_id = voice_id
+        super().__init__("elevenlabs_tts", app, model_id, voice_name, api_key, output_path)
+        self.voice_name = voice_name
         self.model_id = model_id
         self.api_key = api_key
         self.output_path = output_path
@@ -48,13 +48,54 @@ class LollmsElevenLabsTTS(LollmsTTS):
         self.similarity_boost = similarity_boost
         self.streaming = streaming
         self.ready = True
+        
+        self.voices = []
+        self.voice_id_map = {}
+        try:
+            self._fetch_voices()
+            self.voice_id = self._get_voice_id(voice_name)
+        except:
+            pass
+    def _fetch_voices(self):
+        url = "https://api.elevenlabs.io/v1/voices"
+        headers = {"xi-api-key": self.api_key}
+        
+        try:
+            response = requests.get(url, headers=headers)
+            response.raise_for_status()
+            data = response.json()
+            
+            for voice in data.get("voices", []):
+                name = voice.get("name")
+                voice_id = voice.get("voice_id")
+                if name and voice_id:
+                    self.voices.append(name)
+                    self.voice_id_map[name] = voice_id
+        except requests.RequestException as e:
+            print(f"Error fetching voices: {e}")
+            # Fallback to default voice
+            self.voices = ["Sarah"]
+            self.voice_id_map = {"Sarah": "EXAVITQu4vr4xnSDxMaL"}
+
+    def _get_voice_id(self, voice_name: str) -> str:
+        return self.voice_id_map.get(voice_name, "EXAVITQu4vr4xnSDxMaL")  # Default to Sarah if not found
+
+    def set_voice(self, voice_name: str):
+        if voice_name in self.voices:
+            self.voice_name = voice_name
+            self.voice_id = self._get_voice_id(voice_name)
+        else:
+            raise ValueError(f"Voice '{voice_name}' not found. Available voices: {', '.join(self.voices)}")
+
+
 
     def tts_file(self, text, file_name_or_path: Path | str = None, speaker=None, language="en", use_threading=False):
         speech_file_path = file_name_or_path
         payload = {
             "text": text,
+            "language_code": language,
             "model_id": self.model_id,
-            "voice_settings": {
+                "voice_settings": {
                 "stability": self.stability,
                 "similarity_boost": self.similarity_boost
             }
@@ -71,6 +112,10 @@ class LollmsElevenLabsTTS(LollmsTTS):
         else:
             url = f"https://api.elevenlabs.io/v1/text-to-speech/{self.voice_id}"
             response = requests.post(url, json=payload, headers=headers)
+            if response.status_code==400:
+                del payload["language_code"]
+                url = f"https://api.elevenlabs.io/v1/text-to-speech/{self.voice_id}"
+                response = requests.post(url, json=payload, headers=headers)
             with open(speech_file_path, 'wb') as f:
                 f.write(response.content)
 
@@ -80,6 +125,7 @@ class LollmsElevenLabsTTS(LollmsTTS):
         speech_file_path = file_name_or_path
         payload = {
             "text": text,
+            "language_code": language,
             "model_id": self.model_id,
             "voice_settings": {
                 "stability": self.stability,