From 1ee216e2f314ff85afb5ec855c6a28075e5720c1 Mon Sep 17 00:00:00 2001 From: Saifeddine ALOUI Date: Thu, 29 Aug 2024 00:16:24 +0200 Subject: [PATCH] Update download_transcript.py --- lollms/functions/youtube/download_transcript.py | 8 +++++--- 1 file changed, 5 insertions(+), 3 deletions(-) diff --git a/lollms/functions/youtube/download_transcript.py b/lollms/functions/youtube/download_transcript.py index e9f02dd..5b1d411 100644 --- a/lollms/functions/youtube/download_transcript.py +++ b/lollms/functions/youtube/download_transcript.py @@ -8,6 +8,7 @@ from functools import partial from typing import List from lollms.utilities import PackageManager from ascii_colors import trace_exception +from typing import Any # Installing necessary packages if not PackageManager.check_package_installed("youtube_transcript_api"): @@ -16,19 +17,20 @@ if not PackageManager.check_package_installed("youtube_transcript_api"): # Importing the package after installation from youtube_transcript_api import YouTubeTranscriptApi -def download_youtube_transcript(video_id: str) -> str: +def download_youtube_transcript(video_id: str, language_code: str = 'en') -> str: """ This function downloads the transcript of a YouTube video given its video ID. Parameters: video_id (str): The ID of the YouTube video. + language_code (str): The language code of the transcript to fetch (defaults to 'en'). Returns: str: The transcript of the video. 
""" try: # Fetching the transcript - transcript = YouTubeTranscriptApi.get_transcript(video_id) + transcript = YouTubeTranscriptApi.get_transcript(video_id, (language_code,)) # Combining the transcript into a single string transcript_text = " ".join([entry['text'] for entry in transcript]) @@ -42,5 +44,5 @@ def download_youtube_transcript_function(): "function_name": "download_youtube_transcript", "function": download_youtube_transcript, "function_description": "This function goes online to YouTube and downloads the transcript from any video.", - "function_parameters": [{"name": "video_id", "type": "str"}] + "function_parameters": [{"name": "video_id", "type": "str"},{"name": "language_code", "type": "str"}] }