Spaces:

WhisperTube
/

whispertube_backend

Runtime error

App Files Files Community

uzi007 committed on Oct 13, 2023

Commit

fe9dbf9

•

1 Parent(s): bc72637

APIs updated & yt-dlp added

Browse files

Files changed (8) hide show

helperfunctions.py +108 -0
languages.py +411 -0
main.py +131 -37
media_download.py +319 -212
summarizer.py +8 -8
temp/translated_subtitles.json +227 -0
temp/translated_transcript.txt +1 -0
translation.py +127 -0

helperfunctions.py ADDED Viewed

	@@ -0,0 +1,108 @@

+import os
+import subprocess
+def extract_audio(video_path):
+    """
+    Extract the audio track of a video file into an MP3 file using ffmpeg.
+    The MP3 is written next to the input, with the same base name.
+    Args:
+        video_path (str): Path to the input video file (e.g. MP4 or WebM).
+    Returns:
+        str: Path of extracted audio, or None if the extraction failed
+        (the error is printed, not raised).
+    """
+    try:
+        # Path for Extracted Audio File
+        filename, extension = os.path.splitext(video_path)
+        audio_path = filename + '.mp3'
+        # Input already is the target MP3: ffmpeg cannot read and write the same file
+        if audio_path == video_path:
+            return audio_path
+        # Choosing the Appropriate Codec for the Output Audio Format (MP3)
+        audio_codec = "libmp3lame" if extension.lower() in (".mp4", ".webm") else "mp3"
+        # Extracting Audio using FFMPEG Command
+        # Global options are placed before the input; '-y' overwrites a stale output and
+        # '-nostdin' keeps ffmpeg from waiting on an interactive overwrite prompt
+        command = ["ffmpeg", "-y", "-nostdin", "-loglevel", "quiet",
+                   "-i", video_path, "-vn", "-acodec", audio_codec, audio_path]
+        subprocess.run(command, check=True)
+        return audio_path
+    except Exception as e:
+        # Best-effort: report the failure and signal it with None
+        print(f"Error in extract_audio: {e}")
+        return None
+def _escape_ffmpeg_filter_value(value):
+    '''
+    Escapes a string so it can be used as an option value inside an ffmpeg filtergraph
+    '''
+    # Two passes, following ffmpeg's notes on filtergraph escaping:
+    # first for the filter's own option parser, then for the filtergraph parser
+    for special_chars in ("\\':", "\\'[],;"):
+        value = ''.join('\\' + char if char in special_chars else char for char in value)
+    return value
+def burn_subtitles(video_file_path, subtitle_file_path):
+    '''
+    Burns the subtitles onto the video using ffmpeg
+    The output is written next to the input video, named
+    <video name>_<subtitle extension><video extension> (e.g. clip.mp4 + clip.srt -> clip_srt.mp4)
+    Args:
+        video_file_path (str): Path to the input video file.
+        subtitle_file_path (str): Path to the subtitle file.
+    Returns:
+        str: Path of output video with subtitles, or None if rendering failed
+        (the error is printed, not raised).
+    '''
+    try:
+        # Getting Output File Path
+        video_filename, video_extension = os.path.splitext(video_file_path)
+        subtitle_extension = os.path.splitext(subtitle_file_path)[1]
+        output_file_path = video_filename + subtitle_extension.replace('.', '_') + video_extension
+        # The path is embedded in a filtergraph string, so characters such as ':' or ','
+        # must be escaped or ffmpeg parses them as filter syntax
+        subtitles_filter = f'subtitles={_escape_ffmpeg_filter_value(subtitle_file_path)}'
+        # Burning the Subtitles onto Video using FFMPEG Command
+        # Global options are placed before the input; '-y' overwrites a stale output and
+        # '-nostdin' keeps ffmpeg from waiting on an interactive overwrite prompt
+        command = ['ffmpeg', '-y', '-nostdin', '-loglevel', 'quiet',
+                   '-i', video_file_path, '-vf', subtitles_filter, output_file_path]
+        subprocess.run(command, check=True)
+        return output_file_path
+    except Exception as e:
+        # Best-effort: report the failure and signal it with None
+        print(f"Error in burn_subtitles: {e}")
+        return None
+def convert_to_srt_time_format(seconds):
+    '''
+    Converts seconds into the .srt timestamp format HH:MM:SS,mmm
+    Args:
+        seconds (int | float): Time offset in seconds.
+    Returns:
+        str: Timestamp such as "00:01:02,345", or None if the value could not
+        be converted (the error is printed, not raised).
+    '''
+    try:
+        # Rounding once to whole milliseconds avoids float truncation
+        # (1.001 s used to come out as ",000") and lets values such as
+        # 59.9996 s carry over into the next minute
+        total_milliseconds = int(round(seconds * 1000))
+        hours, remainder = divmod(total_milliseconds, 3_600_000)
+        minutes, remainder = divmod(remainder, 60_000)
+        whole_seconds, milliseconds = divmod(remainder, 1000)
+        return f"{hours:02d}:{minutes:02d}:{whole_seconds:02d},{milliseconds:03d}"
+    except Exception as e:
+        # Best-effort: report the failure and signal it with None
+        print(f"Error in convert_to_srt_time_format: {e}")
+        return None
+def save_translated_subtitles(subtitles, media_path):
+    '''
+    Saves the translated subtitles into a .srt file next to the media file
+    Args:
+        subtitles (list): Subtitle entries, each a dict with 'start' and 'end'
+            (seconds) and 'text'.
+        media_path (str): Path of the media file; its extension is replaced by '.srt'.
+    Returns:
+        str: Path of the written .srt file, or None if saving failed
+        (the error is printed, not raised).
+    '''
+    try:
+        # Converting to SRT Format: cues are numbered from 1 and each ends with a blank line
+        srt_blocks = []
+        for counter, subtitle in enumerate(subtitles, start=1):
+            start_time = convert_to_srt_time_format(subtitle['start'])
+            end_time = convert_to_srt_time_format(subtitle['end'])
+            srt_blocks.append(f"{counter}\n{start_time} --> {end_time}\n{subtitle['text']}\n\n")
+        # Joining once instead of growing a string inside the loop
+        srt_content = ''.join(srt_blocks)
+        # Saving SRT content to a .srt file
+        subtitles_filename = f'{os.path.splitext(media_path)[0]}.srt'
+        with open(subtitles_filename, 'w', encoding='utf-8') as srt_file:
+            srt_file.write(srt_content)
+        return subtitles_filename
+    except Exception as e:
+        # Best-effort: report the failure and signal it with None
+        print(f"Error in save_translated_subtitles: {e}")
+        return None

languages.py ADDED Viewed

	@@ -0,0 +1,411 @@

+# OpenAI Whisper - Supported Languages
+# Lowercase English language names, one per entry.
+# Not used by the LANGUAGES construction at the bottom of this file.
+whisper_languages = [
+    'afrikaans',
+    'arabic',
+    'armenian',
+    'azerbaijani',
+    'belarusian',
+    'bosnian',
+    'bulgarian',
+    'catalan',
+    'chinese',
+    'croatian',
+    'czech',
+    'danish',
+    'dutch',
+    'english',
+    'estonian',
+    'finnish',
+    'french',
+    'galician',
+    'german',
+    'greek',
+    'hebrew',
+    'hindi',
+    'hungarian',
+    'icelandic',
+    'indonesian',
+    'italian',
+    'japanese',
+    'kannada',
+    'kazakh',
+    'korean',
+    'latvian',
+    'lithuanian',
+    'macedonian',
+    'malay',
+    'marathi',
+    'maori',
+    'nepali',
+    'norwegian',
+    'persian',
+    'polish',
+    'portuguese',
+    'romanian',
+    'russian',
+    'serbian',
+    'slovak',
+    'slovenian',
+    'spanish',
+    'swahili',
+    'swedish',
+    'tagalog',
+    'tamil',
+    'thai',
+    'turkish',
+    'ukrainian',
+    'urdu',
+    'vietnamese',
+    'welsh'
+]
+# Google Translate - Supported Languages
+# Maps a lowercase language name to its language code.
+# The keys are looked up with lowercased NLLB names when LANGUAGES is built
+# at the bottom of this file, so key spelling must match those names exactly.
+gt_languages = {
+    'afrikaans': 'af',
+    'albanian': 'sq',
+    'amharic': 'am',
+    'arabic': 'ar',
+    'armenian': 'hy',
+    'assamese': 'as',
+    'aymara': 'ay',
+    'azerbaijani': 'az',
+    'bambara': 'bm',
+    'basque': 'eu',
+    'belarusian': 'be',
+    'bengali': 'bn',
+    'bhojpuri': 'bho',
+    'bosnian': 'bs',
+    'bulgarian': 'bg',
+    'catalan': 'ca',
+    'cebuano': 'ceb',
+    'chichewa': 'ny',
+    'chinese (simplified)': 'zh-CN',
+    'chinese (traditional)': 'zh-TW',
+    'corsican': 'co',
+    'croatian': 'hr',
+    'czech': 'cs',
+    'danish': 'da',
+    'dhivehi': 'dv',
+    'dogri': 'doi',
+    'dutch': 'nl',
+    'english': 'en',
+    'esperanto': 'eo',
+    'estonian': 'et',
+    'ewe': 'ee',
+    'filipino': 'tl',
+    'finnish': 'fi',
+    'french': 'fr',
+    'frisian': 'fy',
+    'galician': 'gl',
+    'georgian': 'ka',
+    'german': 'de',
+    'greek': 'el',
+    'guarani': 'gn',
+    'gujarati': 'gu',
+    'haitian creole': 'ht',
+    'hausa': 'ha',
+    'hawaiian': 'haw',
+    'hebrew': 'iw',  # NOTE(review): looks like the legacy code for Hebrew ('he' is the current one) - confirm which the translator expects
+    'hindi': 'hi',
+    'hmong': 'hmn',
+    'hungarian': 'hu',
+    'icelandic': 'is',
+    'igbo': 'ig',
+    'ilocano': 'ilo',
+    'indonesian': 'id',
+    'irish': 'ga',
+    'italian': 'it',
+    'japanese': 'ja',
+    'javanese': 'jw',  # NOTE(review): looks like the legacy code for Javanese ('jv' is the current one) - confirm which the translator expects
+    'kannada': 'kn',
+    'kazakh': 'kk',
+    'khmer': 'km',
+    'kinyarwanda': 'rw',
+    'konkani': 'gom',
+    'korean': 'ko',
+    'krio': 'kri',
+    'kurdish (kurmanji)': 'ku',
+    'kurdish (sorani)': 'ckb',
+    'kyrgyz': 'ky',
+    'lao': 'lo',
+    'latin': 'la',
+    'latvian': 'lv',
+    'lingala': 'ln',
+    'lithuanian': 'lt',
+    'luganda': 'lg',
+    'luxembourgish': 'lb',
+    'macedonian': 'mk',
+    'maithili': 'mai',
+    'malagasy': 'mg',
+    'malay': 'ms',
+    'malayalam': 'ml',
+    'maltese': 'mt',
+    'maori': 'mi',
+    'marathi': 'mr',
+    'meiteilon (manipuri)': 'mni-Mtei',
+    'mizo': 'lus',
+    'mongolian': 'mn',
+    'myanmar': 'my',
+    'nepali': 'ne',
+    'norwegian': 'no',
+    'odia (oriya)': 'or',
+    'oromo': 'om',
+    'pashto': 'ps',
+    'persian': 'fa',
+    'polish': 'pl',
+    'portuguese': 'pt',
+    'punjabi': 'pa',
+    'quechua': 'qu',
+    'romanian': 'ro',
+    'russian': 'ru',
+    'samoan': 'sm',
+    'sanskrit': 'sa',
+    'scots gaelic': 'gd',
+    'sepedi': 'nso',
+    'serbian': 'sr',
+    'sesotho': 'st',
+    'shona': 'sn',
+    'sindhi': 'sd',
+    'sinhala': 'si',
+    'slovak': 'sk',
+    'slovenian': 'sl',
+    'somali': 'so',
+    'spanish': 'es',
+    'sundanese': 'su',
+    'swahili': 'sw',
+    'swedish': 'sv',
+    'tajik': 'tg',
+    'tamil': 'ta',
+    'tatar': 'tt',
+    'telugu': 'te',
+    'thai': 'th',
+    'tigrinya': 'ti',
+    'tsonga': 'ts',
+    'turkish': 'tr',
+    'turkmen': 'tk',
+    'twi': 'ak',
+    'ukrainian': 'uk',
+    'urdu': 'ur',
+    'uyghur': 'ug',
+    'uzbek': 'uz',
+    'vietnamese': 'vi',
+    'welsh': 'cy',
+    'xhosa': 'xh',
+    'yiddish': 'yi',
+    'yoruba': 'yo',
+    'zulu': 'zu'
+}
+# NLLB - Supported Languages
+# Capitalised display names; script variants of the same language are listed
+# separately with the script in parentheses.
+# Each name is lowercased and matched against the gt_languages keys when
+# LANGUAGES is built at the bottom of this file.
+nllb_languages = [
+    'Acehnese (Arabic script)',
+    'Acehnese (Latin script)',
+    'Afrikaans',
+    'Akan',
+    'Amharic',
+    'Armenian',
+    'Assamese',
+    'Asturian',
+    'Awadhi',
+    'Ayacucho Quechua',
+    'Balinese',
+    'Bambara',
+    'Banjar (Arabic script)',
+    'Banjar (Latin script)',
+    'Bashkir',
+    'Basque',
+    'Belarusian',
+    'Bemba',
+    'Bengali',
+    'Bhojpuri',
+    'Bosnian',
+    'Buginese',
+    'Bulgarian',
+    'Burmese',
+    'Catalan',
+    'Cebuano',
+    'Central Atlas Tamazight',
+    'Central Aymara',
+    'Central Kanuri (Arabic script)',
+    'Central Kanuri (Latin script)',
+    'Central Kurdish',
+    'Chhattisgarhi',
+    'Chinese (Simplified)',
+    'Chinese (Traditional)',
+    'Chokwe',
+    'Crimean Tatar',
+    'Croatian',
+    'Czech',
+    'Danish',
+    'Dari',
+    'Dutch',
+    'Dyula',
+    'Dzongkha',
+    'Eastern Panjabi',
+    'Eastern Yiddish',
+    'Egyptian Arabic',
+    'English',
+    'Esperanto',
+    'Estonian',
+    'Ewe',
+    'Faroese',
+    'Fijian',
+    'Finnish',
+    'Fon',
+    'French',
+    'Friulian',
+    'Galician',
+    'Ganda',
+    'Georgian',
+    'German',
+    'Greek',
+    'Guarani',
+    'Gujarati',
+    'Haitian Creole',
+    'Halh Mongolian',
+    'Hausa',
+    'Hebrew',
+    'Hindi',
+    'Hungarian',
+    'Icelandic',
+    'Igbo',
+    'Ilocano',
+    'Indonesian',
+    'Irish',
+    'Italian',
+    'Japanese',
+    'Javanese',
+    'Jingpho',
+    'Kabiyè',
+    'Kabuverdianu',
+    'Kabyle',
+    'Kamba',
+    'Kannada',
+    'Kashmiri (Arabic script)',
+    'Kashmiri (Devanagari script)',
+    'Kazakh',
+    'Khmer',
+    'Kikongo',
+    'Kikuyu',
+    'Kimbundu',
+    'Kinyarwanda',
+    'Korean',
+    'Kyrgyz',
+    'Lao',
+    'Latgalian',
+    'Ligurian',
+    'Limburgish',
+    'Lingala',
+    'Lithuanian',
+    'Lombard',
+    'Luba-Kasai',
+    'Luo',
+    'Luxembourgish',
+    'Macedonian',
+    'Magahi',
+    'Maithili',
+    'Malayalam',
+    'Maltese',
+    'Maori',
+    'Marathi',
+    'Meitei (Bengali script)',
+    'Mesopotamian Arabic',
+    'Minangkabau (Arabic script)',
+    'Minangkabau (Latin script)',
+    'Mizo',
+    'Modern Standard Arabic',
+    'Modern Standard Arabic (Romanized)',
+    'Moroccan Arabic',
+    'Mossi',
+    'Najdi Arabic',
+    'Nepali',
+    'Nigerian Fulfulde',
+    'North Azerbaijani',
+    'North Levantine Arabic',
+    'Northern Kurdish',
+    'Northern Sotho',
+    'Northern Uzbek',
+    'Norwegian Bokmål',
+    'Norwegian Nynorsk',
+    'Nuer',
+    'Nyanja',
+    'Occitan',
+    'Odia',
+    'Pangasinan',
+    'Papiamento',
+    'Plateau Malagasy',
+    'Polish',
+    'Portuguese',
+    'Romanian',
+    'Rundi',
+    'Russian',
+    'Samoan',
+    'Sango',
+    'Sanskrit',
+    'Santali',
+    'Sardinian',
+    'Scottish Gaelic',
+    'Serbian',
+    'Shan',
+    'Shona',
+    'Sicilian',
+    'Silesian',
+    'Sindhi',
+    'Sinhala',
+    'Slovak',
+    'Slovenian',
+    'Somali',
+    'South Azerbaijani',
+    'South Levantine Arabic',
+    'Southern Pashto',
+    'Southern Sotho',
+    'Southwestern Dinka',
+    'Spanish',
+    'Standard Latvian',
+    'Standard Malay',
+    'Standard Tibetan',
+    'Sundanese',
+    'Swahili',
+    'Swati',
+    'Swedish',
+    "Ta'izzi-Adeni Arabic",
+    'Tagalog',
+    'Tajik',
+    'Tamasheq (Latin script)',
+    'Tamasheq (Tifinagh script)',
+    'Tamil',
+    'Tatar',
+    'Telugu',
+    'Thai',
+    'Tigrinya',
+    'Tok Pisin',
+    'Tosk Albanian',
+    'Tsonga',
+    'Tswana',
+    'Tumbuka',
+    'Tunisian Arabic',
+    'Turkish',
+    'Turkmen',
+    'Twi',
+    'Ukrainian',
+    'Umbundu',
+    'Urdu',
+    'Uyghur',
+    'Venetian',
+    'Vietnamese',
+    'Waray',
+    'Welsh',
+    'West Central Oromo',
+    'Western Persian',
+    'Wolof',
+    'Xhosa',
+    'Yoruba',
+    'Yue Chinese',
+    'Zulu'
+]
+# Languages available in both lists: Google Translate code -> NLLB display name.
+# Matching is by exact lowercase name, so NLLB names that differ from the
+# Google Translate spelling (e.g. 'Modern Standard Arabic' vs 'arabic') are left out.
+LANGUAGES = dict()
+for lang in nllb_languages:
+    lang_code = gt_languages.get(lang.lower())
+    # No Google Translate entry under this exact name
+    if not lang_code:
+        continue
+    LANGUAGES[lang_code] = lang

main.py CHANGED Viewed

@@ -8,9 +8,10 @@ from fastapi import FastAPI, Request
 from fastapi.middleware.cors import CORSMiddleware
 from media_download import YoutubeDownloader
-from transcription import StableWhisper
-from summarizer import Extract_Summary, AudioBookNarration
-from audiobook import AudioBook
 ### API Configurations
@@ -23,25 +24,25 @@ output_folder = 'Output'
 # Create a context variable to store the contexts for each user
 users_context = dict()
-# CORS (Cross-Origin Resource Sharing)
-origins = [
-    "http://localhost",
-    "http://localhost:4200",
-]
-app.add_middleware(
-    CORSMiddleware,
-    allow_origins=["*"],  # origins,
-    allow_credentials=True,
-    allow_methods=["*"],
-    allow_headers=["*"],
-)
 ### APIs
-@app.get("/get_media_info")
-async def get_media_info(request: Request, url: str):
     # Getting User's IP
     # user_ip = request.client.host
@@ -51,15 +52,39 @@ async def get_media_info(request: Request, url: str):
     youtube_downloader = YoutubeDownloader(url, output_folder)
     # Getting Youtube Media Info
-    media_info = youtube_downloader.get_media_info()
-    # Storing Info in the context for this user's session
-    users_context[user_ip] = dict()
-    users_context[user_ip]['downloader'] = youtube_downloader
-    # users_context[user_ip]['media_info'] = media_info
-    users_context[user_ip]['url'] = url
-    return media_info
 @app.get("/download_media")
@@ -80,11 +105,11 @@ async def download_media(request: Request, media_type: str, media_format: str, m
         users_context[user_ip]['media_path'] = media_path
         users_context[user_ip]['media_type'] = media_type
-    return {"status": status}
 @app.get("/get_transcript")
-async def get_transcript(request: Request, subtitle_format: str = 'srt', word_level: bool = True):
     # Getting User's IP
     # user_ip = request.client.host
@@ -96,7 +121,7 @@ async def get_transcript(request: Request, subtitle_format: str = 'srt', word_le
     # Checking if the media_type is Video, then extract it's audio
     media_type = users_context[user_ip]['media_type']
     if media_type == 'video':
-        media_path = users_context[user_ip]['downloader'].extract_audio(media_path)
     # # Whisper based transcription
     # stable_whisper_transcript = StableWhisper(media_path, output_folder, subtitle_format=subtitle_format, word_level=word_level)
@@ -122,7 +147,44 @@ async def get_transcript(request: Request, subtitle_format: str = 'srt', word_le
         users_context[user_ip]['transcript'] = transcript
         users_context[user_ip]['transcript_path'] = transcript_path
-    return {"status": status, "transcript": transcript}
 @app.get("/get_summary")
@@ -159,7 +221,7 @@ async def get_summary(request: Request, Summary_type: str, Summary_strategy: str
         # Storing Summary Info in the context for this user's session
         users_context[user_ip]['summary'] = output
-    return {"status": status, "summary": output}
 @app.get("/get_key_info")
@@ -196,11 +258,11 @@ async def get_key_info(request: Request, Summary_type: str, Summary_strategy: st
         # Storing Key Info in the context for this user's session
         users_context[user_ip]['key_info'] = output
-    return {"status": status, "key_info": output}
 # @app.get("/get_narration")
-# async def get_narration(request: Request, Narration_style: str, text_input: str = None):
 #     # Getting User's IP
 #     # user_ip = request.client.host
@@ -212,7 +274,7 @@ async def get_key_info(request: Request, Summary_type: str, Summary_strategy: st
 #     # # Extracting Narration
 #     # narrator = AudioBookNarration(text_input=text_input)
-#     # output = narrator.define_chain(Narration_style=Narration_style)
 #     temp_dir = 'temp'
 #     file_path = os.path.join(temp_dir, 'narration.txt')
@@ -227,11 +289,11 @@ async def get_key_info(request: Request, Summary_type: str, Summary_strategy: st
 #         # Storing Narration Info in the context for this user's session
 #         users_context[user_ip]['narration'] = output
-#     return {"status": status, "narration": output}
-@app.get("/get_naration_and_audiobook")
-async def get_audiobook(request: Request,Narration_style: str, output_type : str ,speaker: str = "male", text_input: str = None,):
     # Getting User's IP
     # user_ip = request.client.host
@@ -244,7 +306,7 @@ async def get_audiobook(request: Request,Narration_style: str, output_type : str
     # # Extracting Narration
     # narrator = AudioBookNarration(text_input=text_input)
-    # output = narrator.define_chain(Narration_style=Narration_style)
     # # Generating Audiobook
     # audiobook = AudioBook(output_folder=output_folder)
@@ -262,7 +324,39 @@ async def get_audiobook(request: Request,Narration_style: str, output_type : str
         # Storing Audiobook path in the context for this user's session
         users_context[user_ip]['audiobook_path'] = audio_path
-    return {"status": status, "audiobook_path": audio_path}
 if __name__ == "__main__":

 from fastapi.middleware.cors import CORSMiddleware
 from media_download import YoutubeDownloader
+# from transcription import StableWhisper
+# from summarizer import Extract_Summary, AudioBookNarration
+# from audiobook import AudioBook
+from helperfunctions import *
 ### API Configurations
 # Create a context variable to store the contexts for each user
 users_context = dict()
+# # CORS (Cross-Origin Resource Sharing)
+# origins = [
+#     "http://localhost",
+#     "http://localhost:4200",
+# ]
+# app.add_middleware(
+#     CORSMiddleware,
+#     allow_origins=["*"],  # origins,
+#     allow_credentials=True,
+#     allow_methods=["*"],
+#     allow_headers=["*"],
+# )
 ### APIs
+@app.get("/get_media_metadata")
+async def get_media_metadata(request: Request, url: str):
     # Getting User's IP
     # user_ip = request.client.host
     youtube_downloader = YoutubeDownloader(url, output_folder)
     # Getting Youtube Media Info
+    media_metadata = youtube_downloader.get_media_metadata()
+    # Getting Status
+    status = 1 if media_metadata else 0
+    if status:
+        # Storing Info in the context for this user's session
+        users_context[user_ip] = dict()
+        users_context[user_ip]['downloader'] = youtube_downloader
+        # users_context[user_ip]['media_metadata'] = media_metadata
+        users_context[user_ip]['url'] = url
+    return {'status': status, 'media_metadata': media_metadata}
+@app.get("/get_media_formats")
+async def get_media_formats(request: Request):
+    '''
+    Returns the media formats reported by the downloader stored for the user's session
+    The response holds 'status' (1 if any formats were returned, else 0) and 'media_formats'
+    '''
+    # Getting User's IP
+    # user_ip = request.client.host
+    user_ip = 1
+    # Fetching Media Formats from the Downloader kept in this user's session
+    session = users_context[user_ip]
+    media_formats = session['downloader'].get_media_formats()
+    # Getting Status
+    status = 1 if media_formats else 0
+    # Storing Media Info in the context for this user's session (only on success)
+    if status == 1:
+        session['media_formats'] = media_formats
+    return {'status': status, 'media_formats': media_formats}
 @app.get("/download_media")
         users_context[user_ip]['media_path'] = media_path
         users_context[user_ip]['media_type'] = media_type
+    return {'status': status, 'media_path': media_path}
 @app.get("/get_transcript")
+async def get_transcript(request: Request, subtitle_format: str = 'srt', word_level: bool = False):
     # Getting User's IP
     # user_ip = request.client.host
     # Checking if the media_type is Video, then extract it's audio
     media_type = users_context[user_ip]['media_type']
     if media_type == 'video':
+        media_path = extract_audio(media_path)
     # # Whisper based transcription
     # stable_whisper_transcript = StableWhisper(media_path, output_folder, subtitle_format=subtitle_format, word_level=word_level)
         users_context[user_ip]['transcript'] = transcript
         users_context[user_ip]['transcript_path'] = transcript_path
+    return {'status': status, "transcript": transcript}
+@app.get("/get_translation")
+async def get_translation(request: Request, target_language: str = 'en'):
+    '''
+    Returns the translated transcript & subtitles for the user's session
+    The NLLB translation call is commented out for now: results are read from
+    pre-generated files in the temp folder, so target_language is not used yet
+    '''
+    # Getting User's IP
+    # user_ip = request.client.host
+    user_ip = 1
+    session = users_context[user_ip]
+    # Retrieving the transcript from the context for this user's session
+    transcript = session['transcript']
+    # # # NLLB based Translation
+    # nllb_translator = Translation(transcript, transcript['language'], target_language, 'output_path')
+    # translated_transcript = nllb_translator.get_translated_transcript()
+    # translated_subtitles = nllb_translator.get_translated_subtitles()
+    # Loading the Translated Transcript (plain text)
+    with open(os.path.join('temp', 'translated_transcript.txt'), "r", encoding="utf-8") as transcript_file:
+        translated_transcript = transcript_file.read()
+    # Loading the Translated Subtitles (JSON)
+    with open(os.path.join('temp', 'translated_subtitles.json'), "r", encoding="utf-8") as subtitles_file:
+        translated_subtitles = json.load(subtitles_file)
+    # Getting Status
+    status = 0
+    if translated_transcript and translated_subtitles:
+        status = 1
+        # Storing Translated Transcript Info in the context for this user's session
+        session['translated_transcript'] = translated_transcript
+        session['translated_subtitles'] = translated_subtitles
+        # session['transcript_path'] = transcript_path
+    return {'status': status, "transcript": translated_transcript, "subtitles": translated_subtitles}
 @app.get("/get_summary")
         # Storing Summary Info in the context for this user's session
         users_context[user_ip]['summary'] = output
+    return {'status': status, "summary": output}
 @app.get("/get_key_info")
         # Storing Key Info in the context for this user's session
         users_context[user_ip]['key_info'] = output
+    return {'status': status, "key_info": output}
 # @app.get("/get_narration")
+# async def get_narration(request: Request, narration_style: str, text_input: str = None):
 #     # Getting User's IP
 #     # user_ip = request.client.host
 #     # # Extracting Narration
 #     # narrator = AudioBookNarration(text_input=text_input)
+#     # output = narrator.define_chain(narration_style=narration_style)
 #     temp_dir = 'temp'
 #     file_path = os.path.join(temp_dir, 'narration.txt')
 #         # Storing Narration Info in the context for this user's session
 #         users_context[user_ip]['narration'] = output
+#     return {'status': status, "narration": output}
+@app.get("/get_audiobook")
+async def get_audiobook(request: Request, output_type : str, narration_style: str, speaker: str = "male", text_input: str = None):
     # Getting User's IP
     # user_ip = request.client.host
     # # Extracting Narration
     # narrator = AudioBookNarration(text_input=text_input)
+    # output = narrator.define_chain(narration_style=narration_style)
     # # Generating Audiobook
     # audiobook = AudioBook(output_folder=output_folder)
         # Storing Audiobook path in the context for this user's session
         users_context[user_ip]['audiobook_path'] = audio_path
+    return {'status': status, "audiobook_path": audio_path}
+@app.get("/get_rendered_video")
+async def get_rendered_video(request: Request, subtitles_type: str = 'original'):
+    '''
+    Burns the requested subtitles onto the media stored for the user's session
+    Args:
+        request (Request): Incoming request (unused while the user id is hard-coded).
+        subtitles_type (str): 'original' to use the stored transcript file,
+            'translated' to use the stored translated subtitles.
+    Returns:
+        dict: 'status' (1 on success, 0 otherwise) and 'rendered_video_path'
+        (None when the video could not be rendered).
+    '''
+    # Getting User's IP
+    # user_ip = request.client.host
+    user_ip = 1
+    # Retrieving the media_path from the context for this user's session
+    media_path = users_context[user_ip]['media_path']
+    # Getting Required Subtitles
+    if subtitles_type == 'original':
+        subtitles_path = users_context[user_ip]['transcript_path']
+    elif subtitles_type == 'translated':
+        # Getting Translated Subtitles from the context for this user's session
+        translated_subtitles = users_context[user_ip]['translated_subtitles']
+        # Saving Translated Subtitles
+        subtitles_path = save_translated_subtitles(translated_subtitles, media_path)
+    else:
+        # Unsupported type: report failure instead of crashing on an unbound subtitles_path
+        return {'status': 0, "rendered_video_path": None}
+    # Burning Subtitles & Rendering Video
+    rendered_video_path = burn_subtitles(media_path, subtitles_path)
+    # Getting Status
+    status = 1 if rendered_video_path else 0
+    return {'status': status, "rendered_video_path": rendered_video_path}
 if __name__ == "__main__":

media_download.py CHANGED Viewed

@@ -71,8 +71,26 @@ class YoutubeDownloader(MediaDownloader):
         self.thumbnail_url = self.youtube.thumbnail_url
         self.streams = self.youtube.streams
         self.streams_df, self.media_formats_dict = self._get_supported_media_formats()
-    def __get_quality_int(self, media_quality):
         '''
         Returns the Quality in Integer
         E.g: Given input 1080p, it returns 1080
@@ -87,43 +105,97 @@ class YoutubeDownloader(MediaDownloader):
         '''
         Returns all supported media formats for both audio & video
         '''
-        # Creating Pandas Dataframe for Video Streams' Details
-        streams_details = []
-        for stream in self.streams.filter(only_video=True):
-            media_type = stream.type
-            media_format = stream.mime_type.split('/')[1]
-            quality = stream.resolution
-            progressive = stream.is_progressive
-            stream_details = [media_type, media_format, quality, progressive]
-            streams_details.append(stream_details)
-        cols = ['media_type', 'media_format', 'media_quality', 'progressive']
-        streams_df = pd.DataFrame(streams_details, columns=cols)
-        # Adding Custom Audio Streams
-        streams_df.loc[len(streams_df)] = ['audio', 'mp3', '128kbps', False]
-        streams_df.loc[len(streams_df)] = ['audio', 'mp3', '256kbps', False]
-        streams_df.loc[len(streams_df)] = ['audio', 'wav', '1411kbps', False]
-        # Converting to Dictionary for Unique User Options
-        media_formats_dict = dict()
-        for media_type in sorted(streams_df['media_type'].unique()):
-            media_formats_dict[media_type] = dict()
-            media_type_df = streams_df[streams_df['media_type'] == media_type]
-            for media_format in sorted(media_type_df['media_format'].unique()):
-                media_format_df = media_type_df[media_type_df['media_format'] == media_format]
-                media_qualities = sorted(media_format_df['media_quality'].unique(), key=self.__get_quality_int)
-                media_formats_dict[media_type][media_format] = media_qualities
-        return streams_df, media_formats_dict
-    def get_media_formats(self):
-        '''
-        Returns a dictioary for supported media formats
-        '''
-        return self.media_formats_dict
-    def _select_media_format(self):
         '''
         For selecting media format to download
         '''
@@ -186,71 +258,164 @@ class YoutubeDownloader(MediaDownloader):
         return output_path
     def _download_audio(self, audio_format, audio_quality):
         '''
         Filters the required audio stream & downloads it
         '''
-        # Getting Quality Command String
-        quality = str(self.__get_quality_int(audio_quality)) + 'K'
-        # Getting Output Path
-        output_path = os.path.join(self.output_path, f"{self.title}.{audio_format}")
-        # Download Command
-        command = [
-            "yt-dlp",
-            "-x", "--audio-format", audio_format,
-            "--audio-quality",  quality,
-            "-o", output_path,
-            self.url, "-q"
-        ]
-        # Running the command using Subprocess
-        subprocess.run(command)
-        return output_path
     def _download_video(self, video_format, video_quality):
         '''
         Filters the required video stream & downloads it
         Only for Progressive media i.e containing both audio & video streams
         '''
-        stream = self.streams.filter(progressive=True, file_extension=video_format, resolution=video_quality).first()
-        print(stream)
-        video_path = stream.download(output_path=self.output_path, filename=f"{self.title}.{video_format}")
-        return video_path
-    def _download_audio_and_video(self, media_format, media_quality):
-        '''
-        Filters the required video stream & downloads it
-        Filters the best quality audio stream of the same format & downloads it
-        '''
-        # Downloading Audio
-        stream = self.streams.filter(file_extension=media_format, only_audio=True).order_by('abr').desc().first()
-        print(stream)
-        audio_filename = f"{self.title} - Audio.{media_format}"
-        audio_path = stream.download(output_path=self.output_path, filename=audio_filename)
-        # Downloading Video
-        stream = self.streams.filter(file_extension=media_format, resolution=media_quality).first()
-        print(stream)
-        video_filename = f"{self.title} - Video.{media_format}"
-        video_path = stream.download(output_path=self.output_path, filename=video_filename)
-        # Combining the Audio & Video Files using FFMPEG Command
-        output_path = os.path.join(self.output_path, f"{self.title}.{media_format}")
-        command = ['ffmpeg', '-i', video_path, '-i', audio_path,
-                   '-c:v', 'copy', '-c:a', 'copy', output_path,
-                   '-loglevel', 'quiet']
-        subprocess.run(command)
-        os.remove(audio_path)
-        os.remove(video_path)
-        return output_path
     def _download_media_chunk(self, media_type, media_format, media_quality):
         '''
@@ -270,153 +435,95 @@ class YoutubeDownloader(MediaDownloader):
         '''
         Filters the required audio stream & downloads it for particular chunk
         '''
-        # Getting Chunk Command String
-        if (self.start_time) and (self.end_time):
-            chunk_string = f"-ss {self.start_time} -to {self.end_time}"
-        elif (self.start_time) and (not self.end_time):
-            chunk_string = f"-ss {self.start_time}"
-        elif (not self.start_time) and (self.end_time):
-            chunk_string = f"-to {self.end_time}"
-        # Getting Quality Command String
-        quality = str(self.__get_quality_int(audio_quality)) + 'K'
-        # Getting Output Path
-        output_path = os.path.join(self.output_path, f"{self.title}.{audio_format}")
-        # Download Command
-        command = [
-            "yt-dlp",
-            "-x", "--audio-format", audio_format,
-            "--audio-quality",  quality,
-            "--external-downloader", "ffmpeg",
-            "--external-downloader-args", chunk_string,
-            "-o", output_path,
-            url, "-q"
-        ]
-        # Running the command using Subprocess
-        subprocess.run(command)
-        return output_path
     def _download_video_chunk(self, video_format, video_quality):
         '''
         Filters the required video stream & downloads it for particular chunk
         '''
-        # Getting Chunk Command String
-        if (self.start_time) and (self.end_time):
-            chunk_string = f"-ss {self.start_time} -to {self.end_time}"
-        elif (self.start_time) and (not self.end_time):
-            chunk_string = f"-ss {self.start_time}"
-        elif (not self.start_time) and (self.end_time):
-            chunk_string = f"-to {self.end_time}"
-        # Getting Output Path
-        output_path = os.path.join(self.output_path, f"{self.title}.{video_format}")
-        # Getting Video Quality Integer
-        video_quality = self.__get_quality_int(video_quality)
-        # Download Command
-        if video_format == 'mp4':
-            video_codec  = "h264"
-            audio_codec  = "m4a"
-        elif video_format == 'webm':
-            video_codec  = "vp9"
-            audio_codec  = "opus"
-        else:
-            print('Unexpected Video Format Encountered:', video_format)
-            os.exit(0)
-        command = [
-            "yt-dlp",
-            url,
-            "-S", f"res:{video_quality},vcodec:{video_codec},acodec:{audio_codec}",
-           "--merge-output-format", video_format,
-            "--download-sections", f"*{self.start_time}-{self.end_time}",
-            "-o", f"{output_path}",
-        #     "-q"
-        ]
-        print(' '.join(command))
-        # Running the command using Subprocess
-        subprocess.run(command)
-        return output_path
-    def get_media_info(self):
-        media_info = {
-            'title': self.title,
-            'media_length': self.media_length,
-            'thumbnail_url': self.thumbnail_url,
-            'formats': self.media_formats_dict
-        }
-        return media_info
-    @staticmethod
-    def extract_audio(video_path):
-        """
-        Extract audio from a video file (MP4 or WebM) and save it as an MP3 file using ffmpeg.
-        Args:
-            video_path (str): Path to the input video file.
-        Returns:
-            str: Path of extracted audio.
-        """
-        try:
-            # Path for Extracted Audio File
-            filename, extension = os.path.splitext(video_path)
-            audio_path = filename + '.mp3'
-            # Choosing the Appropriate Codec for the Output Audio Format (MP3)
-            audio_codec = "libmp3lame" if extension.lower() in (".mp4", ".webm") else "mp3"
-            # Extracting Audio using FFMPEG Command
-            command = ["ffmpeg", "-i", video_path, "-vn", "-acodec",
-                       audio_codec, audio_path, '-loglevel', 'quiet']
-            subprocess.run(command, check=True)
-            return audio_path
-        except subprocess.CalledProcessError as e:
-            print(f"Error: {e}")
-    @staticmethod
-    def burn_subtitles(video_file_path, subtitle_file_path):
-        '''
-        Burns the subtitles onto the video
-        Args:
-            video_file_path (str): Path to the input video file.
-            subtitle_file_path (str): Path to the subtitle file.
-        Returns:
-            str: Path of output video with subtitles.
-        '''
-        try:
-            # Getting Output File Path
-            video_filename, video_extension = os.path.splitext(video_file_path)
-            subtitle_filename, subtitle_extension = os.path.splitext(subtitle_file_path)
-            output_file_path = video_filename + subtitle_extension.replace('.', '_') + video_extension
-            # Burning the Subtitles onto Video using FFMPEG Command
-            command = ['ffmpeg', '-i', video_file_path,
-                    '-vf', f'subtitles={subtitle_file_path}',
-                    output_file_path, '-loglevel', 'quiet']
-            subprocess.run(command, check=True)
-            return output_file_path
-        except subprocess.CalledProcessError as e:
-            print(f"Error: {e}")

         self.thumbnail_url = self.youtube.thumbnail_url
         self.streams = self.youtube.streams
         self.streams_df, self.media_formats_dict = self._get_supported_media_formats()
+    def get_media_formats(self):
+        '''
+        Returns a dictionary for supported media formats
+        Returns:
+            dict: The value stored in self.media_formats_dict, i.e. the second
+                item returned by self._get_supported_media_formats().
+        '''
+        return self.media_formats_dict
+    def get_media_metadata(self):
+        '''
+        Builds the metadata dictionary of the media
+        Returns:
+            dict: 'title', 'media_length' & 'thumbnail_url' as stored on the instance.
+        '''
+        return {
+            'title': self.title,
+            'media_length': self.media_length,
+            'thumbnail_url': self.thumbnail_url
+        }
+    @staticmethod
+    def __get_quality_int(media_quality):
         '''
         Returns the Quality in Integer
         E.g: Given input 1080p, it returns 1080
         '''
         Returns all supported media formats for both audio & video
         '''
+        try:
+            # Creating Pandas Dataframe for Video Streams' Details
+            streams_details = []
+            for stream in self.streams.filter(only_video=True):
+                media_type = stream.type
+                media_format = stream.mime_type.split('/')[1]
+                quality = stream.resolution
+                progressive = stream.is_progressive
+                stream_details = [media_type, media_format, quality, progressive]
+                streams_details.append(stream_details)
+            cols = ['media_type', 'media_format', 'media_quality', 'progressive']
+            streams_df = pd.DataFrame(streams_details, columns=cols)
+            # Adding Custom Audio Streams
+            streams_df.loc[len(streams_df)] = ['audio', 'mp3', '128kbps', False]
+            streams_df.loc[len(streams_df)] = ['audio', 'mp3', '256kbps', False]
+            streams_df.loc[len(streams_df)] = ['audio', 'wav', '1411kbps', False]
+            # Converting to Dictionary for Unique User Options
+            media_formats_dict = dict()
+            for media_type in sorted(streams_df['media_type'].unique()):
+                media_formats_dict[media_type] = dict()
+                media_type_df = streams_df[streams_df['media_type'] == media_type]
+                for media_format in sorted(media_type_df['media_format'].unique()):
+                    media_format_df = media_type_df[media_type_df['media_format'] == media_format]
+                    media_qualities = sorted(media_format_df['media_quality'].unique(), key=self.__get_quality_int)
+                    media_formats_dict[media_type][media_format] = media_qualities
+            return streams_df, media_formats_dict
+        except Exception as pytube_error:
+            print(f"PyTube Error in _get_supported_media_formats: \n{pytube_error}\n")
+            print('Trying with yt-dlp...')
+            try:
+                # Download Command
+                command = ["yt-dlp", "--list-formats", url,
+                           "--get-filename", "--format", "best[ext=mp4]/best[ext=webm]"]
+                print(' '.join(command))
+                # Running the command using Subprocess and capturing the output
+                completed_process = subprocess.run(command, text=True, stdout=subprocess.PIPE)
+                if completed_process.returncode != 0:
+                    print(f"yt-dlp error in _get_supported_media_formats:")
+                    print(completed_process.stderr)
+                else:
+                    output_lines = completed_process.stdout.split('\n')
+                    output_lines = [line for line in output_lines if line.strip()]
+                    # Create a list of dictionaries for each format entry
+                    streams_details = []
+                    for line in output_lines[2:]:  # Skip the header lines
+                        fields = line.split()
+                        media_format = fields[1]
+                        media_quality = fields[-2]
+                        if media_format in ['mp4', 'webm']:
+                            if 'p,' in media_quality:
+                                media_type = 'video'
+                                media_quality = media_quality[:-1]
+                                progressive = False
+                                stream_details = [media_type, media_format, media_quality, progressive]
+                                streams_details.append(stream_details)
+                    # Create a pandas DataFrame from the list of dictionaries
+                    cols = ['media_type', 'media_format', 'media_quality', 'progressive']
+                    streams_df = pd.DataFrame(streams_details, columns=cols)
+                    streams_df = streams_df.drop_duplicates().reset_index(drop=True)
+                    # Adding Custom Audio Streams
+                    streams_df.loc[len(streams_df)] = ['audio', 'mp3', '128kbps', False]
+                    streams_df.loc[len(streams_df)] = ['audio', 'mp3', '256kbps', False]
+                    streams_df.loc[len(streams_df)] = ['audio', 'wav', '1411kbps', False]
+                    # Converting to Dictionary for Unique User Options
+                    media_formats_dict = dict()
+                    for media_type in sorted(streams_df['media_type'].unique()):
+                        media_formats_dict[media_type] = dict()
+                        media_type_df = streams_df[streams_df['media_type'] == media_type]
+                        for media_format in sorted(media_type_df['media_format'].unique()):
+                            media_format_df = media_type_df[media_type_df['media_format'] == media_format]
+                            media_qualities = sorted(media_format_df['media_quality'].unique(), key=self.__get_quality_int)
+                            media_formats_dict[media_type][media_format] = media_qualities
+                    return streams_df, media_formats_dict
+            except Exception as yt_dlp_error:
+                print(f"yt-dlp error in _get_supported_media_formats: \n{yt_dlp_error}\n")
+    def select_media_format(self):
         '''
         For selecting media format to download
         '''
         return output_path
     def _download_audio(self, audio_format, audio_quality):
         '''
         Filters the required audio stream & downloads it
         '''
+        # Args:
+        #     audio_format (str): Target format handed to yt-dlp's --audio-format.
+        #     audio_quality (str): Quality label; its integer part (via __get_quality_int)
+        #         is suffixed with 'K' for --audio-quality, e.g. presumably '128kbps' -> '128K'.
+        # Returns:
+        #     str: Path of the extracted audio, or None when yt-dlp fails.
+        try:
+            # Getting Quality Command String
+            quality = str(self.__get_quality_int(audio_quality)) + 'K'
+            # Getting Output Path
+            output_path = os.path.join(self.output_path, f"{self.title}.{audio_format}")
+            # Download Command
+            command = [
+                "yt-dlp",
+                "-x", "--audio-format", audio_format,
+                "--audio-quality",  quality,
+                "-o", output_path,
+                self.url, "-q"
+            ]
+            # Running the command using Subprocess
+            # check=True: a non-zero yt-dlp exit must reach the except branch instead of
+            # returning a path to a file that was never written
+            subprocess.run(command, check=True)
+            return output_path
+        except Exception as yt_dlp_error:
+            print(f"Error in _download_audio: \n{yt_dlp_error}\n")
     def _download_video(self, video_format, video_quality):
         '''
         Filters the required video stream & downloads it
         Only for Progressive media i.e containing both audio & video streams
         '''
+        # Args:
+        #     video_format (str): Container format; the yt-dlp fallback supports 'mp4' & 'webm'.
+        #     video_quality (str): Resolution label, e.g. '1080p'.
+        # Returns:
+        #     str: Path of the downloaded video, or None when both PyTube & yt-dlp fail.
+        try:
+            stream = self.streams.filter(progressive=True, file_extension=video_format, resolution=video_quality).first()
+            print(stream)
+            video_path = stream.download(output_path=self.output_path, filename=f"{self.title}.{video_format}")
+            return video_path
+        except Exception as pytube_error:
+            print(f"PyTube error in _download_video: \n{pytube_error}\n")
+            print('Trying with yt-dlp...')
+            try:
+                # Getting Output Path
+                output_path = os.path.join(self.output_path, f"{self.title}.{video_format}")
+                # Getting Video Quality Integer
+                video_quality = self.__get_quality_int(video_quality)
+                # Setting Formats
+                if video_format == 'mp4':
+                    video_codec  = "h264"
+                    audio_codec  = "m4a"
+                elif video_format == 'webm':
+                    video_codec  = "vp9"
+                    audio_codec  = "opus"
+                else:
+                    # os.exit() does not exist; raising keeps the failure inside the
+                    # handler below, so the method still prints the error & returns None
+                    raise ValueError(f'Unexpected Video Format Encountered: {video_format}')
+                # Download Command
+                command = [
+                    "yt-dlp",
+                    self.url,
+                    "-S", f"res:{video_quality},vcodec:{video_codec},acodec:{audio_codec}",
+                    "--merge-output-format", video_format,
+                    "-o", f"{output_path}",
+                    "-q"
+                ]
+                print(' '.join(command))
+                # Running the command using Subprocess
+                subprocess.run(command, check=True)
+                return output_path
+            except Exception as yt_dlp_error:
+                print(f"yt-dlp error in _download_video: \n{yt_dlp_error}\n")
+    def _download_audio_and_video(self, media_format, media_quality):
+        '''
+        Filters the required video stream & downloads it
+        Filters the best quality audio stream of the same format & downloads it
+        Both streams are merged with FFMPEG; yt-dlp is tried when PyTube or the merge fails
+        Args:
+            media_format (str): Container format; the yt-dlp fallback supports 'mp4' & 'webm'.
+            media_quality (str): Resolution label, e.g. '1080p'.
+        Returns:
+            str: Path of the merged media file, or None when both PyTube & yt-dlp fail.
+        '''
+        try:
+            # Downloading Audio
+            stream = self.streams.filter(file_extension=media_format, only_audio=True).order_by('abr').desc().first()
+            print(stream)
+            audio_filename = f"{self.title} - Audio.{media_format}"
+            audio_path = stream.download(output_path=self.output_path, filename=audio_filename)
+            # Downloading Video
+            stream = self.streams.filter(file_extension=media_format, resolution=media_quality).first()
+            print(stream)
+            video_filename = f"{self.title} - Video.{media_format}"
+            video_path = stream.download(output_path=self.output_path, filename=video_filename)
+            # Combining the Audio & Video Files using FFMPEG Command
+            output_path = os.path.join(self.output_path, f"{self.title}.{media_format}")
+            command = ['ffmpeg', '-i', video_path, '-i', audio_path,
+                    '-c:v', 'copy', '-c:a', 'copy', output_path,
+                    '-loglevel', 'quiet']
+            try:
+                # check=True: a failed merge must not be reported as a finished download
+                subprocess.run(command, check=True)
+            finally:
+                # The intermediate streams are removed whether or not the merge worked
+                os.remove(audio_path)
+                os.remove(video_path)
+            return output_path
+        except Exception as pytube_error:
+            print(f"PyTube error in _download_audio_and_video: \n{pytube_error}\n")
+            print('Trying with yt-dlp...')
+            try:
+                # Getting Output Path
+                output_path = os.path.join(self.output_path, f"{self.title}.{media_format}")
+                # Getting Video Quality Integer
+                media_quality = self.__get_quality_int(media_quality)
+                # Setting Formats
+                if media_format == 'mp4':
+                    video_codec  = "h264"
+                    audio_codec  = "m4a"
+                elif media_format == 'webm':
+                    video_codec  = "vp9"
+                    audio_codec  = "opus"
+                else:
+                    # os.exit() does not exist; raising keeps the failure inside the
+                    # handler below, so the method still prints the error & returns None
+                    raise ValueError(f'Unexpected Video Format Encountered: {media_format}')
+                # Download Command
+                command = [
+                    "yt-dlp",
+                    self.url,
+                    "-S", f"res:{media_quality},vcodec:{video_codec},acodec:{audio_codec}",
+                    "--merge-output-format", media_format,
+                    "-o", f"{output_path}",
+                    "-q"
+                ]
+                print(' '.join(command))
+                # Running the command using Subprocess
+                subprocess.run(command, check=True)
+                return output_path
+            except Exception as yt_dlp_error:
+                print(f"yt-dlp error in _download_audio_and_video: \n{yt_dlp_error}\n")
     def _download_media_chunk(self, media_type, media_format, media_quality):
         '''
         '''
         Filters the required audio stream & downloads it for particular chunk
         '''
+        try:
+            # Getting Chunk Command String
+            if (self.start_time) and (self.end_time):
+                chunk_string = f"-ss {self.start_time} -to {self.end_time}"
+            elif (self.start_time) and (not self.end_time):
+                chunk_string = f"-ss {self.start_time}"
+            elif (not self.start_time) and (self.end_time):
+                chunk_string = f"-to {self.end_time}"
+            # Getting Quality Command String
+            quality = str(self.__get_quality_int(audio_quality)) + 'K'
+            # Getting Output Path
+            output_path = os.path.join(self.output_path, f"{self.title}.{audio_format}")
+            # Download Command
+            command = [
+                "yt-dlp",
+                "-x", "--audio-format", audio_format,
+                "--audio-quality",  quality,
+                "--external-downloader", "ffmpeg",
+                "--external-downloader-args", chunk_string,
+                "-o", output_path,
+                url, "-q"
+            ]
+            # Running the command using Subprocess
+            subprocess.run(command)
+            return output_path
+        except Exception as e:
+            print(f"Error in _download_audio_chunk: {e}")
     def _download_video_chunk(self, video_format, video_quality):
         '''
         Filters the required video stream & downloads it for particular chunk
         '''
+        # Args:
+        #     video_format (str): Container format, 'mp4' or 'webm'.
+        #     video_quality (str): Resolution label, e.g. '1080p'.
+        # Returns:
+        #     str: Path of the downloaded chunk, or None when yt-dlp fails.
+        try:
+            # Getting Chunk Section String
+            # A missing bound falls back to the start (0) or the end ('inf') of the media,
+            # so the section never contains the text 'None'
+            section_start = self.start_time if self.start_time else 0
+            section_end = self.end_time if self.end_time else 'inf'
+            # Getting Output Path
+            output_path = os.path.join(self.output_path, f"{self.title}.{video_format}")
+            # Getting Video Quality Integer
+            video_quality = self.__get_quality_int(video_quality)
+            # Setting Formats
+            if video_format == 'mp4':
+                video_codec  = "h264"
+                audio_codec  = "m4a"
+            elif video_format == 'webm':
+                video_codec  = "vp9"
+                audio_codec  = "opus"
+            else:
+                # os.exit() does not exist; raising keeps the failure inside the
+                # handler below, so the method still prints the error & returns None
+                raise ValueError(f'Unexpected Video Format Encountered: {video_format}')
+            # Download Command
+            command = [
+                "yt-dlp",
+                self.url,
+                "-S", f"res:{video_quality},vcodec:{video_codec},acodec:{audio_codec}",
+                "--merge-output-format", video_format,
+                "--download-sections", f"*{section_start}-{section_end}",
+                "-o", f"{output_path}",
+                "-q"
+            ]
+            print(' '.join(command))
+            # Running the command using Subprocess
+            # check=True: a non-zero yt-dlp exit must reach the except branch
+            subprocess.run(command, check=True)
+            return output_path
+        except Exception as e:
+            print(f"Error in _download_video_chunk: {e}")

summarizer.py CHANGED Viewed

@@ -415,13 +415,13 @@ class AudioBookNarration:
     def get_stuff_prompt(self):
         prompt_template = """
-            Create a {Narration_style} narration for this below text. This narration will be used for audiobook generation.
             So provide the output that is verbose, easier to understand and full of expressions.
                     {text}
                     """
         prompt = PromptTemplate(
-            template=prompt_template, input_variables=['Narration_style','text'])
         return prompt
@@ -429,29 +429,29 @@ class AudioBookNarration:
     def define_prompts(self):
         map_prompts = """
-            Create a {Narration_style} narration for this below text. This narration will be used for audiobook generation.
             So provide the output that is verbose, easier to understand and full of expressions.
                 {text}
                 """
         combine_prompt = """
             Below are the list of text that represent narration from the text.
-            Your job is to combine these narrations and craete one verbose,easier to understand and full of experssions {Narration_style} narration.
             {text}
             """
-        map_template = PromptTemplate(template=map_prompts, input_variables=['Narration_style','text']
                                       )
         combine_template = PromptTemplate(
-            template=combine_prompt, input_variables=['Narration_style','text'])
         return map_template, combine_template
         # pass
-    def define_chain(self,Narration_style=None,chain_type=None):
         docs, chain_type = self.load_docs()
@@ -470,7 +470,7 @@ class AudioBookNarration:
                 llm=llm, map_prompt=map_prompts, combine_prompt=combine_prompt, chain_type='map_reduce', verbose=False)
-        output = chain.run(Narration_style = Narration_style,input_documents = docs)
         # self.create_wordcloud(output=output)
         # display(Markdown(f"Text: {docs}"))

     def get_stuff_prompt(self):
+        # Builds the single-pass narration prompt.
+        # Returns a PromptTemplate whose input variables are 'narration_style' & 'text'.
         prompt_template = """
+            Create a {narration_style} narration for this below text. This narration will be used for audiobook generation.
             So provide the output that is verbose, easier to understand and full of expressions.
                     {text}
                     """
         prompt = PromptTemplate(
+            template=prompt_template, input_variables=['narration_style','text'])
         return prompt
     def define_prompts(self):
+        # Builds the two prompts handed to the 'map_reduce' chain:
+        # the map prompt narrates one piece of text, the combine prompt merges the narrations.
+        # Returns (map_template, combine_template); both take 'narration_style' & 'text'.
         map_prompts = """
+            Create a {narration_style} narration for this below text. This narration will be used for audiobook generation.
             So provide the output that is verbose, easier to understand and full of expressions.
                 {text}
                 """
+        # NOTE(review): the combine prompt contains typos ("craete", "experssions");
+        # left untouched here because it is runtime text sent to the model.
         combine_prompt = """
             Below are the list of text that represent narration from the text.
+            Your job is to combine these narrations and craete one verbose,easier to understand and full of experssions {narration_style} narration.
             {text}
             """
+        map_template = PromptTemplate(template=map_prompts, input_variables=['narration_style','text']
                                       )
         combine_template = PromptTemplate(
+            template=combine_prompt, input_variables=['narration_style','text'])
         return map_template, combine_template
         # pass
+    def define_chain(self,narration_style=None,chain_type=None):
         docs, chain_type = self.load_docs()
                 llm=llm, map_prompt=map_prompts, combine_prompt=combine_prompt, chain_type='map_reduce', verbose=False)
+        output = chain.run(narration_style = narration_style,input_documents = docs)
         # self.create_wordcloud(output=output)
         # display(Markdown(f"Text: {docs}"))

temp/translated_subtitles.json ADDED Viewed

	@@ -0,0 +1,227 @@

+[
+    {
+        "start":0.0,
+        "end":6.0,
+        "text":"دوسرا پہلو ٹیلی ویژن اور فلمیں اور موسیقی ہے۔"
+    },
+    {
+        "start":6.0,
+        "end":12.0,
+        "text":"اسلام کے بارے میں دلچسپ باتوں میں سے ایک یہ ہے کہ علمائے کرام کا موسیقی کے ساتھ تناؤ تھا۔"
+    },
+    {
+        "start":12.0,
+        "end":17.0,
+        "text":"کوئی بھی یہ واضح بیان نہیں دے سکتا کہ یہ مجمل ہے۔"
+    },
+    {
+        "start":17.0,
+        "end":26.0,
+        "text":"اگر آپ شوکانی اور نیل الاوطار پڑھیں تو اس کے پاس اس پر ایک سیکشن ہے اور اس میں موسیقی کے بارے میں موجود خلافت کے بارے میں بات کرتا ہے۔"
+    },
+    {
+        "start":30.0,
+        "end":38.18,
+        "text":"سماع کے بارے میں علماء کے حصے ہیں جو کہ موسیقی کی ایک مقدس قسم ہے جسے وہ اچھی چیز اور جائز سمجھتے تھے۔"
+    },
+    {
+        "start":39.0,
+        "end":46.0,
+        "text":"لیکن علمائے کرام موسیقی سے بہت محتاط تھے کیونکہ وہ سمجھتے تھے کہ موسیقی کتنی طاقتور ہے،"
+    },
+    {
+        "start":46.0,
+        "end":50.0,
+        "text":"اور یہ کتنا پرکشش ہے، اور اس کے روح پر کیا اثرات مرتب ہوتے ہیں۔"
+    },
+    {
+        "start":50.0,
+        "end":53.0,
+        "text":"یہ اصل میں قدیم یونانیوں کو واپس جاتا ہے."
+    },
+    {
+        "start":53.0,
+        "end":58.0,
+        "text":"جمہوریہ میں افلاطون، سقراط وہ آواز ہے جسے وہ استعمال کرتا ہے۔"
+    },
+    {
+        "start":60.0,
+        "end":67.0,
+        "text":"وہ دراصل جمہوریہ میں موسیقی کی کچھ اقسام کو غیر قانونی قرار دیتا ہے کیونکہ وہ روح کے لیے بہت نقصان دہ تھے۔"
+    },
+    {
+        "start":67.0,
+        "end":71.0,
+        "text":"ایتھوس تھیوری موسیقی کے اثر کا نظریہ ہے۔"
+    },
+    {
+        "start":71.0,
+        "end":79.0,
+        "text":"درحقیقت الفارابی جس نے موسیقی کی سب سے بڑی کتاب کتاب الموسیق الکبیر لکھی۔"
+    },
+    {
+        "start":79.0,
+        "end":83.0,
+        "text":"جو میری لائبریری میں ہے، یہ ایک بہت بڑی کتاب ہے، بہت بھاری۔"
+    },
+    {
+        "start":83.0,
+        "end":89.0,
+        "text":"یہ موسیقی کی سائنس پر ابتدائی سنجیدہ کاموں میں سے ایک ہے۔"
+    },
+    {
+        "start":90.0,
+        "end":103.0,
+        "text":"وہ لوگوں کو ہنسانے، رونے، نیند آنے، یا مقام کی بنیاد پر پرجوش ہونے کے قابل ہونے کے لیے جانا جاتا تھا جو وہ عود پر بجاتا تھا۔"
+    },
+    {
+        "start":104.04,
+        "end":106.0,
+        "text":"وہ لفظی طور پر لوگوں کو رلا سکتا تھا۔"
+    },
+    {
+        "start":106.0,
+        "end":107.36,
+        "text":"اور یہ اچھی طرح سے درج ہے۔"
+    },
+    {
+        "start":108.66,
+        "end":112.0,
+        "text":"اور جب لوگ کنسرٹس میں جاتے ہیں تو آپ کو یہی ملتا ہے۔"
+    },
+    {
+        "start":112.0,
+        "end":115.0,
+        "text":"وہ بہت مشتعل ہو جاتے ہیں، انہیں حرکت کرنا پڑتی ہے۔"
+    },
+    {
+        "start":115.0,
+        "end":117.0,
+        "text":"وہ نہیں جانتے کیوں، لیکن انہیں منتقل ہونا پڑے گا."
+    },
+    {
+        "start":120.0,
+        "end":127.0,
+        "text":"آوازوں کے شیطانی اثرات ہوتے ہیں، اور پھر فرشتے کے اثرات ہوتے ہیں جو آوازوں کے ہوتے ہیں۔"
+    },
+    {
+        "start":127.0,
+        "end":133.0,
+        "text":"اور یوں علمائے کرام آواز کے شیطانی اثرات کے بارے میں بہت فکر مند تھے۔"
+    },
+    {
+        "start":134.08,
+        "end":141.0,
+        "text":"اور وہ سمجھ گئے کہ جن چیزوں کو شیاطین ہمیشہ استعمال کرتے رہے ہیں وہ موسیقی ہے لوگوں کو اپنی طرف راغب کرنے کے لیے۔"
+    },
+    {
+        "start":141.0,
+        "end":146.34,
+        "text":"درحقیقت داؤد علیہ السلام کے بارے میں حدیث میں ہے کہ جنہوں نے زبور گایا،"
+    },
+    {
+        "start":150.0,
+        "end":153.0,
+        "text":"یہ روحانی نہیں تھا، لیکن یہ فرشتہ تھا۔"
+    },
+    {
+        "start":153.46,
+        "end":158.0,
+        "text":"شیطان نے ایک چھوٹا سا بینڈ اکٹھا کیا، اور اس نے اسے سڑک کے کنارے رکھ دیا،"
+    },
+    {
+        "start":158.0,
+        "end":162.78,
+        "text":"اور لوگ داؤد کو سننے کے لیے جاتے تھے اور شیطان کے ٹولے کو سنتے تھے۔"
+    },
+    {
+        "start":163.0,
+        "end":166.0,
+        "text":"اور وہ داؤد کو بھول جائیں گے۔"
+    },
+    {
+        "start":166.0,
+        "end":170.0,
+        "text":"اور یوں یہ وہ تناؤ تھا جو علمائے کرام کو تھا، اور یہ بہت ضروری ہے کہ یہ تناؤ موجود رہے،"
+    },
+    {
+        "start":170.08,
+        "end":175.0,
+        "text":"کیونکہ کوئی بھی یہ بیان نہیں کر سکتا کہ موسیقی مکمل طور پر حرام ہے،"
+    },
+    {
+        "start":175.0,
+        "end":178.0,
+        "text":"اور کوئی بھی یہ نہیں کہہ سکتا کہ یہ حلال ہے۔"
+    },
+    {
+        "start":180.0,
+        "end":185.0,
+        "text":"اور مسلمان اس چیز میں کبھی زیادہ دور نہیں جاتے، کیونکہ اب آپ مغرب میں دیکھتے ہیں،"
+    },
+    {
+        "start":185.46,
+        "end":189.0,
+        "text":"لوگ ہر وقت موسیقی سنتے ہیں، ان کے پاس نہیں ہے، وہ ہمیشہ پلگ ان ہوتے ہیں۔"
+    },
+    {
+        "start":189.0,
+        "end":190.84,
+        "text":"وہ اپنی گاڑی میں بیٹھتے ہیں، وہ میوزک آن کرتے ہیں۔"
+    },
+    {
+        "start":191.0,
+        "end":195.0,
+        "text":"وہ چلتے ہیں، وہ اپنے ائرفون لگاتے ہیں، اور وہ اپنی موسیقی سنتے ہیں،"
+    },
+    {
+        "start":195.0,
+        "end":199.0,
+        "text":"اور لوگوں کے پاس لمبی پلے لسٹ ہوتی ہے، وہ ان چیزوں پر بہت پیسہ خرچ کرتے ہیں،"
+    },
+    {
+        "start":199.0,
+        "end":204.0,
+        "text":"اور اس طرح وہ کھو گئے ہیں، ان کے پاس مزید سوچنے کا وقت نہیں ہے،"
+    },
+    {
+        "start":204.0,
+        "end":206.0,
+        "text":"کیونکہ ان کی زندگی آوازوں سے بھری ہوئی ہے۔"
+    },
+    {
+        "start":210.0,
+        "end":215.0,
+        "text":"جو ان کے پاس پہلے کبھی نہیں تھا، اور وہ انہیں بہت مؤثر طریقے سے استعمال کر رہے ہیں۔"
+    },
+    {
+        "start":215.3,
+        "end":221.0,
+        "text":"اور بدقسمتی سے ہم حق کے لوگ ان کا مؤثر استعمال نہیں کر رہے ہیں۔"
+    },
+    {
+        "start":221.0,
+        "end":222.0,
+        "text":"اور اللہ فرماتا ہے"
+    },
+    {
+        "start":226.0,
+        "end":229.0,
+        "text":"ان اوزاروں سے لڑو جن سے آپ لڑ رہے ہیں۔"
+    },
+    {
+        "start":229.0,
+        "end":234.0,
+        "text":"اس دور کا جہاد کانوں کے درمیان ہے۔"
+    },
+    {
+        "start":234.0,
+        "end":238.0,
+        "text":"اس دور کا جہاد کانوں کے درمیان ہے۔"
+    },
+    {
+        "start":240.0,
+        "end":245.0,
+        "text":"میدان جنگ انسانوں کا دماغ ہے اور وسعت کے لحاظ سے دل۔"
+    }
+]

temp/translated_transcript.txt ADDED Viewed

	@@ -0,0 +1 @@

+ دوسرا پہلو ٹیلی ویژن، فلمیں اور موسیقی ہے. اسلام کے بارے میں ایک دلچسپ بات یہ ہے کہ علماء کی موسیقی کے ساتھ کشیدگی تھی. کوئی بھی یہ بات واضح نہیں کر سکتا کہ یہ مجمل علی ہے. اگر آپ شوکانی اور نائل الاوطار پڑھتے ہیں تو اس کے پاس اس پر ایک سیکشن ہے اور وہ موسیقی کے بارے میں موجود خلافت کے بارے میں بات کرتا ہے. علماء کے پاس سما کے بارے میں سیکشن ہیں، جو ایک مقدس قسم کی موسیقی ہے جو ان کے خیال میں ایک اچھی چیز اور جائز ہے. لیکن علماء موسیقی سے بہت محتاط تھے کیونکہ وہ سمجھتے تھے کہ موسیقی کتنی طاقتور ہے اور کتنی دلکش ہے، اور روح پر اس کے اثرات. یہ اصل میں قدیم یونانیوں سے واپس جاتا ہے. جمہوریہ میں افلاطون، سقراط وہ آواز ہے جو وہ استعمال کرتا ہے. وہ اصل میں جمہوریہ میں موسیقی کی کچھ اقسام کو غیر قانونی قرار دیتا ہے کیونکہ وہ روح کے لئے بہت نقصان دہ تھے. ایتوس تھیوری اس اثر کا نظریہ ہے کہ موسیقی. دراصل، الفارابی، جس نے کتب الموسيق الكبير لکھی، موسیقی کی بڑی کتاب، جو میرے پاس اپنی لائبریری میں ہے، یہ ایک بہت بڑی کتاب ہے، بہت بھاری. یہ موسیقی کے علم پر سب سے پہلے سنجیدہ کام میں سے ایک ہے. وہ لوگوں کو ہنسنے ، رونے ، نیند آنے یا شوق سے کھیلنے کے قابل ہونے کے لئے جانا جاتا تھا. وہ لفظی طور پر لوگوں کو روانا کر سکتا تھا. اور یہ اچھی طرح ریکارڈ کیا گیا ہے. اور یہ آپ کو ملتا ہے جب لوگ کنسرٹ پر جاتے ہیں. وہ بہت پریشان ہو جاتے ہیں، انہیں منتقل کرنا پڑتا ہے. وہ نہیں جانتے کیوں، لیکن وہ منتقل کرنا ہے. آوازوں کے شیطانی اثرات ہوتے ہیں، اور پھر فرشتے بھی ہوتے ہیں جن کے اثرات ہوتے ہیں. اور اس لئے علماء کو آواز کے شیطانی اثرات سے بہت فکر مند تھے. اور وہ سمجھ گئے کہ جنات نے ہمیشہ لوگوں کو دور کرنے کے لئے موسیقی کا استعمال کیا ہے. دراصل، داؤد، سلام ہو اس پر، جو زبور گاتا تھا کے بارے میں حدیث میں، یہ روحانی نہیں تھا، لیکن یہ فرشتہ تھا. شیطان نے ایک چھوٹا سا بینڈ اکٹھا کیا اور اس نے اسے سڑک کے کنارے رکھا اور لوگ جو داؤد کو سننے کے لئے جا رہے تھے وہ رک کر شیطان کے بینڈ کو سنتے تھے اور وہ داؤد کو بھول جاتے تھے. 
اور تو یہ کشیدگی تھی جو علماء نے کی تھی، اور یہ بہت اہم ہے کہ کشیدگی موجود ہے کیونکہ کوئی بھی ایک جامع بیان نہیں دے سکتا کہ موسیقی مکمل طور پر حرام ہے، اور کوئی بھی ایک جامع بیان نہیں دے سکتا کہ یہ حلال ہے. اور مسلمانوں کو کبھی بھی اس چیز میں بہت زیادہ نہیں جانا کیونکہ اب آپ دیکھ سکتے ہیں کہ مغرب میں لوگ ہر وقت موسیقی سنتے ہیں، ان کے پاس نہیں ہے، وہ ہمیشہ پلگ ان ہیں. وہ اپنی گاڑیوں میں جاتے ہیں، وہ موسیقی کو چالو کرتے ہیں. وہ چلتے ہیں، وہ اپنے کانوں میں رکھتے ہیں، اور وہ اپنی موسیقی سنتے ہیں، اور لوگوں کے پاس لمبی پلے لسٹس ہیں، وہ ان چیزوں پر بہت پیسہ خرچ کرتے ہیں، اور اس طرح وہ کھو گئے ہیں، ان کے پاس سوچنے کے لئے زیادہ مفت وقت نہیں ہے کیونکہ ان کی زندگی ایسی آواز سے بھری ہوئی ہے جو ان کے پاس پہلے کبھی نہیں تھی، اور وہ ان کا استعمال بہت مؤثر طریقے سے کر رہے ہیں. اور ہم، بدقسمتی سے، حق کے لوگ، ان کا مؤثر طریقے سے استعمال نہیں کر رہے ہیں بالکل. اور اللہ تعالیٰ فرماتا ہے، "جو اوزار سے تم لڑ رہے ہو ان سے لڑو. اس زمانے کا جہاد کانوں کے درمیان ہے. اس زمانے کا جہاد کانوں کے درمیان ہے. میدانِ جنگ انسانوں کا ذہن ہے اور اس کے علاوہ دل بھی. ".

translation.py ADDED Viewed

	@@ -0,0 +1,127 @@

+import os
+import openai
+import locale
+# Overrides the preferred-encoding lookup so it always reports UTF-8; this runs before dl_translate is imported.
+# NOTE(review): presumably a workaround for hosts whose default locale is not UTF-8 - confirm it is still needed.
+locale.getpreferredencoding = lambda: "UTF-8"
+import dl_translate as dlt
+from deep_translator import GoogleTranslator
+from languages import LANGUAGES
+OPENAI_API_KEY = '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'
+OPENAI_API_URL = 'https://api.openai.com/v1/chat/completions'
+openai.api_key = OPENAI_API_KEY
+class Translation:
+    def __init__(self, transcript_dict, source_lang, target_lang, output_path):
+        self.transcript_dict = transcript_dict
+        self.output_path = os.path.join(os.getcwd(), output_path)
+        # Languages
+        self.source_lang = source_lang  # Whisper Detected Language
+        self.target_lang = target_lang
+        # Transcript
+        self.transcript = transcript_dict['text'].strip()
+        self.subtitles = self.__get_subtitles()
+        # Translation Model
+        nllb_model = 'facebook/nllb-200-distilled-600M'
+        # nllb_model = 'facebook/nllb-200-1.3B'
+        # nllb_model = 'facebook/nllb-200-3.3B'
+        # nllb_model = 'facebook/nllb-moe-54b'
+        self.nllb = dlt.TranslationModel(nllb_model)
+    def __get_subtitles(self):
+        '''
+        Returns the subtitles from transcript dictionary
+        '''
+        subtitles = []
+        for s in self.transcript_dict['segments']:
+            segment = {
+                'start': s['start'],
+                'end': s['end'],
+                'text': s['text'].strip()
+            }
+            subtitles.append(segment)
+        return subtitles
+    def __correct_punctuation_gpt(self):
+        '''
+        Corrects the Punctuation from GPT
+        '''
+        system_prompt = """
+        You are a helpful NLP assistant.
+        Your task is to identify language of the provided text,
+        correct any spelling discrepancies in the transcribed text
+        as well as add punctuation in the multilingual text if they are missing.
+        Only add necessary punctuation such as periods, commas, and capitalization,
+        and use only the context provided.
+        You response should be as follows:
+        Corrected Text:
+        Here goes the corrected text with punctuation.
+        """
+        user_prompt = f"""
+        Here is the text:
+        {self.transcript}
+        """
+        response = openai.ChatCompletion.create(
+            model="gpt-3.5-turbo",
+            messages=[
+                {"role": "system", "content": system_prompt},
+                {"role": "user", "content": user_prompt},
+            ]
+        )
+        text = response.choices[0].message.content.replace('Corrected Text:\n', '')
+        return text
+    def get_translated_transcript(self):
+        '''
+        Translates the transcript into required language
+        '''
+        # Correcting Punctuation using GPT
+        transcript = self.__correct_punctuation_gpt()
+        # Splitting Text into Sentences
+        if self.source_lang in ['ar', 'ur']:
+            splitter = '۔'
+        else:
+            splitter = '.'
+        sentences = transcript.split(splitter)
+        # Getting Translation using NLLB
+        translated_transcript = ''
+        for sentence in sentences:
+            translated_sentence = self.nllb.translate(sentence, source=LANGUAGES[self.source_lang], target=LANGUAGES[self.target_lang])
+            translated_transcript += translated_sentence + splitter + ' '
+            # print('Text:', sentence)
+            # print('Text:', translated_sentence)
+            # print()
+        translated_transcript = translated_transcript.strip()
+        return translated_transcript
+    def get_translated_subtitles(self):
+        '''
+        Translates the subtitles into required language
+        '''
+        # Creating copy of Transcript Dictionary
+        subtitles = self.subtitles.copy()
+        # Creating Instance for Google Translator
+        gt = GoogleTranslator(source='auto', target=self.target_lang)
+        for i, s in enumerate(subtitles):
+            subtitles[i]['text'] = gt.translate(text=s['text'])
+        return subtitles