Lagyamfi committed
Commit db6bb35 · 1 Parent(s): c993592

fix issue with reload of output video

Files changed (2)
  1. app.py +17 -3
  2. pipeline.py +11 -4
app.py CHANGED
@@ -1,5 +1,7 @@
 import gradio as gr
 from tqdm.asyncio import tqdm_asyncio
+import os
+import time
 
 from pipeline import (
     extract_audio_from_video,
@@ -20,7 +22,18 @@ async def process_video_translation(
 
     total_stages = 6
 
-    output_video = f"{input_video.split('.')[0]}_translated.mp4"
+    # add time stamp to output video
+    timestamp = time.strftime("%M%S")
+    output_video = f"{input_video.split('.')[0]}_dubbed_{timestamp}.mp4"
+
+    # delete the output video if it exists
+    try:
+        os.remove(output_video)
+        print(f"Deleted existing output video: {output_video}")
+    except FileNotFoundError:
+        print(f"No existing output video found: {output_video}")
+        pass
+
     with tqdm_asyncio(total=total_stages, desc="Processing video translation") as pbar:
 
         # stage 1: extract audio from video
@@ -47,12 +60,13 @@ async def process_video_translation(
         pbar.update(1)
 
         progress(1.0, desc="Combining audio and video")
-        create_combined_output(input_video, output_audio, output_video)
+        output_video = create_combined_output(input_video, output_audio, output_video)
         pbar.update(1)
 
         print("Video translation completed")
        gr.Info(f"Video translation completed", duration=2)
 
+    print(f"Output video: {output_video}")
     return output_video
 
 
@@ -86,7 +100,7 @@ with gr.Blocks(
     """
     <div style="display: flex; align-items: center; justify-content: center;">
         <h1 style="font-size: 2em; font-weight: bold; margin-top: 1em;">
-            Video Dubbing Interface
+            African Language Video Dubbing POC
         </h1>
     </div>
 
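Note on the app.py change: writing every run to the same `*_translated.mp4` path meant the UI could keep showing a cached copy of the previous output. Suffixing the filename with a per-run timestamp (and removing any leftover file of the same name) gives each run a fresh path, and `create_combined_output` now returns the path that is actually handed back to Gradio. A minimal sketch of that naming pattern as a standalone helper; the helper name `build_output_path`, the `os.path.splitext` handling, and the default suffix are illustrative, not code from this repo:

```python
import os
import time


def build_output_path(input_video: str, suffix: str = "dubbed") -> str:
    """Build a per-run output filename so the player never reuses a stale file."""
    # splitext is used here instead of split('.') so paths with extra dots survive.
    base, _ = os.path.splitext(input_video)
    timestamp = time.strftime("%M%S")
    output_video = f"{base}_{suffix}_{timestamp}.mp4"

    # Clear any leftover file from an earlier run that happened to get the same name.
    try:
        os.remove(output_video)
    except FileNotFoundError:
        pass

    return output_video
```

A minute-and-second stamp can still collide if two runs start within the same second; `time.strftime("%Y%m%d-%H%M%S")` or `uuid.uuid4().hex` would be stricter at the cost of longer filenames.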
 
pipeline.py CHANGED
@@ -90,7 +90,7 @@ async def translation_main(sentences, url, headers, lang):
 
 
 async def convert_text_to_speech(
-    session, tts_url, tts_header, text, speaker, semaphore, output_dir
+    session, tts_url, tts_header, text, text_index, speaker, semaphore, output_dir
 ):
     speaker_dict = {"male": "twi_speaker_5", "female": "twi_speaker_7"}
     speaker_id = speaker_dict[speaker]
@@ -100,7 +100,7 @@ async def convert_text_to_speech(
     async with semaphore:
         async with session.post(tts_url, headers=tts_header, json=data) as response:
             response.raise_for_status()
-            output_path = os.path.join(output_dir, f"{text[:4]}_tts.wav")
+            output_path = os.path.join(output_dir, f"{text_index}_tts.wav")
             async with aiofiles.open(output_path, "wb") as file:
                 while True:
                     chunk = await response.content.read(16384)
@@ -120,9 +120,16 @@ async def tts_main(khaya_translations, speaker):
     semaphore = asyncio.Semaphore(3)
     tasks = [
         convert_text_to_speech(
-            session, tts_url, tts_header, sent, speaker, semaphore, temp_dir
+            session,
+            tts_url,
+            tts_header,
+            sent,
+            text_index,
+            speaker,
+            semaphore,
+            temp_dir,
         )
-        for sent in khaya_translations
+        for text_index, sent in enumerate(khaya_translations)
     ]
     output_files = []
     for task in tqdm(
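Note on the pipeline.py change: naming each TTS chunk after the first four characters of its sentence (`f"{text[:4]}_tts.wav"`) collides whenever two sentences share the same opening characters, and those characters are not guaranteed to be filename-safe. Keying the chunks by their `enumerate` index instead gives a unique name per sentence and sorts the files back into sentence order. A self-contained sketch of that fan-out pattern; `fake_tts`, `synthesize_all`, and the plain `open()` write are stand-ins for the real Khaya TTS request and `aiofiles`, used only to keep the example runnable:

```python
import asyncio
import os


async def fake_tts(sentence: str) -> bytes:
    # Stand-in for the real TTS request; only simulates network latency.
    await asyncio.sleep(0.1)
    return sentence.encode("utf-8")


async def synthesize_all(sentences, output_dir, max_concurrent=3):
    # Broadly the same shape as tts_main: cap concurrency with a semaphore,
    # fan out one task per sentence, and name each output file by its index.
    semaphore = asyncio.Semaphore(max_concurrent)

    async def worker(index: int, sentence: str) -> str:
        async with semaphore:
            audio = await fake_tts(sentence)
        # An index is unique per sentence and keeps the chunks in order,
        # unlike a text prefix, which can repeat across sentences.
        path = os.path.join(output_dir, f"{index}_tts.wav")
        with open(path, "wb") as handle:
            handle.write(audio)
        return path

    tasks = [worker(i, sentence) for i, sentence in enumerate(sentences)]
    return await asyncio.gather(*tasks)


if __name__ == "__main__":
    os.makedirs("tts_out", exist_ok=True)
    files = asyncio.run(synthesize_all(["Sentence one.", "Sentence two."], "tts_out"))
    print(files)
```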