Update app.py
Browse files
app.py
CHANGED
@@ -27,7 +27,7 @@ canary_model.change_decoding_strategy(decode_cfg)
|
|
27 |
# tts_tokenizer = AutoTokenizer.from_pretrained("facebook/mms-tts-eng")
|
28 |
|
29 |
# Function to convert audio to text using ASR
|
30 |
-
def gen_text(audio_filepath, action):
|
31 |
if audio_filepath is None:
|
32 |
raise gr.Error("Please provide some input audio.")
|
33 |
|
@@ -45,8 +45,8 @@ def gen_text(audio_filepath, action):
|
|
45 |
manifest_data = {
|
46 |
"audio_filepath": converted_audio_filepath,
|
47 |
"taskname": action,
|
48 |
-
"source_lang":
|
49 |
-
"target_lang":
|
50 |
"pnc": "no",
|
51 |
"answer": "predict",
|
52 |
"duration": str(duration),
|
@@ -92,11 +92,11 @@ def gen_speech(text, lang):
|
|
92 |
|
93 |
# Root function for Gradio interface
|
94 |
def start_process(audio_filepath, source_lang, target_lang):
|
95 |
-
transcription = gen_text(audio_filepath, "asr")
|
96 |
print("Done transcribing")
|
97 |
-
translation = gen_text(audio_filepath, "s2t_translation")
|
98 |
print("Done translation")
|
99 |
-
audio_output_filepath = gen_speech(
|
100 |
print("Done speaking")
|
101 |
return transcription, translation, audio_output_filepath
|
102 |
|
|
|
27 |
# tts_tokenizer = AutoTokenizer.from_pretrained("facebook/mms-tts-eng")
|
28 |
|
29 |
# Function to convert audio to text using ASR
|
30 |
+
def gen_text(audio_filepath, action, source_lang, target_lang):
|
31 |
if audio_filepath is None:
|
32 |
raise gr.Error("Please provide some input audio.")
|
33 |
|
|
|
45 |
manifest_data = {
|
46 |
"audio_filepath": converted_audio_filepath,
|
47 |
"taskname": action,
|
48 |
+
"source_lang": source_lang,
|
49 |
+
"target_lang": source_lang if action=="asr" else target_lang,
|
50 |
"pnc": "no",
|
51 |
"answer": "predict",
|
52 |
"duration": str(duration),
|
|
|
92 |
|
93 |
# Root function for Gradio interface
|
94 |
def start_process(audio_filepath, source_lang, target_lang):
|
95 |
+
transcription = gen_text(audio_filepath, "asr", source_lang, target_lang)
|
96 |
print("Done transcribing")
|
97 |
+
translation = gen_text(audio_filepath, "s2t_translation", source_lang, target_lang)
|
98 |
print("Done translation")
|
99 |
+
audio_output_filepath = gen_speech(translation, target_lang)
|
100 |
print("Done speaking")
|
101 |
return transcription, translation, audio_output_filepath
|
102 |
|