rayl-aoit committed on
Commit
e796a00
1 Parent(s): 1180d04

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -6
app.py CHANGED
@@ -27,7 +27,7 @@ canary_model.change_decoding_strategy(decode_cfg)
27
  # tts_tokenizer = AutoTokenizer.from_pretrained("facebook/mms-tts-eng")
28
 
29
  # Function to convert audio to text using ASR
30
- def gen_text(audio_filepath, action):
31
  if audio_filepath is None:
32
  raise gr.Error("Please provide some input audio.")
33
 
@@ -45,8 +45,8 @@ def gen_text(audio_filepath, action):
45
  manifest_data = {
46
  "audio_filepath": converted_audio_filepath,
47
  "taskname": action,
48
- "source_lang": "en",
49
- "target_lang": "en" if action=="asr" else "fr",
50
  "pnc": "no",
51
  "answer": "predict",
52
  "duration": str(duration),
@@ -92,11 +92,11 @@ def gen_speech(text, lang):
92
 
93
  # Root function for Gradio interface
94
  def start_process(audio_filepath, source_lang, target_lang):
95
- transcription = gen_text(audio_filepath, "asr")
96
  print("Done transcribing")
97
- translation = gen_text(audio_filepath, "s2t_translation")
98
  print("Done translation")
99
- audio_output_filepath = gen_speech(transcription, target_lang)
100
  print("Done speaking")
101
  return transcription, translation, audio_output_filepath
102
 
 
27
  # tts_tokenizer = AutoTokenizer.from_pretrained("facebook/mms-tts-eng")
28
 
29
  # Function to convert audio to text using ASR
30
+ def gen_text(audio_filepath, action, source_lang, target_lang):
31
  if audio_filepath is None:
32
  raise gr.Error("Please provide some input audio.")
33
 
 
45
  manifest_data = {
46
  "audio_filepath": converted_audio_filepath,
47
  "taskname": action,
48
+ "source_lang": source_lang,
49
+ "target_lang": source_lang if action=="asr" else target_lang,
50
  "pnc": "no",
51
  "answer": "predict",
52
  "duration": str(duration),
 
92
 
93
  # Root function for Gradio interface
94
  def start_process(audio_filepath, source_lang, target_lang):
95
+ transcription = gen_text(audio_filepath, "asr", source_lang, target_lang)
96
  print("Done transcribing")
97
+ translation = gen_text(audio_filepath, "s2t_translation", source_lang, target_lang)
98
  print("Done translation")
99
+ audio_output_filepath = gen_speech(translation, target_lang)
100
  print("Done speaking")
101
  return transcription, translation, audio_output_filepath
102