Spaces:

amirza
/

draw_me_a_sheep_heb

Runtime error

Amir Zait committed on Aug 18, 2022

Commit

d8ec8f4

•

1 Parent(s): 077c45d

fixed bugs

Files changed (1) hide show

app.py CHANGED Viewed

@@ -54,12 +54,12 @@ def parse_transcription(wav_file):
     convert(wav_file.name, filename + "16k.wav")
     speech, _ = sf.read(filename + "16k.wav")
     print(speech.shape)
-    input_values = trans_processor(speech, sampling_rate=16_000, return_tensors="pt").input_values
-    logits = trans_model(input_values).logits
     predicted_ids = torch.argmax(logits, dim=-1)
-    transcription = trans_processor.decode(predicted_ids[0], skip_special_tokens=True)
     translated = he_en_translator(trasncription)
-    return transcription
 output = gr.outputs.Textbox(label="TEXT")
 input_mic = gr.inputs.Audio(source="microphone", type="file", optional=True)
@@ -70,5 +70,5 @@ gr.Interface(parse_transcription, inputs=[input_mic],  outputs=output,
              show_tips=False,
              theme='huggingface',
              layout='horizontal',
-             title="Draw Me A Ship in Hebrew",
              enable_queue=True).launch(inline=False)

     convert(wav_file.name, filename + "16k.wav")
     speech, _ = sf.read(filename + "16k.wav")
     print(speech.shape)
+    input_values = asr_processor(speech, sampling_rate=16_000, return_tensors="pt").input_values
+    logits = asr_model(input_values).logits
     predicted_ids = torch.argmax(logits, dim=-1)
+    transcription = asr_processor.decode(predicted_ids[0], skip_special_tokens=True)
     translated = he_en_translator(trasncription)
+    return translated
 output = gr.outputs.Textbox(label="TEXT")
 input_mic = gr.inputs.Audio(source="microphone", type="file", optional=True)
              show_tips=False,
              theme='huggingface',
              layout='horizontal',
+             title="Draw Me A Sheep in Hebrew",
              enable_queue=True).launch(inline=False)