from typing import Optional

import gradio as gr
import nemo.collections.asr as nemo_asr
# Load the pretrained "QuartzNet15x5Base-En" checkpoint once, at module import,
# so that `transcribe` reuses this single model instance on every call.
asr_model = nemo_asr.models.ASRModel.from_pretrained(model_name="QuartzNet15x5Base-En")
def transcribe(audio: Optional[str]) -> str:
    """Transcribe a single audio file with the module-level ``asr_model``.

    Args:
        audio: Path of the audio file to transcribe. ``None`` or an empty
            string is treated as "no input".

    Returns:
        The first entry of the model's transcription result, or ``""`` when
        no audio was supplied.
    """
    # Presumably the UI can submit without a recording/upload, in which case
    # the value is None -- TODO confirm. Return early instead of handing an
    # invalid path to the model.
    if not audio:
        return ""

    # The file list is passed positionally on purpose: it is the first
    # parameter of `transcribe`, so the call does not depend on that
    # parameter's keyword name (`paths2audio_files` in the original call).
    results = asr_model.transcribe([audio])
    first = results[0]

    # NOTE(review): some NeMo releases appear to return hypothesis objects
    # exposing `.text` rather than plain strings -- confirm against the
    # installed version. Plain strings have no `.text` and pass through as-is.
    return getattr(first, "text", first)
# Ask Gradio for the recording as a file path: `transcribe` forwards its
# argument to the model as a path, whereas the plain "audio" shortcut uses the
# Audio component's default payload type (a (sample_rate, samples) tuple in
# current Gradio releases).
interface = gr.Interface(
    fn=transcribe,
    inputs=gr.Audio(type="filepath"),
    outputs="text",
)
# Start the web UI when the script runs.
interface.launch()