import gradio as gr model = gr.Interface.load("huggingface/pyannote/voice-activity-detection") def inference(audio_file): output = model(audio_file) inputs = gr.inputs.Audio(label="Input Audio", type="filepath", source="microphone") outputs = gr.outputs.Label(type="auto", label = "Voice timestamps") title = "Voice Activity Detection" description = "Record or upload an audio file and detected human voices will be timestamped." article = "