Spaces:

Vira21
/

Whisper-Base-KhmerV2

Sleeping

Vira21 committed on Nov 6, 2024

Commit

f16c081

verified ·

1 Parent(s): 5ede744

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,7 +1,39 @@
-import torch
 import gradio as gr
-from huggingface_hub import model_info
-interface = gr.load("models/Vira21/Whisper-Base-KhmerV2")
-interface.launch()

 import gradio as gr
+from transformers import pipeline
+import torch
+import spaces
+# Load the Whisper model pipeline for speech recognition with optimizations
+model_name = "Vira21/Whisper-Base-KhmerV2"
+whisper_pipeline = pipeline(
+    "automatic-speech-recognition",
+    model=model_name,
+    device="cuda" if torch.cuda.is_available() else "CPU"
+)
+def transcribe_audio(audio):
+    try:
+        if audio is None:
+            return "No audio provided. Please upload an audio file or record your voice."
+        # Process and transcribe the audio
+        result = whisper_pipeline(audio)["text"]
+        return result
+    except Exception as e:
+        # Handle errors and return an error message
+        return f"An error occurred during transcription: {str(e)}"
+# Build the Gradio UI: one audio input (type="filepath") wired to transcribe_audio and one text output. NOTE(review): the title says "Whisper Small" but model_name is "Vira21/Whisper-Base-KhmerV2" - confirm which is intended.
+interface = gr.Interface(
+    fn=transcribe_audio,
+    inputs=gr.Audio(type="filepath"),
+    outputs="text",
+    title="OpenAI Whisper Small KHMER-ENGLISH Speech-to-Text",
+    description="Upload an audio file or record your voice to get the transcription.",
+    examples=[["Example Audio/126.wav"], ["Example Audio/tomholland28282.wav"]],
+    allow_flagging="never"  # Turn off the flagging feature for this interface
+)
+# Start the app only when this file is run as a script. NOTE(review): no explicit .queue() call is made here, so any queueing relies on Gradio's default behavior - confirm for the installed version.
+if __name__ == "__main__":
+    interface.launch()