Update app.py
Browse files
app.py
CHANGED
@@ -5,7 +5,7 @@ from transformers import pipeline, WhisperForConditionalGeneration, WhisperProce
|
|
# Select the execution device for the transformers pipeline:
# 0 = first CUDA GPU, -1 = CPU (the pipeline API's device convention).
device = 0 if torch.cuda.is_available() else -1

# Load the quantized Whisper large-v3 checkpoint and its processor.
# NOTE: from_pretrained downloads from the Hugging Face Hub on first run.
model_id = "riteshkr/quantized-whisper-large-v3"
model = WhisperForConditionalGeneration.from_pretrained(model_id)
processor = WhisperProcessor.from_pretrained(model_id)

# Force English transcription (rather than letting Whisper auto-detect
# the language) via decoder prompt ids.
forced_decoder_ids = processor.get_decoder_prompt_ids(language="english", task="transcribe")
|
|
|
|
|
|
|
|
|
|
|
|
17 |
|
18 |
# Define the transcription function
|
19 |
def transcribe_speech(filepath):
|
|
|
# Select the execution device for the transformers pipeline:
# 0 = first CUDA GPU, -1 = CPU (the pipeline API's device convention).
device = 0 if torch.cuda.is_available() else -1

# Load the quantized Whisper large-v3 checkpoint and its processor.
# NOTE: from_pretrained downloads from the Hugging Face Hub on first run.
model_id = "riteshkr/quantized-whisper-large-v3"
model = WhisperForConditionalGeneration.from_pretrained(model_id)
processor = WhisperProcessor.from_pretrained(model_id)

# Force English transcription (rather than letting Whisper auto-detect
# the language) via decoder prompt ids.
# NOTE(review): forced_decoder_ids is not passed to the pipeline below —
# confirm it is supplied at call time (e.g. via generate_kwargs), otherwise
# the English forcing has no effect.
forced_decoder_ids = processor.get_decoder_prompt_ids(language="english", task="transcribe")

# Build the ASR pipeline. The tokenizer and feature extractor are taken
# from the processor explicitly, since the quantized checkpoint does not
# resolve them automatically by model id.
pipe = pipeline(
    "automatic-speech-recognition",
    model=model,
    tokenizer=processor.tokenizer,                     # processor's tokenizer
    feature_extractor=processor.feature_extractor,     # processor's feature extractor
    device=device,
)
24 |
|
25 |
# Define the transcription function
|
26 |
def transcribe_speech(filepath):
|