allandclive committed
Commit 2df5a70 · 1 parent: 22a0e2a

Update stitched_model.py

Files changed (1)
  1. stitched_model.py  +1 -1
stitched_model.py CHANGED
@@ -16,7 +16,7 @@ class CombinedModel(nn.Module):
     # Use stt_model to transcribe the audio to text
     device = self.device
     audio = torch.tensor(batch["audio"][0]).to(self.device)
-    input_features = self.stt_processor(audio, sampling_rate=16000, return_tensors="pt", max_length=300000, padding=True, truncation=True)
+    input_features = self.stt_processor(audio, sampling_rate=16000, return_tensors="pt", max_length=220000, padding=True, truncation=True)
     stt_output = self.stt_model(input_features.input_values.to(device), attention_mask=input_features.attention_mask.to(device))
     transcription = self.stt_processor.decode(torch.squeeze(stt_output.logits.argmax(axis=-1)).to(device))
     input_nmt_tokens = self.nmt_tokenizer(transcription, return_tensors="pt", padding=True, truncation=True)
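
The only change is the processor's max_length cap, lowered from 300000 to 220000. Assuming stt_processor is a Wav2Vec2-style processor operating on raw 16 kHz samples, the new cap corresponds to roughly 13.75 s of audio (down from about 18.75 s), and longer clips are truncated before the STT forward pass. A minimal sketch of that truncation behavior, using a placeholder checkpoint rather than the repo's actual model:

# Sketch only: shows how max_length/truncation bound the raw-audio input
# to the STT processor. The checkpoint below is a placeholder assumption,
# not necessarily the processor used in stitched_model.py.
import numpy as np
from transformers import Wav2Vec2Processor

processor = Wav2Vec2Processor.from_pretrained("facebook/wav2vec2-base-960h")

# 20 s of silence at 16 kHz -> 320000 samples, longer than the new cap.
audio = np.zeros(320_000, dtype=np.float32)

features = processor(
    audio,
    sampling_rate=16000,
    return_tensors="pt",
    max_length=220_000,   # new cap: 220000 samples ~= 13.75 s at 16 kHz
    padding=True,
    truncation=True,
)
print(features.input_values.shape)  # (1, 220000): input truncated to max_length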