Mishmosh committed on
Commit
2cdf061
·
1 Parent(s): a9549d0

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +29 -0
app.py CHANGED
@@ -274,5 +274,34 @@ print(summarized_text)
274
  #print(summarized_text_list_list)
275
  #print(number_of_sentences)
276
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
277
 
 
 
 
 
 
 
 
 
 
278
 
 
274
  #print(summarized_text_list_list)
275
  #print(number_of_sentences)
276
 
277
+ #text to speech
278
+ #!pip install git+https://github.com/huggingface/transformers.git
279
+ #!pip install datasets sentencepiece
280
+ import torch
281
+ #import soundfile as sf
282
+ #from IPython.display import Audio
283
+ from datasets import load_dataset
284
+ from transformers import pipeline
285
+ from transformers import SpeechT5Processor, SpeechT5ForTextToSpeech
286
+ processor = SpeechT5Processor.from_pretrained("microsoft/speecht5_tts")
287
+ model = SpeechT5ForTextToSpeech.from_pretrained("microsoft/speecht5_tts")
288
+ #text = "The future belongs to those who believe in the beauty of their dreams."
289
+ #text = (summarized_text_list_list)
290
+ text = (summarized_text)
291
+
292
+ #inputs = processor(text=summarized_text_list_list, return_tensors="pt")
293
+ #inputs = processor("Michelletest", return_tensors="pt")
294
+ inputs = processor(text, return_tensors="pt")
295
+ from datasets import load_dataset
296
+ embeddings_dataset = load_dataset("Matthijs/cmu-arctic-xvectors", split="validation")
297
 
298
+ import torch
299
+ speaker_embeddings = torch.tensor(embeddings_dataset[7306]["xvector"]).unsqueeze(0)
300
+ spectrogram = model.generate_speech(inputs["input_ids"], speaker_embeddings)
301
+ from transformers import SpeechT5HifiGan
302
+ vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
303
+ with torch.no_grad():
304
+ speech = vocoder(spectrogram)
305
+ speech = model.generate_speech(inputs["input_ids"], speaker_embeddings, vocoder=vocoder)
306
+ Audio(speech, rate=16000)
307