github-actions[bot] committed on
Commit
9ae4486
·
1 Parent(s): 6b39985

Sync with https://github.com/mozilla-ai/document-to-podcast

Browse files
Files changed (1) hide show
  1. app.py +6 -5
app.py CHANGED
@@ -6,13 +6,13 @@ from pathlib import Path
6
  import soundfile as sf
7
  import streamlit as st
8
 
 
9
  from document_to_podcast.preprocessing import DATA_LOADERS, DATA_CLEANERS
10
  from document_to_podcast.inference.model_loaders import (
11
  load_llama_cpp_model,
12
- load_outetts_model,
13
  )
14
  from document_to_podcast.config import DEFAULT_PROMPT, DEFAULT_SPEAKERS, Speaker
15
- from document_to_podcast.inference.text_to_speech import text_to_speech
16
  from document_to_podcast.inference.text_to_text import text_to_text_stream
17
  from document_to_podcast.utils import stack_audio_segments
18
 
@@ -26,7 +26,7 @@ def load_text_to_text_model():
26
 
27
  @st.cache_resource
28
  def load_text_to_speech_model():
29
- return load_outetts_model("OuteAI/OuteTTS-0.2-500M-GGUF/OuteTTS-0.2-500M-FP16.gguf")
30
 
31
 
32
  script = "script"
@@ -167,7 +167,8 @@ if "clean_text" in st.session_state:
167
  speech_model,
168
  voice_profile,
169
  )
170
- st.audio(speech, sample_rate=speech_model.audio_codec.sr)
 
171
  st.session_state.audio.append(speech)
172
  text = ""
173
 
@@ -179,7 +180,7 @@ if "clean_text" in st.session_state:
179
  sf.write(
180
  "podcast.wav",
181
  st.session_state.audio,
182
- samplerate=speech_model.audio_codec.sr,
183
  )
184
  st.markdown("Podcast saved to disk!")
185
 
 
6
  import soundfile as sf
7
  import streamlit as st
8
 
9
+ from document_to_podcast.inference.text_to_speech import text_to_speech
10
  from document_to_podcast.preprocessing import DATA_LOADERS, DATA_CLEANERS
11
  from document_to_podcast.inference.model_loaders import (
12
  load_llama_cpp_model,
13
+ load_tts_model,
14
  )
15
  from document_to_podcast.config import DEFAULT_PROMPT, DEFAULT_SPEAKERS, Speaker
 
16
  from document_to_podcast.inference.text_to_text import text_to_text_stream
17
  from document_to_podcast.utils import stack_audio_segments
18
 
 
26
 
27
  @st.cache_resource
28
  def load_text_to_speech_model():
29
+ return load_tts_model("OuteAI/OuteTTS-0.2-500M-GGUF/OuteTTS-0.2-500M-FP16.gguf")
30
 
31
 
32
  script = "script"
 
167
  speech_model,
168
  voice_profile,
169
  )
170
+ st.audio(speech, sample_rate=speech_model.sample_rate)
171
+
172
  st.session_state.audio.append(speech)
173
  text = ""
174
 
 
180
  sf.write(
181
  "podcast.wav",
182
  st.session_state.audio,
183
+ samplerate=speech_model.sample_rate,
184
  )
185
  st.markdown("Podcast saved to disk!")
186