Spaces:

mozilla-ai
/

document-to-podcast

Runtime error

github-actions[bot] committed on 24 days ago

Commit

9ae4486

1 Parent(s): 6b39985

Sync with https://github.com/mozilla-ai/document-to-podcast

Files changed (1) hide show

app.py CHANGED Viewed

@@ -6,13 +6,13 @@ from pathlib import Path
 import soundfile as sf
 import streamlit as st
 from document_to_podcast.preprocessing import DATA_LOADERS, DATA_CLEANERS
 from document_to_podcast.inference.model_loaders import (
     load_llama_cpp_model,
-    load_outetts_model,
 )
 from document_to_podcast.config import DEFAULT_PROMPT, DEFAULT_SPEAKERS, Speaker
-from document_to_podcast.inference.text_to_speech import text_to_speech
 from document_to_podcast.inference.text_to_text import text_to_text_stream
 from document_to_podcast.utils import stack_audio_segments
@@ -26,7 +26,7 @@ def load_text_to_text_model():
 @st.cache_resource
 def load_text_to_speech_model():
-    return load_outetts_model("OuteAI/OuteTTS-0.2-500M-GGUF/OuteTTS-0.2-500M-FP16.gguf")
 script = "script"
@@ -167,7 +167,8 @@ if "clean_text" in st.session_state:
                             speech_model,
                             voice_profile,
                         )
-                    st.audio(speech, sample_rate=speech_model.audio_codec.sr)
                     st.session_state.audio.append(speech)
                     text = ""
@@ -179,7 +180,7 @@ if "clean_text" in st.session_state:
             sf.write(
                 "podcast.wav",
                 st.session_state.audio,
-                samplerate=speech_model.audio_codec.sr,
             )
             st.markdown("Podcast saved to disk!")

 import soundfile as sf
 import streamlit as st
+from document_to_podcast.inference.text_to_speech import text_to_speech
 from document_to_podcast.preprocessing import DATA_LOADERS, DATA_CLEANERS
 from document_to_podcast.inference.model_loaders import (
     load_llama_cpp_model,
+    load_tts_model,
 )
 from document_to_podcast.config import DEFAULT_PROMPT, DEFAULT_SPEAKERS, Speaker
 from document_to_podcast.inference.text_to_text import text_to_text_stream
 from document_to_podcast.utils import stack_audio_segments
 @st.cache_resource
 def load_text_to_speech_model():
+    return load_tts_model("OuteAI/OuteTTS-0.2-500M-GGUF/OuteTTS-0.2-500M-FP16.gguf")
 script = "script"
                             speech_model,
                             voice_profile,
                         )
+                    st.audio(speech, sample_rate=speech_model.sample_rate)
                     st.session_state.audio.append(speech)
                     text = ""
             sf.write(
                 "podcast.wav",
                 st.session_state.audio,
+                samplerate=speech_model.sample_rate,
             )
             st.markdown("Podcast saved to disk!")