Spaces: Running on Zero
Commit
·
096bc17
1
Parent(s):
8035662
zerogpu update
Browse files
- app.py +4 -1
- kokoro_tts.py +5 -2
- pyproject.toml +1 -0
- requirements.txt +3 -4
app.py
CHANGED
@@ -1,8 +1,11 @@
|
|
1 |
import gradio as gr
|
2 |
import requests
|
3 |
from bs4 import BeautifulSoup
|
4 |
-
import soundfile as sf
|
5 |
from kokoro_tts import generate_audio
|
|
|
|
|
|
|
|
|
6 |
|
7 |
|
8 |
class Voices:
|
|
|
1 |
import gradio as gr
|
2 |
import requests
|
3 |
from bs4 import BeautifulSoup
|
|
|
4 |
from kokoro_tts import generate_audio
|
5 |
+
import logging
|
6 |
+
|
7 |
+
|
8 |
+
logging.basicConfig(level=logging.INFO)
|
9 |
|
10 |
|
11 |
class Voices:
|
kokoro_tts.py
CHANGED
@@ -6,7 +6,7 @@ import logging
|
|
6 |
|
7 |
def generate_audio(
|
8 |
text,
|
9 |
-
lang_code="a",
|
10 |
voice="af_heart",
|
11 |
speed=1,
|
12 |
save_segments=False,
|
@@ -25,7 +25,10 @@ def generate_audio(
|
|
25 |
Returns:
|
26 |
numpy.ndarray: Combined audio data at 24kHz sample rate
|
27 |
"""
|
28 |
-
|
|
|
|
|
|
|
29 |
|
30 |
generator = pipeline(text, voice=voice, speed=speed, split_pattern=r"\.")
|
31 |
|
|
|
6 |
|
7 |
def generate_audio(
|
8 |
text,
|
9 |
+
pipeline=KPipeline(lang_code="a"),
|
10 |
voice="af_heart",
|
11 |
speed=1,
|
12 |
save_segments=False,
|
|
|
25 |
Returns:
|
26 |
numpy.ndarray: Combined audio data at 24kHz sample rate
|
27 |
"""
|
28 |
+
try:
|
29 |
+
pipeline = pipeline.to("cuda")
|
30 |
+
except:
|
31 |
+
logging.warning("CUDA not available, using CPU")
|
32 |
|
33 |
generator = pipeline(text, voice=voice, speed=speed, split_pattern=r"\.")
|
34 |
|
pyproject.toml
CHANGED
@@ -10,4 +10,5 @@ dependencies = [
|
|
10 |
"kokoro>=0.3.4",
|
11 |
"pip>=25.0.1",
|
12 |
"soundfile>=0.13.1",
|
|
|
13 |
]
|
|
|
10 |
"kokoro>=0.3.4",
|
11 |
"pip>=25.0.1",
|
12 |
"soundfile>=0.13.1",
|
13 |
+
"torch==2.4.0",
|
14 |
]
|
requirements.txt
CHANGED
@@ -21,9 +21,7 @@ curated-transformers==0.1.1
|
|
21 |
cymem==2.0.11
|
22 |
dlinfo==2.0.0
|
23 |
docopt==0.6.2
|
24 |
-
en_core_web_sm @ https://github.com/explosion/spacy-models/releases/download/en_core_web_sm-3.8.0/en_core_web_sm-3.8.0-py3-none-any.whl#sha256=1932429db727d4bff3deed6b34cfc05df17794f4a52eeb26cf8928f7c1a0fb85
|
25 |
espeakng-loader==0.2.4
|
26 |
-
exceptiongroup==1.2.2
|
27 |
fastapi==0.115.8
|
28 |
ffmpy==0.5.0
|
29 |
filelock==3.17.0
|
@@ -87,6 +85,7 @@ safetensors==0.5.2
|
|
87 |
scipy==1.15.1
|
88 |
segments==2.2.1
|
89 |
semantic-version==2.10.0
|
|
|
90 |
shellingham==1.5.4
|
91 |
six==1.17.0
|
92 |
smart-open==7.1.0
|
@@ -99,12 +98,12 @@ spacy-legacy==3.0.12
|
|
99 |
spacy-loggers==1.0.5
|
100 |
srsly==2.5.1
|
101 |
starlette==0.45.3
|
102 |
-
sympy==1.13.
|
103 |
tabulate==0.9.0
|
104 |
thinc==8.3.4
|
105 |
tokenizers==0.21.0
|
106 |
tomlkit==0.13.2
|
107 |
-
torch==2.
|
108 |
tqdm==4.67.1
|
109 |
transformers==4.48.3
|
110 |
typer==0.15.1
|
|
|
21 |
cymem==2.0.11
|
22 |
dlinfo==2.0.0
|
23 |
docopt==0.6.2
|
|
|
24 |
espeakng-loader==0.2.4
|
|
|
25 |
fastapi==0.115.8
|
26 |
ffmpy==0.5.0
|
27 |
filelock==3.17.0
|
|
|
85 |
scipy==1.15.1
|
86 |
segments==2.2.1
|
87 |
semantic-version==2.10.0
|
88 |
+
setuptools==75.8.0
|
89 |
shellingham==1.5.4
|
90 |
six==1.17.0
|
91 |
smart-open==7.1.0
|
|
|
98 |
spacy-loggers==1.0.5
|
99 |
srsly==2.5.1
|
100 |
starlette==0.45.3
|
101 |
+
sympy==1.13.3
|
102 |
tabulate==0.9.0
|
103 |
thinc==8.3.4
|
104 |
tokenizers==0.21.0
|
105 |
tomlkit==0.13.2
|
106 |
+
torch==2.4.0
|
107 |
tqdm==4.67.1
|
108 |
transformers==4.48.3
|
109 |
typer==0.15.1
|