Spaces:
Running
Running
NeuralFalcon
committed on
Update KOKORO/utils.py
Browse files
- KOKORO/utils.py +12 -2
KOKORO/utils.py
CHANGED
@@ -274,8 +274,10 @@ def podcast(MODEL, device, gen_text, speed=1.0, trim=0.5, pad_between_segments=0
|
|
274 |
output_file = remove_silence_function(output_file, minimum_silence=minimum_silence)
|
275 |
|
276 |
return output_file
|
277 |
-
|
|
|
278 |
def tts(MODEL,device,text, voice_name, speed=1.0, trim=0.5, pad_between_segments=0.5, output_file="",remove_silence=True,minimum_silence=50):
|
|
|
279 |
language = voice_name[0]
|
280 |
voice_pack_path = f"./KOKORO/voices/{voice_name}.pt"
|
281 |
if voice_name.endswith(".pt"):
|
@@ -283,7 +285,14 @@ def tts(MODEL,device,text, voice_name, speed=1.0, trim=0.5, pad_between_segments
|
|
283 |
voice_pack_path=voice_name
|
284 |
text=clean_text(text)
|
285 |
segments = large_text(text, language)
|
286 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
287 |
speed = clamp_speed(speed)
|
288 |
trim = clamp_trim(trim)
|
289 |
silence_duration = clamp_trim(pad_between_segments)
|
@@ -343,3 +352,4 @@ def tts_file_name(text):
|
|
343 |
# Construct the file name
|
344 |
file_name = f"{temp_folder}/{truncated_text}_{random_string}.wav"
|
345 |
return file_name
|
|
|
|
274 |
output_file = remove_silence_function(output_file, minimum_silence=minimum_silence)
|
275 |
|
276 |
return output_file
|
277 |
+
# Path of the voice pack that tts() loaded most recently. tts() compares the
# requested path against this value to decide whether to call torch.load again
# (paths containing "weighted_normalised_voices.pt" are always reloaded).
old_voice_pack_path=""
|
278 |
+
# Voice pack object most recently loaded by tts(); reused on the next call when
# the requested voice pack path is unchanged. Stays None until the first load.
old_VOICEPACK=None
|
279 |
def tts(MODEL,device,text, voice_name, speed=1.0, trim=0.5, pad_between_segments=0.5, output_file="",remove_silence=True,minimum_silence=50):
|
280 |
+
global old_voice_pack_path,old_VOICEPACK
|
281 |
language = voice_name[0]
|
282 |
voice_pack_path = f"./KOKORO/voices/{voice_name}.pt"
|
283 |
if voice_name.endswith(".pt"):
|
|
|
285 |
voice_pack_path=voice_name
|
286 |
text=clean_text(text)
|
287 |
segments = large_text(text, language)
|
288 |
+
if (old_voice_pack_path!=voice_pack_path)or ("weighted_normalised_voices.pt" in voice_pack_path):
|
289 |
+
VOICEPACK = torch.load(voice_pack_path, weights_only=True).to(device)
|
290 |
+
old_voice_pack_path=voice_pack_path
|
291 |
+
old_VOICEPACK=VOICEPACK
|
292 |
+
# print("Loaded new voice pack")
|
293 |
+
else:
|
294 |
+
VOICEPACK=old_VOICEPACK
|
295 |
+
# print("Using old voice pack")
|
296 |
speed = clamp_speed(speed)
|
297 |
trim = clamp_trim(trim)
|
298 |
silence_duration = clamp_trim(pad_between_segments)
|
|
|
352 |
# Construct the file name
|
353 |
file_name = f"{temp_folder}/{truncated_text}_{random_string}.wav"
|
354 |
return file_name
|
355 |
+
|