NeuralFalcon committed on
Commit
6789f9b
·
verified ·
1 Parent(s): b83c472

Update KOKORO/utils.py

Browse files
Files changed (1) hide show
  1. KOKORO/utils.py +12 -2
KOKORO/utils.py CHANGED
@@ -274,8 +274,10 @@ def podcast(MODEL, device, gen_text, speed=1.0, trim=0.5, pad_between_segments=0
274
  output_file = remove_silence_function(output_file, minimum_silence=minimum_silence)
275
 
276
  return output_file
277
-
 
278
  def tts(MODEL,device,text, voice_name, speed=1.0, trim=0.5, pad_between_segments=0.5, output_file="",remove_silence=True,minimum_silence=50):
 
279
  language = voice_name[0]
280
  voice_pack_path = f"./KOKORO/voices/{voice_name}.pt"
281
  if voice_name.endswith(".pt"):
@@ -283,7 +285,14 @@ def tts(MODEL,device,text, voice_name, speed=1.0, trim=0.5, pad_between_segments
283
  voice_pack_path=voice_name
284
  text=clean_text(text)
285
  segments = large_text(text, language)
286
- VOICEPACK = torch.load(voice_pack_path, weights_only=True).to(device)
 
 
 
 
 
 
 
287
  speed = clamp_speed(speed)
288
  trim = clamp_trim(trim)
289
  silence_duration = clamp_trim(pad_between_segments)
@@ -343,3 +352,4 @@ def tts_file_name(text):
343
  # Construct the file name
344
  file_name = f"{temp_folder}/{truncated_text}_{random_string}.wav"
345
  return file_name
 
 
274
  output_file = remove_silence_function(output_file, minimum_silence=minimum_silence)
275
 
276
  return output_file
277
+ old_voice_pack_path=""
278
+ old_VOICEPACK=None
279
  def tts(MODEL,device,text, voice_name, speed=1.0, trim=0.5, pad_between_segments=0.5, output_file="",remove_silence=True,minimum_silence=50):
280
+ global old_voice_pack_path,old_VOICEPACK
281
  language = voice_name[0]
282
  voice_pack_path = f"./KOKORO/voices/{voice_name}.pt"
283
  if voice_name.endswith(".pt"):
 
285
  voice_pack_path=voice_name
286
  text=clean_text(text)
287
  segments = large_text(text, language)
288
+ if (old_voice_pack_path!=voice_pack_path)or ("weighted_normalised_voices.pt" in voice_pack_path):
289
+ VOICEPACK = torch.load(voice_pack_path, weights_only=True).to(device)
290
+ old_voice_pack_path=voice_pack_path
291
+ old_VOICEPACK=VOICEPACK
292
+ # print("Loaded new voice pack")
293
+ else:
294
+ VOICEPACK=old_VOICEPACK
295
+ # print("Using old voice pack")
296
  speed = clamp_speed(speed)
297
  trim = clamp_trim(trim)
298
  silence_duration = clamp_trim(pad_between_segments)
 
352
  # Construct the file name
353
  file_name = f"{temp_folder}/{truncated_text}_{random_string}.wav"
354
  return file_name
355
+