Spaces:

gorkemgoknar
/

xtts-streaming

Running

App Files Files Community

gorkemgoknar committed on Oct 30, 2023

Commit

ef149f3

1 Parent(s): 613c465

Update app.py

Browse files

Files changed (1) hide show

app.py +58 -4

app.py CHANGED Viewed

@@ -15,6 +15,11 @@ os.environ["COQUI_TOS_AGREED"] = "1"
 # Most users expect text to be their own language, there is checkbox to disable it
 import langid
 import gradio as gr
 from scipy.io.wavfile import write
 from pydub import AudioSegment
@@ -185,9 +190,19 @@ def predict(prompt, language, audio_file_pth, mic_file_path, use_mic, voice_clea
         try:
             t_latent=time.time()
-            gpt_cond_latent, _, speaker_embedding = model.get_conditioning_latents(audio_path=speaker_wav)
             latent_calculation_time = time.time() - t_latent
             ##metrics_text=f"Embedding calculation time: {latent_calculation_time:.2f} seconds\n"
@@ -230,12 +245,51 @@ def predict(prompt, language, audio_file_pth, mic_file_path, use_mic, voice_clea
                     DEVICE_ASSERT_PROMPT=prompt
                     DEVICE_ASSERT_LANG=language
                 # HF Space specific.. This error is unrecoverable need to restart space
                 api.restart_space(repo_id=repo_id)
             else:
                 print("RuntimeError: non device-side assert error:", str(e))
-                raise e
         wav = torch.cat(wav_chunks, dim=0)
         torchaudio.save("output.wav", wav.squeeze().unsqueeze(0).cpu(), 24000)

 # Most users expect text to be their own language, there is checkbox to disable it
 import langid
+import base64
+import csv
+from io import StringIO
+import datetime
 import gradio as gr
 from scipy.io.wavfile import write
 from pydub import AudioSegment
         try:
             t_latent=time.time()
+            try:
+                gpt_cond_latent, _, speaker_embedding = model.get_conditioning_latents(audio_path=speaker_wav)
+            except Exception as e:
+                if "Failed to decode" in str(e):
+                    print("Speaker encoding error", str(e))
+                    gr.Warning("It appears something wrong with reference, did you unmute your microphone?")
+                    return (
+                        None,
+                        None,
+                        None,
+                        None,
+                    )
             latent_calculation_time = time.time() - t_latent
             ##metrics_text=f"Embedding calculation time: {latent_calculation_time:.2f} seconds\n"
                     DEVICE_ASSERT_PROMPT=prompt
                     DEVICE_ASSERT_LANG=language
+                # just before restarting save what caused the issue so we can handle it in future
+                # Error data is uploaded only for unrecoverable errors
+                error_time = datetime.datetime.now().strftime('%d-%m-%Y-%H:%M:%S')
+                error_data = [error_time, prompt, language, audio_file_pth, mic_file_path, use_mic, voice_cleanup, no_lang_auto_detect, agree]
+                error_data = [str(e) if type(e)!=str else e for e in error_data]
+                print(error_data)
+                print(speaker_wav)
+                write_io = StringIO()
+                csv.writer(write_io).writerows(error_data)
+                csv_upload= write_io.getvalue().encode()
+                filename =  error_time+"_xtts-stream_" + str(uuid.uuid4()) +".csv"
+                print("Writing error csv")
+                error_api = HfApi()
+                error_api.upload_file(
+                    path_or_fileobj=csv_upload,
+                    path_in_repo=filename,
+                    repo_id="coqui/xtts-flagged-dataset",
+                    repo_type="dataset",
+                )
+                #speaker_wav
+                print("Writing error reference audio")
+                speaker_filename =  error_time+"_reference_xtts-stream_"+ str(uuid.uuid4()) +".wav"
+                error_api = HfApi()
+                error_api.upload_file(
+                    path_or_fileobj=speaker_wav,
+                    path_in_repo=speaker_filename,
+                    repo_id="coqui/xtts-flagged-dataset",
+                    repo_type="dataset",
+                )
                 # HF Space specific.. This error is unrecoverable need to restart space
                 api.restart_space(repo_id=repo_id)
             else:
                 print("RuntimeError: non device-side assert error:", str(e))
+                gr.Warning("Something unexpected happened please retry again.")
+                return (
+                        None,
+                        None,
+                        None,
+                        None,
+                    )
         wav = torch.cat(wav_chunks, dim=0)
         torchaudio.save("output.wav", wav.squeeze().unsqueeze(0).cpu(), 24000)