Spaces:

projecte-aina
/

transcripcio-fonetica-catala

Running

App Files Files Community

ccoreilly committed on Apr 29, 2023

Commit

7f0cc16

•

1 Parent(s): 89cf23f

Add gradio app

Browse files

Files changed (3) hide show

Dockerfile +7 -1
app.py +77 -0
requirements.txt +2 -0

Dockerfile CHANGED Viewed

@@ -10,5 +10,11 @@ RUN cd espeak-ng && \
  make && \
  make install
-RUN espeak-ng "Bon dia" --ipa -v ca -q

  make && \
  make install
+# Install dependencies before copying the app so that editing app.py does
+# not invalidate the cached dependency layer.
+COPY requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+COPY app.py .
+EXPOSE 7860
+# Exec form: python runs as PID 1 and receives stop signals directly.
+CMD ["python", "app.py"]

app.py ADDED Viewed

	@@ -0,0 +1,77 @@

+import tempfile
+from typing import Optional
+from TTS.config import load_config
+import gradio as gr
+import numpy as np
+import os
+import json
+from TTS.utils.manage import ModelManager
+from TTS.utils.synthesizer import Synthesizer
+# Maximum number of input characters tts() keeps; longer text is truncated.
+MAX_TXT_LEN = 100
+# Speaker aliases offered in the UI dropdown; tts() translates the chosen
+# alias through speaker_map.json before synthesis.
+SPEAKERS = ['f_cen_05', 'f_cen_81', 'f_occ_31', 'f_occ_de', 'f_sep_31', 'm_cen_08', 'm_occ_44', 'm_val_89']
+def tts(text, speaker_idx):
+    if len(text) > MAX_TXT_LEN:
+        text = text[:MAX_TXT_LEN]
+        print(f"Input text was cutoff since it went over the {MAX_TXT_LEN} character limit.")
+    print(text)
+    model_path = os.getcwd() + "/best_model.pth"
+    config_path = os.getcwd() + "/config.json"
+    speakers_file_path = os.getcwd() + "/speakers.pth"
+    speakers_maping_path = os.getcwd() + "/speaker_map.json"
+    vocoder_path = None
+    vocoder_config_path = None
+    synthesizer = Synthesizer(
+        model_path, config_path, speakers_file_path, None, vocoder_path, vocoder_config_path,
+    )
+    # Map speaker aliases to speaker ids
+    with open(speakers_maping_path, 'r') as fp:
+        maping = json.load(fp)
+    speaker_idx = maping[speaker_idx]
+    # synthesize
+    if synthesizer is None:
+        raise NameError("model not found")
+    wavs = synthesizer.tts(text, speaker_idx)
+    # return output
+    with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
+        synthesizer.save_wav(wavs, fp)
+        return fp.name
+# User-facing usage instructions (Catalan), passed to the interface below as
+# its description.
+description="""
+1️⃣ Introdueix el text a sintetitzar.
+2️⃣ Selecciona una veu en el desplegable.
+3️⃣ Gaudeix!
+"""
+# Empty article text passed to the interface below.
+article= ""
+# Gradio interface wiring: a text box and a speaker dropdown are the inputs
+# of tts(), whose returned file path is exposed as an audio output.
+iface = gr.Interface(
+    fn=tts,
+    inputs=[
+        gr.inputs.Textbox(
+            label="Text",
+            default="L'Èlia i l'Alí a l'aula.  L'oli i l'ou.  Lulú olorava la lila.",
+        ),
+        # NOTE(review): default=None presumably leaves no speaker preselected,
+        # in which case tts() would receive None as speaker_idx -- confirm.
+        gr.inputs.Dropdown(label="Selecciona un parlant", choices=SPEAKERS, default=None)
+    ],
+    outputs=gr.outputs.Audio(label="Output",type="filepath"),
+    title="🗣️ TTS Català Multi Parlant - VITS 🗣️",
+    theme="grass",
+    description=description,
+    article=article,
+    # NOTE(review): flagging is set to "never" here, so the flagging_options
+    # below look unused -- confirm before relying on them.
+    allow_flagging="never",
+    flagging_options=['error', 'bad-quality', 'wrong-pronounciation'],
+    layout="vertical",
+    live=False
+)
+# Start the web app when this module is executed; share=False requests no
+# public share link.
+iface.launch(share=False)

requirements.txt ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ git+https://github.com/coqui-ai/TTS@dev#egg=TTS
2	+ gradio