TTS-Spaces-Arena

Running

Pendrokar committed 20 days ago

Commit

d3e9225

•

1 Parent(s): b4395a0

added styletts space

Files changed (2) hide show

app.py CHANGED Viewed

@@ -100,7 +100,9 @@ AVAILABLE_MODELS = {
     'innoai/Edge-TTS-Text-to-Speech': 'innoai/Edge-TTS-Text-to-Speech', # 4.29
     # IMS-Toucan
-    'Flux9665/MassivelyMultilingualTTS': 'Flux9665/MassivelyMultilingualTTS', # 5.1
     # HF TTS w issues
     'LeeSangHoon/HierSpeech_TTS': 'LeeSangHoon/HierSpeech_TTS', # irresponsive to exclamation marks # 4.29
@@ -251,7 +253,17 @@ HF_SPACES = {
         'text_param_index': 0,
         'return_audio_index': 0,
         'series': 'IMS-Toucan',
-    }
     # TTS w issues
     # 'PolyAI/pheme': '/predict#0', #sleepy HF Space
@@ -375,6 +387,12 @@ OVERRIDE_INPUTS = {
 		6: None, #reference_audio
     },
 }
 hf_clients: Tuple[Client] = {}

     'innoai/Edge-TTS-Text-to-Speech': 'innoai/Edge-TTS-Text-to-Speech', # 4.29
     # IMS-Toucan
+    # StyleTTS v2
+    'Pendrokar/style-tts-2': 'Pendrokar/style-tts-2',
     # HF TTS w issues
     'LeeSangHoon/HierSpeech_TTS': 'LeeSangHoon/HierSpeech_TTS', # irresponsive to exclamation marks # 4.29
         'text_param_index': 0,
         'return_audio_index': 0,
         'series': 'IMS-Toucan',
+    },
+    # StyleTTS v2
+    'Pendrokar/style-tts-2': {
+        'name': 'StyleTTS v2',
+        'function': '/synthesize',
+        'text_param_index': 0,
+        'return_audio_index': 0,
+        'is_zero_gpu_space': True,
+        'series': 'StyleTTS',
+    },
     # TTS w issues
     # 'PolyAI/pheme': '/predict#0', #sleepy HF Space
 		6: None, #reference_audio
     },
+    # StyleTTS v2
+    'Pendrokar/style-tts-2': {
+		1: "f-us-1", #voice
+		2: 8, # lngsteps
+    },
 }
 hf_clients: Tuple[Client] = {}

test_tts_styletts.py ADDED Viewed

+import os
+from gradio_client import Client, file
+client = Client("Pendrokar/style-tts-2", hf_token=os.getenv('HF_TOKEN'))
+endpoints = client.view_api(all_endpoints=True, print_info=False, return_format='dict')
+# print(endpoints)
+result = client.predict(
+		text="Hello!!",
+		voice="f-us-1", # voice
+		lngsteps=8, # lngsteps
+		api_name="/synthesize" # api_name
+)