TTS-Spaces-Arena

Running on Zero

Pendrokar committed about 15 hours ago

Commit

4a483c5

1 Parent(s): 2e21b3e

new tts: MARS6

Files changed (2) hide show

app/models.py CHANGED Viewed

@@ -78,6 +78,12 @@ AVAILABLE_MODELS = {
     # llasa 3b TTS
     'srinivasbilla/llasa-3b-tts': 'srinivasbilla/llasa-3b-tts',
     # HF TTS w issues
     # 'LeeSangHoon/HierSpeech_TTS': 'LeeSangHoon/HierSpeech_TTS', # irresponsive to exclamation marks # 4.29
     # 'PolyAI/pheme': '/predict#0', # sleepy HF Space
@@ -363,6 +369,17 @@ HF_SPACES = {
         'series': 'llasa 3b',
         # 'emoji': '🥵', # requires 300s reserved ZeroGPU!
     },
 }
 # for zero-shot TTS - voice sample used by XTTS (11 seconds)
@@ -569,6 +586,17 @@ OVERRIDE_INPUTS = {
     'srinivasbilla/llasa-3b-tts': {
 		'sample_audio_path': handle_file('voice_samples/EN_B00004_S00051_W000213.mp3')
     },
 }

     # llasa 3b TTS
     'srinivasbilla/llasa-3b-tts': 'srinivasbilla/llasa-3b-tts',
+    # Mars5
+    # 'CAMB-AI/mars6-turbo-demo': 'CAMB-AI/mars6-turbo-demo',
+    # Mars6
+    # 'CAMB-AI/mars6-turbo-demo': 'CAMB-AI/mars6-turbo-demo',
     # HF TTS w issues
     # 'LeeSangHoon/HierSpeech_TTS': 'LeeSangHoon/HierSpeech_TTS', # irresponsive to exclamation marks # 4.29
     # 'PolyAI/pheme': '/predict#0', # sleepy HF Space
         'series': 'llasa 3b',
         # 'emoji': '🥵', # requires 300s reserved ZeroGPU!
     },
+    # Mars6
+    'CAMB-AI/mars6-turbo-demo': {
+        'name': 'MARS 6',
+        'function': '/inference',
+        'text_param_index': 'text',
+        'return_audio_index': 0,
+        'is_zero_gpu_space': False,
+        'is_closed_source': True,
+        'series': 'llasa 3b',
+    },
 }
 # for zero-shot TTS - voice sample used by XTTS (11 seconds)
     'srinivasbilla/llasa-3b-tts': {
 		'sample_audio_path': handle_file('voice_samples/EN_B00004_S00051_W000213.mp3')
     },
+    # MARS 6
+    'CAMB-AI/mars6-turbo-demo': {
+        'reference_audio': DEFAULT_VOICE_SAMPLE,
+		'reference_text': DEFAULT_VOICE_TRANSCRIPT,
+		'ras_K': 10,
+		'ras_t_r': 0.09,
+		'top_p': 0.2,
+		'quality_prefix': "48000",
+		'clone_method': "deep-clone",
+    },
 }

test_tts_mars6.py ADDED Viewed

+import os
+from test_overrides import _get_param_examples, _override_params
+from gradio_client import Client, file
+model = "CAMB-AI/mars6-turbo-demo"
+client = Client(model, hf_token=os.getenv('HF_TOKEN'))
+endpoints = client.view_api(all_endpoints=True, print_info=False, return_format='dict')
+# print(endpoints)
+api_name = '/inference'
+fn_index = None
+end_parameters = None
+text = 'This is what my voice sounds like.'
+end_parameters = _get_param_examples(
+	endpoints['named_endpoints'][api_name]['parameters']
+)
+print(end_parameters)
+space_inputs = end_parameters
+# override some or all default parameters
+space_inputs = _override_params(end_parameters, model)
+if(type(space_inputs) == dict):
+	space_inputs['text'] = text
+	result = client.predict(
+		**space_inputs,
+		api_name=api_name,
+		fn_index=fn_index
+	)
+else:
+	space_inputs[0] = text
+	result = client.predict(
+		*space_inputs,
+		api_name=api_name,
+		fn_index=fn_index
+	)
+	# space_inputs = {str(i): value for i, value in enumerate(space_inputs)}
+print(space_inputs)
+# print(*space_inputs)
+# print(**space_inputs)
+# result = client.predict(
+# 	**space_inputs,
+# 	api_name=api_name,
+#     fn_index=fn_index
+# )
+print(result)