TTS-Spaces-Arena

Running

Pendrokar committed 5 days ago

Commit

390ef0c

•

1 Parent(s): a4649b3

F5 TTS API fixed

Files changed (2) hide show

app.py CHANGED Viewed

@@ -251,8 +251,8 @@ HF_SPACES = {
     # E2/F5 TTS
     'mrfakename/E2-F5-TTS': {
-        'name': 'F5 of E2 TTS',
-        'function': '/infer',
         'text_param_index': 2,
         'return_audio_index': 0,
         'is_zero_gpu_space': True,
@@ -298,7 +298,7 @@ HF_SPACES = {
         'series': 'StyleTTS',
     },
-    # StyleTTS v2 kokoro fine tune
     'amphion/maskgct': {
         'name': 'MaskGCT',
         'function': '/predict',
@@ -424,10 +424,9 @@ OVERRIDE_INPUTS = {
     'mrfakename/E2-F5-TTS': {
 		0: DEFAULT_VOICE_SAMPLE, # voice sample
 		1: DEFAULT_VOICE_TRANSCRIPT, # transcript of sample (< 15 seconds required)
-		3: "F5-TTS", # model
-		4: False, # cleanup silence
-        5: 0.15, #crossfade
-        6: 1, #speed
     },
     # IMS-Toucan

     # E2/F5 TTS
     'mrfakename/E2-F5-TTS': {
+        'name': 'F5 TTS',
+        'function': '/basic_tts',
         'text_param_index': 2,
         'return_audio_index': 0,
         'is_zero_gpu_space': True,
         'series': 'StyleTTS',
     },
+    # MaskGCT (by Amphion)
     'amphion/maskgct': {
         'name': 'MaskGCT',
         'function': '/predict',
     'mrfakename/E2-F5-TTS': {
 		0: DEFAULT_VOICE_SAMPLE, # voice sample
 		1: DEFAULT_VOICE_TRANSCRIPT, # transcript of sample (< 15 seconds required)
+		3: False, # cleanup silence
+        4: 0.15, #crossfade
+        5: 1, #speed
     },
     # IMS-Toucan

test_tts_e2_f5_f5.py CHANGED Viewed

@@ -3,12 +3,12 @@ from gradio_client import Client, handle_file
 client = Client("mrfakename/E2-F5-TTS", hf_token=os.getenv('HF_TOKEN'))
 endpoints = client.view_api(all_endpoints=True, print_info=False, return_format='dict')
-print(endpoints)
 result = client.predict(
-		ref_audio_orig=handle_file('https://cdn-uploads.huggingface.co/production/uploads/63d52e0c4e5642795617f668/V6-rMmI-P59DA4leWDIcK.wav'),
-		ref_text="The Hispaniola was rolling scuppers under in the ocean swell. The booms were tearing at the blocks, the rudder was banging to and fro, and the whole ship creaking, groaning, and jumping like a manufactory.",
-		gen_text="Please surprise me and speak in whatever voice you enjoy.",
-		exp_name="F5-TTS",
 		remove_silence=False,
-		api_name="/infer",
 )

 client = Client("mrfakename/E2-F5-TTS", hf_token=os.getenv('HF_TOKEN'))
 endpoints = client.view_api(all_endpoints=True, print_info=False, return_format='dict')
 result = client.predict(
+		ref_audio_input=handle_file('https://cdn-uploads.huggingface.co/production/uploads/63d52e0c4e5642795617f668/V6-rMmI-P59DA4leWDIcK.wav'),
+		ref_text_input="The Hispaniola was rolling scuppers under in the ocean swell. The booms were tearing at the blocks, the rudder was banging to and fro, and the whole ship creaking, groaning, and jumping like a manufactory.",
+		gen_text_input="Please surprise me and speak in whatever voice you enjoy.",
 		remove_silence=False,
+		cross_fade_duration_slider=0.15,
+		speed_slider=1,
+		api_name="/basic_tts",
 )