TTS-Spaces-Arena

Running

App Files Files Community

Pendrokar committed on Oct 19, 2024

Commit

6fd6025

1 Parent(s): 57ec188

New TTS: IMS-Toucan

Browse files

Files changed (2) hide show

app.py +30 -7
test_tts_ims-toucan.py +16 -0

app.py CHANGED Viewed

@@ -74,29 +74,32 @@ AVAILABLE_MODELS = {
     # HF Gradio Spaces: # <works with gradio version #>
     # gradio version that works with most spaces: 4.29
-    'coqui/xtts': 'coqui/xtts', # 4.29 4.32
-    'collabora/WhisperSpeech': 'collabora/WhisperSpeech', # 4.32 4.36.1
     # 'myshell-ai/OpenVoice': 'myshell-ai/OpenVoice', # same devs as MeloTTS, which scores higher # 4.29
     # 'myshell-ai/OpenVoiceV2': 'myshell-ai/OpenVoiceV2', # same devs as MeloTTS, which scores higher # 4.29
-    'mrfakename/MetaVoice-1B-v0.1': 'mrfakename/MetaVoice-1B-v0.1', # 4.29 4.32
     'Pendrokar/xVASynth-TTS': 'Pendrokar/xVASynth-TTS', # 4.29 4.32 4.42.0
     # 'coqui/CoquiTTS': 'coqui/CoquiTTS',
-    'mrfakename/MeloTTS': 'mrfakename/MeloTTS', # 4.29 4.32
-    'fishaudio/fish-speech-1': 'fishaudio/fish-speech-1', # 4.29 4.32 4.36.1
     # E2 & F5 TTS
     # F5 model
-    'mrfakename/E2-F5-TTS': 'mrfakename/E2-F5-TTS', # 5.0
     # # Parler
     # Parler Large model
-    'parler-tts/parler_tts': 'parler-tts/parler_tts', # 4.29 4.32 4.36.1 4.42.0
     # Parler Mini model
     # 'parler-tts/parler_tts': 'parler-tts/parler_tts', # 4.29 4.32 4.36.1 4.42.0
     # 'parler-tts/parler_tts_mini': 'parler-tts/parler_tts_mini', # Mini is the default model of parler_tts
     # 'parler-tts/parler-tts-expresso': 'parler-tts/parler-tts-expresso', # 4.29 4.32 4.36.1 4.42.0
     # # Microsoft Edge TTS
     'innoai/Edge-TTS-Text-to-Speech': 'innoai/Edge-TTS-Text-to-Speech', # 4.29
     # HF TTS w issues
@@ -241,6 +244,15 @@ HF_SPACES = {
         'series': 'E2/F5 TTS',
     },
     # TTS w issues
     # 'PolyAI/pheme': '/predict#0', #sleepy HF Space
     # 'amphion/Text-to-Speech': '/predict#0', #takes a whole minute to synthesize
@@ -352,6 +364,17 @@ OVERRIDE_INPUTS = {
 		3: "F5-TTS", # model
 		4: False, # cleanup silence
     },
 }
 hf_clients: Tuple[Client] = {}

     # HF Gradio Spaces: # <works with gradio version #>
     # gradio version that works with most spaces: 4.29
+    # 'coqui/xtts': 'coqui/xtts', # 4.29 4.32
+    # 'collabora/WhisperSpeech': 'collabora/WhisperSpeech', # 4.32 4.36.1
     # 'myshell-ai/OpenVoice': 'myshell-ai/OpenVoice', # same devs as MeloTTS, which scores higher # 4.29
     # 'myshell-ai/OpenVoiceV2': 'myshell-ai/OpenVoiceV2', # same devs as MeloTTS, which scores higher # 4.29
+    # 'mrfakename/MetaVoice-1B-v0.1': 'mrfakename/MetaVoice-1B-v0.1', # 4.29 4.32
     'Pendrokar/xVASynth-TTS': 'Pendrokar/xVASynth-TTS', # 4.29 4.32 4.42.0
     # 'coqui/CoquiTTS': 'coqui/CoquiTTS',
+    # 'mrfakename/MeloTTS': 'mrfakename/MeloTTS', # 4.29 4.32
+    # 'fishaudio/fish-speech-1': 'fishaudio/fish-speech-1', # 4.29 4.32 4.36.1
     # E2 & F5 TTS
     # F5 model
+    # 'mrfakename/E2-F5-TTS': 'mrfakename/E2-F5-TTS', # 5.0
     # # Parler
     # Parler Large model
+    # 'parler-tts/parler_tts': 'parler-tts/parler_tts', # 4.29 4.32 4.36.1 4.42.0
     # Parler Mini model
     # 'parler-tts/parler_tts': 'parler-tts/parler_tts', # 4.29 4.32 4.36.1 4.42.0
     # 'parler-tts/parler_tts_mini': 'parler-tts/parler_tts_mini', # Mini is the default model of parler_tts
     # 'parler-tts/parler-tts-expresso': 'parler-tts/parler-tts-expresso', # 4.29 4.32 4.36.1 4.42.0
     # # Microsoft Edge TTS
+    # 'innoai/Edge-TTS-Text-to-Speech': 'innoai/Edge-TTS-Text-to-Speech', # 4.29
+    # IMS-Toucan
     'innoai/Edge-TTS-Text-to-Speech': 'innoai/Edge-TTS-Text-to-Speech', # 4.29
     # HF TTS w issues
         'series': 'E2/F5 TTS',
     },
+    # IMS-Toucan
+    'Flux9665/MassivelyMultilingualTTS': {
+        'name': 'IMS-Toucan',
+		'function': "/predict",
+        'text_param_index': 0,
+        'return_audio_index': 0,
+        'series': 'IMS-Toucan',
+    }
     # TTS w issues
     # 'PolyAI/pheme': '/predict#0', #sleepy HF Space
     # 'amphion/Text-to-Speech': '/predict#0', #takes a whole minute to synthesize
 		3: "F5-TTS", # model
 		4: False, # cleanup silence
     },
+    # IMS-Toucan
+    'Flux9665/MassivelyMultilingualTTS': {
+		1: "English (eng)", #language
+		2: 0.6, #prosody_creativity
+		3: 1, #duration_scaling_factor
+		4: 41, #voice_seed
+		5: -7.5, #emb1
+		6: None, #reference_audio
+    }
 }
 hf_clients: Tuple[Client] = {}

test_tts_ims-toucan.py ADDED Viewed

	@@ -0,0 +1,16 @@

+import os  # only used to read the HF_TOKEN environment variable
+from gradio_client import Client
+client = Client("Flux9665/MassivelyMultilingualTTS", hf_token=os.getenv('HF_TOKEN'))  # os.getenv yields None when HF_TOKEN is unset
+endpoints = client.view_api(all_endpoints=True, print_info=False, return_format='dict')  # ask for the endpoint description as a dict instead of printing it
+# print(endpoints)
+result = client.predict(  # manual smoke call; `result` is not inspected in the lines shown here
+		prompt="What I cannot create, I do not understand.",
+		language="English (eng)",  # same value as app.py's OVERRIDE_INPUTS entry for this Space
+		prosody_creativity=0.5,  # NOTE(review): app.py's OVERRIDE_INPUTS uses 0.6 here
+		duration_scaling_factor=1,
+		voice_seed=27,  # NOTE(review): app.py's OVERRIDE_INPUTS uses 41 here
+		emb1=-7.5,
+		reference_audio=None,
+		api_name="/predict"  # same endpoint name as the 'function' value in app.py's HF_SPACES entry
+)