Spaces:
Running
Running
OpenVoice TTS disabled in favor of MeloTTS; xVASynth American English model trained and enabled
Browse files
app.py
CHANGED
|
@@ -65,34 +65,35 @@ AVAILABLE_MODELS = {
|
|
| 65 |
# 'VoiceCraft 2.0': 'voicecraft',
|
| 66 |
# 'Parler TTS': 'parler'
|
| 67 |
|
| 68 |
-
# HF Gradio Spaces:
|
| 69 |
-
|
| 70 |
-
|
| 71 |
-
'
|
| 72 |
-
'myshell-ai/
|
| 73 |
-
'
|
| 74 |
-
|
|
|
|
| 75 |
# 'coqui/CoquiTTS': 'coqui/CoquiTTS',
|
| 76 |
-
'
|
| 77 |
-
'
|
| 78 |
-
'fishaudio/fish-speech-1': 'fishaudio/fish-speech-1', # 4.29.0
|
| 79 |
|
| 80 |
-
# Parler
|
| 81 |
-
'parler-tts/parler_tts': 'parler-tts/parler_tts', # 4.29.
|
| 82 |
-
'parler-tts/parler-tts-expresso': 'parler-tts/parler-tts-expresso', # 4.29.
|
| 83 |
|
| 84 |
-
# Microsoft Edge TTS
|
| 85 |
-
'innoai/Edge-TTS-Text-to-Speech': 'innoai/Edge-TTS-Text-to-Speech',
|
| 86 |
|
| 87 |
-
# TTS w issues
|
|
|
|
| 88 |
# 'PolyAI/pheme': '/predict#0', # sleepy HF Space
|
| 89 |
-
# 'amphion/Text-to-Speech': '/predict#0', #
|
| 90 |
# 'suno/bark': '3#0', # Hallucinates
|
| 91 |
# 'shivammehta25/Matcha-TTS': '5#0', # seems to require multiple requests for setup
|
| 92 |
-
# 'styletts2/styletts2': '0#0', # API disabled
|
| 93 |
-
# 'Manmay/tortoise-tts': '/predict#0', # Cannot
|
| 94 |
# 'pytorch/Tacotron2': '0#0', # old gradio
|
| 95 |
-
# 'parler-tts/parler_tts_mini': 'parler-tts/parler_tts_mini', #
|
| 96 |
}
|
| 97 |
|
| 98 |
HF_SPACES = {
|
|
@@ -167,7 +168,7 @@ HF_SPACES = {
|
|
| 167 |
'text_param_index': 0,
|
| 168 |
'return_audio_index': 0,
|
| 169 |
},
|
| 170 |
-
# Parler
|
| 171 |
'parler-tts/parler_tts_mini': {
|
| 172 |
'name': 'Parler Mini',
|
| 173 |
'function': '/gen_tts',
|
|
@@ -229,11 +230,11 @@ OVERRIDE_INPUTS = {
|
|
| 229 |
},
|
| 230 |
'myshell-ai/OpenVoice': {
|
| 231 |
1: 'default', # style
|
| 232 |
-
2:
|
| 233 |
},
|
| 234 |
'myshell-ai/OpenVoiceV2': {
|
| 235 |
-
1: '
|
| 236 |
-
2:
|
| 237 |
},
|
| 238 |
'PolyAI/pheme': {
|
| 239 |
1: 'YOU1000000044_S0000798', # voice
|
|
@@ -241,7 +242,7 @@ OVERRIDE_INPUTS = {
|
|
| 241 |
3: 0.7, #Tempo - Gradio Slider issue: takes min. rather than value
|
| 242 |
},
|
| 243 |
'Pendrokar/xVASynth-TTS': {
|
| 244 |
-
1: '
|
| 245 |
3: 1.0, #pacing/duration - Gradio Slider issue: takes min. rather than value
|
| 246 |
},
|
| 247 |
'suno/bark': {
|
|
|
|
| 65 |
# 'VoiceCraft 2.0': 'voicecraft',
|
| 66 |
# 'Parler TTS': 'parler'
|
| 67 |
|
| 68 |
+
# HF Gradio Spaces: # <works with gradio version #>
|
| 69 |
+
# gradio version that works with most spaces: 4.29
|
| 70 |
+
'coqui/xtts': 'coqui/xtts', # 4.29 4.32
|
| 71 |
+
'collabora/WhisperSpeech': 'collabora/WhisperSpeech', # 4.32 4.36.1
|
| 72 |
+
# 'myshell-ai/OpenVoice': 'myshell-ai/OpenVoice', # same devs as MeloTTS, which scores higher # 4.29
|
| 73 |
+
# 'myshell-ai/OpenVoiceV2': 'myshell-ai/OpenVoiceV2', # same devs as MeloTTS, which scores higher # 4.29
|
| 74 |
+
'mrfakename/MetaVoice-1B-v0.1': 'mrfakename/MetaVoice-1B-v0.1', # 4.29 4.32
|
| 75 |
+
# 'Pendrokar/xVASynth-TTS': 'Pendrokar/xVASynth-TTS', # EN-GB 4.29 4.32 4.42.0
|
| 76 |
# 'coqui/CoquiTTS': 'coqui/CoquiTTS',
|
| 77 |
+
'mrfakename/MeloTTS': 'mrfakename/MeloTTS', # 4.29 4.32
|
| 78 |
+
'fishaudio/fish-speech-1': 'fishaudio/fish-speech-1', # 4.29 4.32 4.36.1
|
|
|
|
| 79 |
|
| 80 |
+
# # Parler
|
| 81 |
+
'parler-tts/parler_tts': 'parler-tts/parler_tts', # 4.29 4.32 4.36.1 4.42.0
|
| 82 |
+
'parler-tts/parler-tts-expresso': 'parler-tts/parler-tts-expresso', # 4.29 4.32 4.36.1 4.42.0
|
| 83 |
|
| 84 |
+
# # Microsoft Edge TTS
|
| 85 |
+
'innoai/Edge-TTS-Text-to-Speech': 'innoai/Edge-TTS-Text-to-Speech', # 4.29
|
| 86 |
|
| 87 |
+
# HF TTS w issues
|
| 88 |
+
# 'LeeSangHoon/HierSpeech_TTS': 'LeeSangHoon/HierSpeech_TTS', # unresponsive to exclamation marks # 4.29
|
| 89 |
# 'PolyAI/pheme': '/predict#0', # sleepy HF Space
|
| 90 |
+
# 'amphion/Text-to-Speech': '/predict#0', # disabled also on original HF space due to poor ratings
|
| 91 |
# 'suno/bark': '3#0', # Hallucinates
|
| 92 |
# 'shivammehta25/Matcha-TTS': '5#0', # seems to require multiple requests for setup
|
| 93 |
+
# 'styletts2/styletts2': '0#0', # API disabled, awaiting approval of PR #15
|
| 94 |
+
# 'Manmay/tortoise-tts': '/predict#0', # Cannot retrieve streamed file; 403
|
| 95 |
# 'pytorch/Tacotron2': '0#0', # old gradio
|
| 96 |
+
# 'parler-tts/parler_tts_mini': 'parler-tts/parler_tts_mini', # Mini is the default model of parler_tts
|
| 97 |
}
|
| 98 |
|
| 99 |
HF_SPACES = {
|
|
|
|
| 168 |
'text_param_index': 0,
|
| 169 |
'return_audio_index': 0,
|
| 170 |
},
|
| 171 |
+
# Parler Mini
|
| 172 |
'parler-tts/parler_tts_mini': {
|
| 173 |
'name': 'Parler Mini',
|
| 174 |
'function': '/gen_tts',
|
|
|
|
| 230 |
},
|
| 231 |
'myshell-ai/OpenVoice': {
|
| 232 |
1: 'default', # style
|
| 233 |
+
2: 'https://huggingface.co/spaces/myshell-ai/OpenVoiceV2/resolve/main/examples/speaker0.mp3', # voice sample
|
| 234 |
},
|
| 235 |
'myshell-ai/OpenVoiceV2': {
|
| 236 |
+
1: 'en_us', # style
|
| 237 |
+
2: 'https://huggingface.co/spaces/myshell-ai/OpenVoiceV2/resolve/main/examples/speaker0.mp3', # voice sample
|
| 238 |
},
|
| 239 |
'PolyAI/pheme': {
|
| 240 |
1: 'YOU1000000044_S0000798', # voice
|
|
|
|
| 242 |
3: 0.7, #Tempo - Gradio Slider issue: takes min. rather than value
|
| 243 |
},
|
| 244 |
'Pendrokar/xVASynth-TTS': {
|
| 245 |
+
1: 'x_ex04', #fine-tuned voice model name
|
| 246 |
3: 1.0, #pacing/duration - Gradio Slider issue: takes min. rather than value
|
| 247 |
},
|
| 248 |
'suno/bark': {
|