Spaces:
Running
on
Zero
Running
on
Zero
TTS added: LLaSA 8B; re-enabled OpenVoice so it can reach ~1000 votes; FS (fish-speech) is broken
Browse files - app/models.py +23 -9
app/models.py
CHANGED
@@ -25,14 +25,14 @@ AVAILABLE_MODELS = {
|
|
25 |
# gradio version that works with most spaces: 4.29
|
26 |
# 'coqui/xtts': 'coqui/xtts', # 4.29 4.32; extra_headers error appears for 5.13
|
27 |
# 'collabora/WhisperSpeech': 'collabora/WhisperSpeech', # 4.32 4.36.1
|
28 |
-
|
29 |
-
|
30 |
# 'mrfakename/MetaVoice-1B-v0.1': 'mrfakename/MetaVoice-1B-v0.1', # 4.29 4.32
|
31 |
'Pendrokar/xVASynth-TTS': 'Pendrokar/xVASynth-TTS', # 4.29 4.32 4.42.0
|
32 |
'Pendrokar/xVASynth-TTS/NoDeepMoji': 'Pendrokar/xVASynth-TTS', # 4.29 4.32 4.42.0
|
33 |
# 'coqui/CoquiTTS': 'coqui/CoquiTTS',
|
34 |
-
|
35 |
-
|
36 |
|
37 |
# E2 & F5 TTS
|
38 |
# F5 model
|
@@ -46,7 +46,7 @@ AVAILABLE_MODELS = {
|
|
46 |
# Parler Mini model
|
47 |
# 'parler-tts/parler_tts': 'parler-tts/parler_tts', # 4.29 4.32 4.36.1 4.42.0
|
48 |
# 'parler-tts/parler_tts_mini': 'parler-tts/parler_tts_mini', # Mini is the default model of parler_tts
|
49 |
-
'parler-tts/parler-tts-expresso': 'parler-tts/parler-tts-expresso', # 4.29 4.32 4.36.1 4.42.0
|
50 |
|
51 |
# # Microsoft Edge TTS
|
52 |
# 'innoai/Edge-TTS-Text-to-Speech': 'innoai/Edge-TTS-Text-to-Speech', # API disabled
|
@@ -55,7 +55,7 @@ AVAILABLE_MODELS = {
|
|
55 |
# 'Flux9665/MassivelyMultilingualTTS': 'Flux9665/MassivelyMultilingualTTS', # 5.1
|
56 |
|
57 |
# StyleTTS v2
|
58 |
-
'Pendrokar/style-tts-2': 'Pendrokar/style-tts-2', # more votes in OG arena; emotionless
|
59 |
|
60 |
# StyleTTS Kokoro v0.19
|
61 |
# 'hexgrad/kokoro': 'hexgrad/Kokoro-TTS',
|
@@ -79,6 +79,8 @@ AVAILABLE_MODELS = {
|
|
79 |
|
80 |
# llasa 3b TTS
|
81 |
'srinivasbilla/llasa-3b-tts': 'srinivasbilla/llasa-3b-tts',
|
|
|
|
|
82 |
|
83 |
# Mars5
|
84 |
# 'CAMB-AI/mars5_space': 'CAMB-AI/mars5_space', # slow inference; Unstable
|
@@ -288,7 +290,7 @@ HF_SPACES = {
|
|
288 |
|
289 |
# StyleTTS Kokoro v0.19
|
290 |
'hexgrad/kokoro': {
|
291 |
-
'name': '
|
292 |
'function': '/generate',
|
293 |
'text_param_index': 'text',
|
294 |
'return_audio_index': 0,
|
@@ -375,8 +377,17 @@ HF_SPACES = {
|
|
375 |
'text_param_index': 'target_text',
|
376 |
'return_audio_index': 0,
|
377 |
'is_zero_gpu_space': True,
|
378 |
-
'series': 'llasa
|
379 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
380 |
},
|
381 |
|
382 |
# Mars5
|
@@ -611,6 +622,9 @@ OVERRIDE_INPUTS = {
|
|
611 |
'srinivasbilla/llasa-3b-tts': {
|
612 |
'sample_audio_path': handle_file('voice_samples/EN_B00004_S00051_W000213.mp3')
|
613 |
},
|
|
|
|
|
|
|
614 |
|
615 |
# MARS 5
|
616 |
'CAMB-AI/mars5_space': {
|
|
|
25 |
# gradio version that works with most spaces: 4.29
|
26 |
# 'coqui/xtts': 'coqui/xtts', # 4.29 4.32; extra_headers error appears for 5.13
|
27 |
# 'collabora/WhisperSpeech': 'collabora/WhisperSpeech', # 4.32 4.36.1
|
28 |
+
'myshell-ai/OpenVoice': 'myshell-ai/OpenVoice', # same devs as MeloTTS, which scores higher # 4.29
|
29 |
+
'myshell-ai/OpenVoiceV2': 'myshell-ai/OpenVoiceV2', # same devs as MeloTTS, which scores higher # 4.29
|
30 |
# 'mrfakename/MetaVoice-1B-v0.1': 'mrfakename/MetaVoice-1B-v0.1', # 4.29 4.32
|
31 |
'Pendrokar/xVASynth-TTS': 'Pendrokar/xVASynth-TTS', # 4.29 4.32 4.42.0
|
32 |
'Pendrokar/xVASynth-TTS/NoDeepMoji': 'Pendrokar/xVASynth-TTS', # 4.29 4.32 4.42.0
|
33 |
# 'coqui/CoquiTTS': 'coqui/CoquiTTS',
|
34 |
+
'mrfakename/MeloTTS': 'mrfakename/MeloTTS', # 4.29 4.32
|
35 |
+
# 'fishaudio/fish-speech-1': 'fishaudio/fish-speech-1', # Queue ERROR
|
36 |
|
37 |
# E2 & F5 TTS
|
38 |
# F5 model
|
|
|
46 |
# Parler Mini model
|
47 |
# 'parler-tts/parler_tts': 'parler-tts/parler_tts', # 4.29 4.32 4.36.1 4.42.0
|
48 |
# 'parler-tts/parler_tts_mini': 'parler-tts/parler_tts_mini', # Mini is the default model of parler_tts
|
49 |
+
# 'parler-tts/parler-tts-expresso': 'parler-tts/parler-tts-expresso', # 4.29 4.32 4.36.1 4.42.0
|
50 |
|
51 |
# # Microsoft Edge TTS
|
52 |
# 'innoai/Edge-TTS-Text-to-Speech': 'innoai/Edge-TTS-Text-to-Speech', # API disabled
|
|
|
55 |
# 'Flux9665/MassivelyMultilingualTTS': 'Flux9665/MassivelyMultilingualTTS', # 5.1
|
56 |
|
57 |
# StyleTTS v2
|
58 |
+
# 'Pendrokar/style-tts-2': 'Pendrokar/style-tts-2', # more votes in OG arena; emotionless
|
59 |
|
60 |
# StyleTTS Kokoro v0.19
|
61 |
# 'hexgrad/kokoro': 'hexgrad/Kokoro-TTS',
|
|
|
79 |
|
80 |
# llasa 3b TTS
|
81 |
'srinivasbilla/llasa-3b-tts': 'srinivasbilla/llasa-3b-tts',
|
82 |
+
# llasa 8b TTS
|
83 |
+
'srinivasbilla/llasa-8b-tts': 'srinivasbilla/llasa-8b-tts',
|
84 |
|
85 |
# Mars5
|
86 |
# 'CAMB-AI/mars5_space': 'CAMB-AI/mars5_space', # slow inference; Unstable
|
|
|
290 |
|
291 |
# StyleTTS Kokoro v0.19
|
292 |
'hexgrad/kokoro': {
|
293 |
+
'name': 'Kokoro v0.19',
|
294 |
'function': '/generate',
|
295 |
'text_param_index': 'text',
|
296 |
'return_audio_index': 0,
|
|
|
377 |
'text_param_index': 'target_text',
|
378 |
'return_audio_index': 0,
|
379 |
'is_zero_gpu_space': True,
|
380 |
+
'series': 'llasa',
|
381 |
+
},
|
382 |
+
|
383 |
+
# LlaSa 8B
|
384 |
+
'srinivasbilla/llasa-8b-tts': {
|
385 |
+
'name': 'LLaSA 8B',
|
386 |
+
'function': '/infer',
|
387 |
+
'text_param_index': 'target_text',
|
388 |
+
'return_audio_index': 0,
|
389 |
+
'is_zero_gpu_space': True,
|
390 |
+
'series': 'llasa',
|
391 |
},
|
392 |
|
393 |
# Mars5
|
|
|
622 |
'srinivasbilla/llasa-3b-tts': {
|
623 |
'sample_audio_path': handle_file('voice_samples/EN_B00004_S00051_W000213.mp3')
|
624 |
},
|
625 |
+
'srinivasbilla/llasa-8b-tts': {
|
626 |
+
'sample_audio_path': handle_file('voice_samples/EN_B00004_S00051_W000213.mp3')
|
627 |
+
},
|
628 |
|
629 |
# MARS 5
|
630 |
'CAMB-AI/mars5_space': {
|