Pendrokar committed on
Commit
fbc6b3e
·
1 Parent(s): d1639f5

TTS added: LLaSA 8B; re-enabled OpenVoice to get to ~1000 votes; Fish Speech (FS) broken

Browse files
Files changed (1) hide show
  1. app/models.py +23 -9
app/models.py CHANGED
@@ -25,14 +25,14 @@ AVAILABLE_MODELS = {
25
  # gradio version that works with most spaces: 4.29
26
  # 'coqui/xtts': 'coqui/xtts', # 4.29 4.32; extra_headers error appears for 5.13
27
  # 'collabora/WhisperSpeech': 'collabora/WhisperSpeech', # 4.32 4.36.1
28
- # 'myshell-ai/OpenVoice': 'myshell-ai/OpenVoice', # same devs as MeloTTS, which scores higher # 4.29
29
- # 'myshell-ai/OpenVoiceV2': 'myshell-ai/OpenVoiceV2', # same devs as MeloTTS, which scores higher # 4.29
30
  # 'mrfakename/MetaVoice-1B-v0.1': 'mrfakename/MetaVoice-1B-v0.1', # 4.29 4.32
31
  'Pendrokar/xVASynth-TTS': 'Pendrokar/xVASynth-TTS', # 4.29 4.32 4.42.0
32
  'Pendrokar/xVASynth-TTS/NoDeepMoji': 'Pendrokar/xVASynth-TTS', # 4.29 4.32 4.42.0
33
  # 'coqui/CoquiTTS': 'coqui/CoquiTTS',
34
- 'mrfakename/MeloTTS': 'mrfakename/MeloTTS', # 4.29 4.32
35
- 'fishaudio/fish-speech-1': 'fishaudio/fish-speech-1', # 4.29 4.32 4.36.1
36
 
37
  # E2 & F5 TTS
38
  # F5 model
@@ -46,7 +46,7 @@ AVAILABLE_MODELS = {
46
  # Parler Mini model
47
  # 'parler-tts/parler_tts': 'parler-tts/parler_tts', # 4.29 4.32 4.36.1 4.42.0
48
  # 'parler-tts/parler_tts_mini': 'parler-tts/parler_tts_mini', # Mini is the default model of parler_tts
49
- 'parler-tts/parler-tts-expresso': 'parler-tts/parler-tts-expresso', # 4.29 4.32 4.36.1 4.42.0
50
 
51
  # # Microsoft Edge TTS
52
  # 'innoai/Edge-TTS-Text-to-Speech': 'innoai/Edge-TTS-Text-to-Speech', # API disabled
@@ -55,7 +55,7 @@ AVAILABLE_MODELS = {
55
  # 'Flux9665/MassivelyMultilingualTTS': 'Flux9665/MassivelyMultilingualTTS', # 5.1
56
 
57
  # StyleTTS v2
58
- 'Pendrokar/style-tts-2': 'Pendrokar/style-tts-2', # more votes in OG arena; emotionless
59
 
60
  # StyleTTS Kokoro v0.19
61
  # 'hexgrad/kokoro': 'hexgrad/Kokoro-TTS',
@@ -79,6 +79,8 @@ AVAILABLE_MODELS = {
79
 
80
  # llasa 3b TTS
81
  'srinivasbilla/llasa-3b-tts': 'srinivasbilla/llasa-3b-tts',
 
 
82
 
83
  # Mars5
84
  # 'CAMB-AI/mars5_space': 'CAMB-AI/mars5_space', # slow inference; Unstable
@@ -288,7 +290,7 @@ HF_SPACES = {
288
 
289
  # StyleTTS Kokoro v0.19
290
  'hexgrad/kokoro': {
291
- 'name': 'StyleTTS Kokoro v19',
292
  'function': '/generate',
293
  'text_param_index': 'text',
294
  'return_audio_index': 0,
@@ -375,8 +377,17 @@ HF_SPACES = {
375
  'text_param_index': 'target_text',
376
  'return_audio_index': 0,
377
  'is_zero_gpu_space': True,
378
- 'series': 'llasa 3b',
379
- # 'emoji': '🥵', # requires 300s reserved ZeroGPU!
 
 
 
 
 
 
 
 
 
380
  },
381
 
382
  # Mars5
@@ -611,6 +622,9 @@ OVERRIDE_INPUTS = {
611
  'srinivasbilla/llasa-3b-tts': {
612
  'sample_audio_path': handle_file('voice_samples/EN_B00004_S00051_W000213.mp3')
613
  },
 
 
 
614
 
615
  # MARS 5
616
  'CAMB-AI/mars5_space': {
 
25
  # gradio version that works with most spaces: 4.29
26
  # 'coqui/xtts': 'coqui/xtts', # 4.29 4.32; extra_headers error appears for 5.13
27
  # 'collabora/WhisperSpeech': 'collabora/WhisperSpeech', # 4.32 4.36.1
28
+ 'myshell-ai/OpenVoice': 'myshell-ai/OpenVoice', # same devs as MeloTTS, which scores higher # 4.29
29
+ 'myshell-ai/OpenVoiceV2': 'myshell-ai/OpenVoiceV2', # same devs as MeloTTS, which scores higher # 4.29
30
  # 'mrfakename/MetaVoice-1B-v0.1': 'mrfakename/MetaVoice-1B-v0.1', # 4.29 4.32
31
  'Pendrokar/xVASynth-TTS': 'Pendrokar/xVASynth-TTS', # 4.29 4.32 4.42.0
32
  'Pendrokar/xVASynth-TTS/NoDeepMoji': 'Pendrokar/xVASynth-TTS', # 4.29 4.32 4.42.0
33
  # 'coqui/CoquiTTS': 'coqui/CoquiTTS',
34
+ 'mrfakename/MeloTTS': 'mrfakename/MeloTTS', # 4.29 4.32
35
+ # 'fishaudio/fish-speech-1': 'fishaudio/fish-speech-1', # Queue ERROR
36
 
37
  # E2 & F5 TTS
38
  # F5 model
 
46
  # Parler Mini model
47
  # 'parler-tts/parler_tts': 'parler-tts/parler_tts', # 4.29 4.32 4.36.1 4.42.0
48
  # 'parler-tts/parler_tts_mini': 'parler-tts/parler_tts_mini', # Mini is the default model of parler_tts
49
+ # 'parler-tts/parler-tts-expresso': 'parler-tts/parler-tts-expresso', # 4.29 4.32 4.36.1 4.42.0
50
 
51
  # # Microsoft Edge TTS
52
  # 'innoai/Edge-TTS-Text-to-Speech': 'innoai/Edge-TTS-Text-to-Speech', # API disabled
 
55
  # 'Flux9665/MassivelyMultilingualTTS': 'Flux9665/MassivelyMultilingualTTS', # 5.1
56
 
57
  # StyleTTS v2
58
+ # 'Pendrokar/style-tts-2': 'Pendrokar/style-tts-2', # more votes in OG arena; emotionless
59
 
60
  # StyleTTS Kokoro v0.19
61
  # 'hexgrad/kokoro': 'hexgrad/Kokoro-TTS',
 
79
 
80
  # llasa 3b TTS
81
  'srinivasbilla/llasa-3b-tts': 'srinivasbilla/llasa-3b-tts',
82
+ # llasa 8b TTS
83
+ 'srinivasbilla/llasa-8b-tts': 'srinivasbilla/llasa-8b-tts',
84
 
85
  # Mars5
86
  # 'CAMB-AI/mars5_space': 'CAMB-AI/mars5_space', # slow inference; Unstable
 
290
 
291
  # StyleTTS Kokoro v0.19
292
  'hexgrad/kokoro': {
293
+ 'name': 'Kokoro v0.19',
294
  'function': '/generate',
295
  'text_param_index': 'text',
296
  'return_audio_index': 0,
 
377
  'text_param_index': 'target_text',
378
  'return_audio_index': 0,
379
  'is_zero_gpu_space': True,
380
+ 'series': 'llasa',
381
+ },
382
+
383
+ # LlaSa 8B
384
+ 'srinivasbilla/llasa-8b-tts': {
385
+ 'name': 'LLaSA 8B',
386
+ 'function': '/infer',
387
+ 'text_param_index': 'target_text',
388
+ 'return_audio_index': 0,
389
+ 'is_zero_gpu_space': True,
390
+ 'series': 'llasa',
391
  },
392
 
393
  # Mars5
 
622
  'srinivasbilla/llasa-3b-tts': {
623
  'sample_audio_path': handle_file('voice_samples/EN_B00004_S00051_W000213.mp3')
624
  },
625
+ 'srinivasbilla/llasa-8b-tts': {
626
+ 'sample_audio_path': handle_file('voice_samples/EN_B00004_S00051_W000213.mp3')
627
+ },
628
 
629
  # MARS 5
630
  'CAMB-AI/mars5_space': {