Pendrokar committed on
Commit
89b92be
1 Parent(s): 62e9c0f

openvoice TTS disabled in favor of melotts; xVASynth American English model trained and enabled

Browse files
Files changed (1) hide show
  1. app.py +26 -25
app.py CHANGED
@@ -65,34 +65,35 @@ AVAILABLE_MODELS = {
65
  # 'VoiceCraft 2.0': 'voicecraft',
66
  # 'Parler TTS': 'parler'
67
 
68
- # HF Gradio Spaces:
69
- 'coqui/xtts': 'coqui/xtts',
70
- # 'collabora/WhisperSpeech': 'collabora/WhisperSpeech', # old gradio?
71
- 'myshell-ai/OpenVoice': 'myshell-ai/OpenVoice', # 4.29.0
72
- 'myshell-ai/OpenVoiceV2': 'myshell-ai/OpenVoiceV2', # 4.29.0
73
- 'mrfakename/MetaVoice-1B-v0.1': 'mrfakename/MetaVoice-1B-v0.1', # 4.29.0
74
- #'Pendrokar/xVASynth-TTS': 'Pendrokar/xVASynth-TTS', # EN-GB 4.29.0 4.42.0
 
75
  # 'coqui/CoquiTTS': 'coqui/CoquiTTS',
76
- 'LeeSangHoon/HierSpeech_TTS': 'LeeSangHoon/HierSpeech_TTS', # 4.29.0
77
- 'mrfakename/MeloTTS': 'mrfakename/MeloTTS', # 4.29.0
78
- 'fishaudio/fish-speech-1': 'fishaudio/fish-speech-1', # 4.29.0
79
 
80
- # Parler
81
- 'parler-tts/parler_tts': 'parler-tts/parler_tts', # 4.29.0 4.42.0
82
- 'parler-tts/parler-tts-expresso': 'parler-tts/parler-tts-expresso', # 4.29.0 4.42.0
83
 
84
- # Microsoft Edge TTS
85
- 'innoai/Edge-TTS-Text-to-Speech': 'innoai/Edge-TTS-Text-to-Speech',
86
 
87
- # TTS w issues
 
88
  # 'PolyAI/pheme': '/predict#0', # sleepy HF Space
89
- # 'amphion/Text-to-Speech': '/predict#0', # old running space, takes a whole minute to synthesize
90
  # 'suno/bark': '3#0', # Hallucinates
91
  # 'shivammehta25/Matcha-TTS': '5#0', # seems to require multiple requests for setup
92
- # 'styletts2/styletts2': '0#0', # API disabled
93
- # 'Manmay/tortoise-tts': '/predict#0', # Cannot skip text-from-file parameter
94
  # 'pytorch/Tacotron2': '0#0', # old gradio
95
- # 'parler-tts/parler_tts_mini': 'parler-tts/parler_tts_mini', # old gradio - ValueError: Unsupported protocol: sse_v3
96
  }
97
 
98
  HF_SPACES = {
@@ -167,7 +168,7 @@ HF_SPACES = {
167
  'text_param_index': 0,
168
  'return_audio_index': 0,
169
  },
170
- # Parler
171
  'parler-tts/parler_tts_mini': {
172
  'name': 'Parler Mini',
173
  'function': '/gen_tts',
@@ -229,11 +230,11 @@ OVERRIDE_INPUTS = {
229
  },
230
  'myshell-ai/OpenVoice': {
231
  1: 'default', # style
232
- 2: DEFAULT_VOICE_SAMPLE_STR, # voice sample
233
  },
234
  'myshell-ai/OpenVoiceV2': {
235
- 1: 'en_default', # style
236
- 2: DEFAULT_VOICE_SAMPLE_STR, # voice sample
237
  },
238
  'PolyAI/pheme': {
239
  1: 'YOU1000000044_S0000798', # voice
@@ -241,7 +242,7 @@ OVERRIDE_INPUTS = {
241
  3: 0.7, #Tempo - Gradio Slider issue: takes min. rather than value
242
  },
243
  'Pendrokar/xVASynth-TTS': {
244
- 1: 'ccby_nvidia_hifi_92_F', #fine-tuned voice model name; #92 BRITISH
245
  3: 1.0, #pacing/duration - Gradio Slider issue: takes min. rather than value
246
  },
247
  'suno/bark': {
 
65
  # 'VoiceCraft 2.0': 'voicecraft',
66
  # 'Parler TTS': 'parler'
67
 
68
+ # HF Gradio Spaces: # <works with gradio version #>
69
+ # gradio version that works with most spaces: 4.29
70
+ 'coqui/xtts': 'coqui/xtts', # 4.29 4.32
71
+ 'collabora/WhisperSpeech': 'collabora/WhisperSpeech', # 4.32 4.36.1
72
+ # 'myshell-ai/OpenVoice': 'myshell-ai/OpenVoice', # same devs as MeloTTS, which scores higher # 4.29
73
+ # 'myshell-ai/OpenVoiceV2': 'myshell-ai/OpenVoiceV2', # same devs as MeloTTS, which scores higher # 4.29
74
+ 'mrfakename/MetaVoice-1B-v0.1': 'mrfakename/MetaVoice-1B-v0.1', # 4.29 4.32
75
+ # 'Pendrokar/xVASynth-TTS': 'Pendrokar/xVASynth-TTS', # EN-GB 4.29 4.32 4.42.0
76
  # 'coqui/CoquiTTS': 'coqui/CoquiTTS',
77
+ 'mrfakename/MeloTTS': 'mrfakename/MeloTTS', # 4.29 4.32
78
+ 'fishaudio/fish-speech-1': 'fishaudio/fish-speech-1', # 4.29 4.32 4.36.1
 
79
 
80
+ # # Parler
81
+ 'parler-tts/parler_tts': 'parler-tts/parler_tts', # 4.29 4.32 4.36.1 4.42.0
82
+ 'parler-tts/parler-tts-expresso': 'parler-tts/parler-tts-expresso', # 4.29 4.32 4.36.1 4.42.0
83
 
84
+ # # Microsoft Edge TTS
85
+ 'innoai/Edge-TTS-Text-to-Speech': 'innoai/Edge-TTS-Text-to-Speech', # 4.29
86
 
87
+ # HF TTS with issues
88
+ # 'LeeSangHoon/HierSpeech_TTS': 'LeeSangHoon/HierSpeech_TTS', # unresponsive to exclamation marks # 4.29
89
  # 'PolyAI/pheme': '/predict#0', # sleepy HF Space
90
+ # 'amphion/Text-to-Speech': '/predict#0', # disabled also on original HF space due to poor ratings
91
  # 'suno/bark': '3#0', # Hallucinates
92
  # 'shivammehta25/Matcha-TTS': '5#0', # seems to require multiple requests for setup
93
+ # 'styletts2/styletts2': '0#0', # API disabled, awaiting approval of PR #15
94
+ # 'Manmay/tortoise-tts': '/predict#0', # Cannot retrieve streamed file; 403
95
  # 'pytorch/Tacotron2': '0#0', # old gradio
96
+ # 'parler-tts/parler_tts_mini': 'parler-tts/parler_tts_mini', # Mini is the default model of parler_tts
97
  }
98
 
99
  HF_SPACES = {
 
168
  'text_param_index': 0,
169
  'return_audio_index': 0,
170
  },
171
+ # Parler Mini
172
  'parler-tts/parler_tts_mini': {
173
  'name': 'Parler Mini',
174
  'function': '/gen_tts',
 
230
  },
231
  'myshell-ai/OpenVoice': {
232
  1: 'default', # style
233
+ 2: 'https://huggingface.co/spaces/myshell-ai/OpenVoiceV2/resolve/main/examples/speaker0.mp3', # voice sample
234
  },
235
  'myshell-ai/OpenVoiceV2': {
236
+ 1: 'en_us', # style
237
+ 2: 'https://huggingface.co/spaces/myshell-ai/OpenVoiceV2/resolve/main/examples/speaker0.mp3', # voice sample
238
  },
239
  'PolyAI/pheme': {
240
  1: 'YOU1000000044_S0000798', # voice
 
242
  3: 0.7, #Tempo - Gradio Slider issue: takes min. rather than value
243
  },
244
  'Pendrokar/xVASynth-TTS': {
245
+ 1: 'x_ex04', #fine-tuned voice model name
246
  3: 1.0, #pacing/duration - Gradio Slider issue: takes min. rather than value
247
  },
248
  'suno/bark': {