Pendrokar committed on
Commit
484a84d
·
1 Parent(s): 4f0aefc

New TTS: OpenAudio S1 Mini (by Fish Audio)

Browse files
Files changed (1) hide show
  1. app/models.py +32 -2
app/models.py CHANGED
@@ -35,7 +35,6 @@ AVAILABLE_MODELS = {
35
  # 'Pendrokar/xVASynth-TTS/NoDeepMoji': 'Pendrokar/xVASynth-TTS', # 4.29 4.32 4.42.0
36
  # 'coqui/CoquiTTS': 'coqui/CoquiTTS',
37
  # 'mrfakename/MeloTTS': 'mrfakename/MeloTTS', # 4.29 4.32
38
- # 'fishaudio/fish-speech-1': 'fishaudio/fish-speech-1', # Queue ERROR
39
 
40
  # E2 & F5 TTS
41
  # F5 model
@@ -119,7 +118,11 @@ AVAILABLE_MODELS = {
119
  # Chatterbox
120
  'ResembleAI/Chatterbox': 'ResembleAI/Chatterbox',
121
 
 
 
 
122
  # HF TTS w issues
 
123
  # 'LeeSangHoon/HierSpeech_TTS': 'LeeSangHoon/HierSpeech_TTS', # irresponsive to exclamation marks # 4.29
124
  # 'PolyAI/pheme': '/predict#0', # sleepy HF Space
125
  # 'amphion/Text-to-Speech': '/predict#0', # disabled also on original HF space due to poor ratings
@@ -304,6 +307,16 @@ HF_SPACES = {
304
  # 'emoji': '😷',
305
  },
306
 
 
 
 
 
 
 
 
 
 
 
307
  # F5 TTS
308
  'mrfakename/E2-F5-TTS': {
309
  'name': 'F5 TTS',
@@ -687,6 +700,23 @@ OVERRIDE_INPUTS = {
687
  'use_memory_cache': "never",
688
  },
689
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
690
  # F5
691
  'mrfakename/E2-F5-TTS': {
692
  'ref_audio_input': handle_file('voice_samples/EN_B00004_S00051_W000213.mp3'),
@@ -966,7 +996,7 @@ closed_source = [
966
  ]
967
 
968
  # top five models in order to always have one of them picked and scrutinized
969
- top_five = ['PHBJT/multi_parler_tts', 'PHBJT/multi_parler_tts/reformatted', 'ResembleAI/Chatterbox']
970
 
971
  # prioritize low vote models
972
  sql = 'SELECT name FROM model WHERE (upvote + downvote) < 750 ORDER BY (upvote + downvote) ASC'
 
35
  # 'Pendrokar/xVASynth-TTS/NoDeepMoji': 'Pendrokar/xVASynth-TTS', # 4.29 4.32 4.42.0
36
  # 'coqui/CoquiTTS': 'coqui/CoquiTTS',
37
  # 'mrfakename/MeloTTS': 'mrfakename/MeloTTS', # 4.29 4.32
 
38
 
39
  # E2 & F5 TTS
40
  # F5 model
 
118
  # Chatterbox
119
  'ResembleAI/Chatterbox': 'ResembleAI/Chatterbox',
120
 
121
+ # OpenAudio S1 (Fish Audio)
122
+ 'fishaudio/openaudio-s1-mini': 'fishaudio/openaudio-s1-mini',
123
+
124
  # HF TTS w issues
125
+ # 'fishaudio/fish-speech-1': 'fishaudio/fish-speech-1', # Discontinued for OpenAudio S1
126
  # 'LeeSangHoon/HierSpeech_TTS': 'LeeSangHoon/HierSpeech_TTS', # irresponsive to exclamation marks # 4.29
127
  # 'PolyAI/pheme': '/predict#0', # sleepy HF Space
128
  # 'amphion/Text-to-Speech': '/predict#0', # disabled also on original HF space due to poor ratings
 
307
  # 'emoji': '😷',
308
  },
309
 
310
+ # OpenAudio S1 (Fish Audio)
311
+ 'fishaudio/openaudio-s1-mini': {
312
+ 'name': 'OpenAudio S1 Mini',
313
+ 'function': '/partial',
314
+ 'text_param_index': 'text',
315
+ 'return_audio_index': 0,
316
+ 'series': 'Fish Speech',
317
+ # 'emoji': '😷',
318
+ },
319
+
320
  # F5 TTS
321
  'mrfakename/E2-F5-TTS': {
322
  'name': 'F5 TTS',
 
700
  'use_memory_cache': "never",
701
  },
702
 
703
+ # OpenAudio S1 (Fish Audio)
704
+ 'fishaudio/openaudio-s1-mini': {
705
+ # 'reference_id': "Hello!!", # voice id string - https://fish.audio/discovery/
706
+ # 'reference_audio': None,
707
+ # 'reference_text': None,
708
+ 'reference_audio': DEFAULT_VOICE_SAMPLE,
709
+ 'reference_text': DEFAULT_VOICE_TRANSCRIPT,
710
+ 'max_new_tokens': 0,
711
+ 'chunk_length': 0,
712
+ 'top_p': 0.9,
713
+ 'repetition_penalty': 1.1,
714
+ 'temperature': 0.9,
715
+ 'seed': 0,
716
+ 'use_memory_cache': "on",
717
+ # 'emoji': '😷',
718
+ },
719
+
720
  # F5
721
  'mrfakename/E2-F5-TTS': {
722
  'ref_audio_input': handle_file('voice_samples/EN_B00004_S00051_W000213.mp3'),
 
996
  ]
997
 
998
  # top five models in order to always have one of them picked and scrutinized
999
+ top_five = ['PHBJT/multi_parler_tts', 'fishaudio/openaudio-s1-mini', 'ResembleAI/Chatterbox']
1000
 
1001
  # prioritize low vote models
1002
  sql = 'SELECT name FROM model WHERE (upvote + downvote) < 750 ORDER BY (upvote + downvote) ASC'