dkounadis
/

artificial-styletts2

audio-generation

Model card Files Files and versions

Dionyssos committed on Sep 2, 2024

Commit

5d9a91a

·

1 Parent(s): e1acca5

Readme

Files changed (2) hide show

README.py +31 -0
tts_harvard.py +2 -2

README.py ADDED Viewed

	@@ -0,0 +1,31 @@

+---
+license: cc-by-nc-sa-4.0
+language:
+- en
+pipeline_tag: text-to-speech
+tags:
+- msp-podcast
+- emotion-recognition
+- audio
+- speech
+- styletts2
+- mimic3
+- speech-emotion-recognition
+- dkounadis
+---
+# Artificial StyleTTS2
+Using Mimic-3 Synthetic Speech to Drive StyleTTS2
+**arXiv: coming soon**
+```
+```
+See the demo at the [SHIFT TTS tool](https://github.com/audeering/shift/tree/main)

tts_harvard.py CHANGED Viewed

@@ -106,12 +106,12 @@ for audio_prompt in ['english',
                      'human',
                      'foreign',
                      'foreign_4x']:
-    OUT_FILE = f'{audio_prompt}_hfg.wav'
     if not os.path.isfile(OUT_FILE):
                     total_audio = []
                     total_style = []
                     ix = 0
-                    for list_of_10 in harvard_individual_sentences[:2]:
                         # long_sentence = ' '.join(list_of_10['sentences'])
                         # harvard.append(long_sentence.replace('.', ' '))
                         for text in list_of_10['sentences']:

                      'human',
                      'foreign',
                      'foreign_4x']:
+    OUT_FILE = f'{audio_prompt}_hfullh.wav'
     if not os.path.isfile(OUT_FILE):
                     total_audio = []
                     total_style = []
                     ix = 0
+                    for list_of_10 in harvard_individual_sentences[:1000]:
                         # long_sentence = ' '.join(list_of_10['sentences'])
                         # harvard.append(long_sentence.replace('.', ' '))
                         for text in list_of_10['sentences']: