Spaces:

innnky
/

soft-vits-singingvc

App Files Files Community

rcell committed on Sep 13, 2022

Commit

3f36c0a

•

1 Parent(s): c195376

fix

Files changed (1) hide show

app.py +6 -6

app.py CHANGED Viewed

@@ -15,19 +15,19 @@ import utils
 from models import SynthesizerTrn
 from text.symbols import symbols
 from text import text_to_sequence
-import torchcrepe
 def resize2d(source, target_len):
     """Resample a 1-D sequence to ``target_len`` points by linear interpolation.

     Values below 0.001 are replaced with NaN before interpolating, and any
     NaN left in the interpolated result is turned into 0 by ``np.nan_to_num``.

     Args:
         source: 1-D array-like of numbers. It is never modified; the
             thresholding is applied to an internal float copy.
         target_len: Number of points in the returned array.

     Returns:
         A float ``np.ndarray`` of length ``target_len``.
     """
     # Work on a float copy: assigning NaN in place would clobber the caller's
     # array and fails outright for integer arrays or plain lists.
     contour = np.array(source, dtype=float)
     contour[contour < 0.001] = np.nan
     n = len(contour)
     # target_len query positions spaced n / target_len apart on the source index axis.
     positions = np.arange(0, n * target_len, n) / target_len
     target = np.interp(positions, np.arange(0, n), contour)
     return np.nan_to_num(target)
 # Pre-commit version of convert_wav_22050_to_f0; the lines marked "-" are the
 # ones this commit removes.
 # It calls torchcrepe.predict on `audio` (fmin=50, fmax=550, sample_rate=22050,
 # model='full', batch_size=2048, device='cuda:0'), converts the result with
 # .numpy() and keeps element 0. It then returns an array of the same shape in
 # which only entries > 0 are copied over; every other entry stays 0.
 # NOTE(review): .numpy() is called directly on the predict() result. If that
 # tensor lives on 'cuda:0', torch refuses the conversion until it is moved to
 # the CPU - presumably what this "fix" commit works around; confirm.
 def convert_wav_22050_to_f0(audio):
-    tmp = torchcrepe.predict(audio=audio, fmin=50, fmax=550,
-                             sample_rate=22050, model='full',
-                             batch_size=2048, device='cuda:0').numpy()[0]
     f0 = np.zeros_like(tmp)
-    f0[tmp > 0] = tmp[tmp > 0]
     return f0
 def get_text(text, hps):
     text_norm = text_to_sequence(text, hps.data.text_cleaners)
     if hps.data.add_blank:

 from models import SynthesizerTrn
 from text.symbols import symbols
 from text import text_to_sequence
 def resize2d(source, target_len):
     """Resample a 1-D sequence to ``target_len`` points by linear interpolation.

     Values below 0.001 are replaced with NaN before interpolating, and any
     NaN left in the interpolated result is turned into 0 by ``np.nan_to_num``.

     Args:
         source: 1-D array-like of numbers. It is never modified; the
             thresholding is applied to an internal float copy.
         target_len: Number of points in the returned array.

     Returns:
         A float ``np.ndarray`` of length ``target_len``.
     """
     # Work on a float copy: assigning NaN in place would clobber the caller's
     # array and fails outright for integer arrays or plain lists.
     contour = np.array(source, dtype=float)
     contour[contour < 0.001] = np.nan
     n = len(contour)
     # target_len query positions spaced n / target_len apart on the source index axis.
     positions = np.arange(0, n * target_len, n) / target_len
     target = np.interp(positions, np.arange(0, n), contour)
     return np.nan_to_num(target)
 # Post-commit version of convert_wav_22050_to_f0; the lines marked "+" are the
 # ones this commit adds.
 # It runs librosa.pyin on `audio`, searching between the frequencies of notes
 # C0 and C7 with frame_length=1780, and keeps element 0 of pyin's return value.
 # It then returns an array of the same shape in which only entries > 0 are
 # copied over; all others (including NaN, which compares False against 0) stay 0.
 # NOTE(review): no `sr` is passed, so pyin falls back to its own default sample
 # rate - presumably 22050 Hz to match the function name; confirm against the
 # installed librosa version.
 # NOTE(review): no `import librosa` is visible in this hunk; verify it exists
 # elsewhere in app.py.
 def convert_wav_22050_to_f0(audio):
+    tmp = librosa.pyin(audio,
+                fmin=librosa.note_to_hz('C0'),
+                fmax=librosa.note_to_hz('C7'),
+                frame_length=1780)[0]
     f0 = np.zeros_like(tmp)
+    f0[tmp>0] = tmp[tmp>0]
     return f0
 def get_text(text, hps):
     text_norm = text_to_sequence(text, hps.data.text_cleaners)
     if hps.data.add_blank: