rcell committed on
Commit
3f36c0a
1 Parent(s): c195376
Files changed (1) hide show
  1. app.py +6 -6
app.py CHANGED
@@ -15,19 +15,19 @@ import utils
15
  from models import SynthesizerTrn
16
  from text.symbols import symbols
17
  from text import text_to_sequence
18
- import torchcrepe
19
-
20
  def resize2d(source, target_len):
21
  source[source<0.001] = np.nan
22
  target = np.interp(np.arange(0, len(source)*target_len, len(source))/ target_len, np.arange(0, len(source)), source)
23
  return np.nan_to_num(target)
24
  def convert_wav_22050_to_f0(audio):
25
- tmp = torchcrepe.predict(audio=audio, fmin=50, fmax=550,
26
- sample_rate=22050, model='full',
27
- batch_size=2048, device='cuda:0').numpy()[0]
 
28
  f0 = np.zeros_like(tmp)
29
- f0[tmp > 0] = tmp[tmp > 0]
30
  return f0
 
31
  def get_text(text, hps):
32
  text_norm = text_to_sequence(text, hps.data.text_cleaners)
33
  if hps.data.add_blank:
 
15
  from models import SynthesizerTrn
16
  from text.symbols import symbols
17
  from text import text_to_sequence
 
 
18
  def resize2d(source, target_len):
19
  source[source<0.001] = np.nan
20
  target = np.interp(np.arange(0, len(source)*target_len, len(source))/ target_len, np.arange(0, len(source)), source)
21
  return np.nan_to_num(target)
22
  def convert_wav_22050_to_f0(audio):
23
+ tmp = librosa.pyin(audio,
24
+ fmin=librosa.note_to_hz('C0'),
25
+ fmax=librosa.note_to_hz('C7'),
26
+ frame_length=1780)[0]
27
  f0 = np.zeros_like(tmp)
28
+ f0[tmp>0] = tmp[tmp>0]
29
  return f0
30
+
31
  def get_text(text, hps):
32
  text_norm = text_to_sequence(text, hps.data.text_cleaners)
33
  if hps.data.add_blank: