Hendrik Schroeter committed on
Commit
2527d95
·
unverified ·
1 Parent(s): 6df9060

Some more debug prints

Browse files
Files changed (1) hide show
  1. app.py +10 -6
app.py CHANGED
@@ -43,6 +43,7 @@ def mix_at_snr(clean, noise, snr, eps=1e-10):
43
  K = torch.sqrt((E_noise / E_speech) * 10 ** (snr / 10) + eps)
44
  noise = noise / K
45
  mixture = clean + noise
 
46
  assert torch.isfinite(mixture).all()
47
  max_m = mixture.abs().max()
48
  if max_m > 1:
@@ -51,25 +52,28 @@ def mix_at_snr(clean, noise, snr, eps=1e-10):
51
  return clean, noise, mixture
52
 
53
 
54
- def mix_and_denoise(speech, speech_alt, noise, snr):
55
  sr = config("sr", 48000, int, section="df")
56
- print(speech, noise, snr)
57
  if noise is None:
58
  noise = "samples/dkitchen.wav"
59
  sp_kwargs = {}
60
- if speech is None or "none" in speech:
61
  speech = "samples/p232_013_clean.wav"
62
- if speech_alt is not None and "none" not in speech_alt:
63
  print("using speech_alt")
64
- speech = speech_alt
65
  else:
 
66
  sp_kwargs = {"frame_offset": 4800}
67
- speech, _ = load_audio(speech, sr, **sp_kwargs)
68
  print(f"Loaded speech with shape {speech.shape}")
69
  noise, _ = load_audio(noise, sr)
70
  print(f"Loaded noise with shape {noise.shape}")
71
  speech, noise, noisy = mix_at_snr(speech, noise, snr)
 
72
  enhanced = enhance(model, df, noisy)
 
73
  lim = torch.linspace(0.0, 1.0, int(sr * 0.15)).unsqueeze(0)
74
  lim = torch.cat((lim, torch.ones(1, enhanced.shape[1] - lim.shape[1])), dim=1)
75
  enhanced = enhanced * lim
 
43
  K = torch.sqrt((E_noise / E_speech) * 10 ** (snr / 10) + eps)
44
  noise = noise / K
45
  mixture = clean + noise
46
+ print("mixture:", mixture.shape)
47
  assert torch.isfinite(mixture).all()
48
  max_m = mixture.abs().max()
49
  if max_m > 1:
 
52
  return clean, noise, mixture
53
 
54
 
55
+ def mix_and_denoise(speech_rec, speech_upl, noise, snr):
56
  sr = config("sr", 48000, int, section="df")
57
+ print(speech_rec, noise, snr)
58
  if noise is None:
59
  noise = "samples/dkitchen.wav"
60
  sp_kwargs = {}
61
+ if speech_rec is None or "none" in speech_rec:
62
  speech = "samples/p232_013_clean.wav"
63
+ if speech_upl is not None and "none" not in speech_upl:
64
  print("using speech_alt")
65
+ speech = speech_upl
66
  else:
67
+ speech = speech_rec
68
  sp_kwargs = {"frame_offset": 4800}
69
+ speech, _ = load_audio(speech_rec, sr, **sp_kwargs)
70
  print(f"Loaded speech with shape {speech.shape}")
71
  noise, _ = load_audio(noise, sr)
72
  print(f"Loaded noise with shape {noise.shape}")
73
  speech, noise, noisy = mix_at_snr(speech, noise, snr)
74
+ print("Start denoising audio")
75
  enhanced = enhance(model, df, noisy)
76
+ print("Denoising finished")
77
  lim = torch.linspace(0.0, 1.0, int(sr * 0.15)).unsqueeze(0)
78
  lim = torch.cat((lim, torch.ones(1, enhanced.shape[1] - lim.shape[1])), dim=1)
79
  enhanced = enhanced * lim