Spaces:
Running
Running
Hendrik Schroeter
committed on
Commit
•
ea2e234
1
Parent(s):
7cbdca2
load local model
Browse files
- .gitattributes +2 -0
- DeepFilterNet2/checkpoints/model_96.ckpt.best +3 -0
- DeepFilterNet2/config.ini +109 -0
- app.py +1 -1
.gitattributes
CHANGED
@@ -25,3 +25,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
25 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
26 |
*.zstandard filter=lfs diff=lfs merge=lfs -text
|
27 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
25 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
26 |
*.zstandard filter=lfs diff=lfs merge=lfs -text
|
27 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
28 |
+
*ckpt filter=lfs diff=lfs merge=lfs -text
|
29 |
+
*best filter=lfs diff=lfs merge=lfs -text
|
DeepFilterNet2/checkpoints/model_96.ckpt.best
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb5eccb429e675bb4ec5ec9e280f048bfff9787b40bd3eb835fd11509eb14a3e
|
3 |
+
size 9397209
|
DeepFilterNet2/config.ini
ADDED
@@ -0,0 +1,109 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[train]
|
2 |
+
seed = 43
|
3 |
+
device =
|
4 |
+
model = deepfilternet2
|
5 |
+
jit = false
|
6 |
+
mask_only = false
|
7 |
+
df_only = false
|
8 |
+
batch_size = 96
|
9 |
+
batch_size_eval = 128
|
10 |
+
num_workers = 16
|
11 |
+
max_sample_len_s = 3.0
|
12 |
+
p_atten_lim = 0.0
|
13 |
+
p_reverb = 0.1
|
14 |
+
overfit = false
|
15 |
+
max_epochs = 100
|
16 |
+
log_freq = 100
|
17 |
+
log_timings = False
|
18 |
+
validation_criteria = loss
|
19 |
+
validation_criteria_rule = min
|
20 |
+
early_stopping_patience = 15
|
21 |
+
global_ds_sampling_f = 1
|
22 |
+
num_prefetch_batches = 8
|
23 |
+
dataloader_snrs = -5,0,5,10,20,40
|
24 |
+
detect_anomaly = false
|
25 |
+
batch_size_scheduling = 0/8,1/16,2/24,5/32,10/64,20/128,40/9999
|
26 |
+
start_eval = true
|
27 |
+
validation_set_caching = false
|
28 |
+
|
29 |
+
[df]
|
30 |
+
sr = 48000
|
31 |
+
fft_size = 960
|
32 |
+
hop_size = 480
|
33 |
+
nb_erb = 32
|
34 |
+
nb_df = 96
|
35 |
+
norm_tau = 1
|
36 |
+
lsnr_max = 35
|
37 |
+
lsnr_min = -15
|
38 |
+
min_nb_erb_freqs = 2
|
39 |
+
pad_mode = input_specf
|
40 |
+
|
41 |
+
[deepfilternet]
|
42 |
+
conv_lookahead = 2
|
43 |
+
conv_ch = 64
|
44 |
+
conv_depthwise = True
|
45 |
+
emb_hidden_dim = 256
|
46 |
+
emb_num_layers = 3
|
47 |
+
gru_groups = 8
|
48 |
+
linear_groups = 8
|
49 |
+
conv_dec_mode = transposed
|
50 |
+
convt_depthwise = True
|
51 |
+
mask_pf = False
|
52 |
+
df_order = 5
|
53 |
+
df_lookahead = 2
|
54 |
+
df_hidden_dim = 256
|
55 |
+
df_num_layers = 2
|
56 |
+
dfop_method = df
|
57 |
+
group_shuffle = False
|
58 |
+
conv_kernel = 1,3
|
59 |
+
df_gru_skip = none
|
60 |
+
df_output_layer = groupedlinear
|
61 |
+
gru_type = squeeze
|
62 |
+
df_pathway_kernel_size_t = 5
|
63 |
+
df_n_iter = 1
|
64 |
+
enc_concat = True
|
65 |
+
conv_kernel_inp = 3,3
|
66 |
+
|
67 |
+
[localsnrloss]
|
68 |
+
factor = 1e-3
|
69 |
+
|
70 |
+
[maskloss]
|
71 |
+
factor = 0
|
72 |
+
mask = iam
|
73 |
+
gamma = 0.6
|
74 |
+
gamma_pred = 0.6
|
75 |
+
f_under = 1
|
76 |
+
|
77 |
+
[spectralloss]
|
78 |
+
factor_magnitude = 1000
|
79 |
+
factor_complex = 1000
|
80 |
+
gamma = 0.3
|
81 |
+
|
82 |
+
[dfalphaloss]
|
83 |
+
factor = 0.0
|
84 |
+
|
85 |
+
[multiresspecloss]
|
86 |
+
factor = 500
|
87 |
+
factor_complex = 500
|
88 |
+
gamma = 0.3
|
89 |
+
fft_sizes = 256,512,1024
|
90 |
+
|
91 |
+
[optim]
|
92 |
+
lr = 0.001
|
93 |
+
momentum = 0
|
94 |
+
weight_decay = 1e-12
|
95 |
+
weight_decay_end = 0.05
|
96 |
+
optimizer = adamw
|
97 |
+
lr_min = 1e-06
|
98 |
+
lr_warmup = 0.0001
|
99 |
+
warmup_epochs = 3
|
100 |
+
lr_cycle_mul = 1.0
|
101 |
+
lr_cycle_decay = 0.5
|
102 |
+
lr_cycle_limit = 1
|
103 |
+
lr_update_per_epoch = False
|
104 |
+
lr_cycle_epochs = -1
|
105 |
+
|
106 |
+
[sdrloss]
|
107 |
+
factor = 0.0
|
108 |
+
segmental_ws = 0
|
109 |
+
|
app.py
CHANGED
@@ -18,7 +18,7 @@ from df.enhance import enhance, init_df, load_audio, save_audio
|
|
18 |
from df.utils import resample
|
19 |
|
20 |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
21 |
-
model, df, _ = init_df(config_allow_defaults=True)
|
22 |
model = model.to(device=device).eval()
|
23 |
|
24 |
NOISES = {
|
|
|
18 |
from df.utils import resample
|
19 |
|
20 |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
21 |
+
model, df, _ = init_df("./DeepFilterNet2", config_allow_defaults=True)
|
22 |
model = model.to(device=device).eval()
|
23 |
|
24 |
NOISES = {
|