|
|
|
|
|
defaults: |
|
- /solver/default |
|
- /model: score/basic |
|
- override /dset: audio/default |
|
- _self_ |
|
|
|
solver: diffusion |
|
|
|
sample_rate: 16000 |
|
channels: 1 |
|
compression_model_checkpoint: //sig/5091833e |
|
n_q: 2 |
|
|
|
dataset: |
|
batch_size: 8 |
|
num_workers: 10 |
|
segment_duration: 1 |
|
train: |
|
num_samples: 100 |
|
valid: |
|
num_samples: 100 |
|
evaluate: |
|
batch_size: 8 |
|
num_samples: 10 |
|
generate: |
|
batch_size: 8 |
|
num_samples: 10 |
|
segment_duration: 10 |
|
|
|
loss: |
|
kind: mse |
|
norm_power: 0. |
|
|
|
valid: |
|
every: 1 |
|
|
|
evaluate: |
|
every: 5 |
|
num_workers: 5 |
|
metrics: |
|
visqol: false |
|
sisnr: false |
|
rvm: true |
|
|
|
generate: |
|
every: 5 |
|
num_workers: 5 |
|
audio: |
|
sample_rate: ${sample_rate} |
|
|
|
checkpoint: |
|
save_last: true |
|
save_every: 25 |
|
keep_last: 10 |
|
keep_every_states: null |
|
|
|
|
|
optim: |
|
epochs: 50 |
|
updates_per_epoch: 2000 |
|
lr: 2e-4 |
|
max_norm: 0 |
|
optimizer: adam |
|
adam: |
|
betas: [0.9, 0.999] |
|
weight_decay: 0. |
|
ema: |
|
use: true |
|
updates: 1 |
|
device: ${device} |
|
decay: 0.99 |
|
|
|
processor: |
|
name: multi_band_processor |
|
use: false |
|
n_bands: 8 |
|
num_samples: 10_000 |
|
power_std: 1. |
|
|
|
resampling: |
|
use: false |
|
target_sr: 16000 |
|
|
|
filter: |
|
use: false |
|
n_bands: 4 |
|
idx_band: 0 |
|
cutoffs: null |
|
|
|
schedule: |
|
repartition: "power" |
|
variable_step_batch: true |
|
beta_t0: 1.0e-5 |
|
beta_t1: 2.9e-2 |
|
beta_exp: 7.5 |
|
num_steps: 1000 |
|
variance: 'beta' |
|
clip: 5. |
|
rescale: 1. |
|
n_bands: null |
|
noise_scale: 1.0 |
|
|
|
metrics: |
|
num_stage: 4 |
|
|