# Hydra defaults list: the configs composed into this one, in listed order.
# `_self_` marks the position at which this file's own keys are merged, so
# entries listed after it can override values set below.
# NOTE(review): the lines before `defaults` were empty table residue in the
# extracted text. If the original file carried a header comment (for example a
# Hydra package directive), it is not recoverable from here - confirm against
# the repository.
defaults:
  - /solver/default
  - /conditioner: none
  - _self_
  - /solver/musicgen/evaluation: none
  - override /dset: audio/default
# Autocast toggle and the dtype paired with it.
# NOTE(review): presumably enables mixed-precision execution in the solver -
# confirm against the code that reads these keys.
autocast: true
autocast_dtype: float16
# Solver selection plus the values every run must provide.
# `???` is OmegaConf's marker for a mandatory value: it has to be supplied by
# another config or a command-line override before it is accessed.
solver: musicgen
sample_rate: ???
channels: ???
compression_model_checkpoint: ???
# Left unset (null) by default.
# NOTE(review): presumably null means "use whatever the compression model
# itself defines" - confirm against the solver code.
compression_model_n_q: null
# Token handling options.
# Nesting restored: `padding_with_special_token` is the only key that can
# belong to the otherwise empty `tokens` mapping.
tokens:
  padding_with_special_token: false
# Stereo codebook interleaving, disabled by default.
# NOTE(review): `per_timestep` is assumed to be a sub-option of this mapping
# (nesting was lost in the extracted text) - confirm.
interleave_stereo_codebooks:
  use: false
  per_timestep: false
# Cache settings; writing is off by default.
# `path` had no value in the original (YAML null). It is spelled out as an
# explicit `null` here, matching how the rest of the file writes unset values.
# NOTE(review): the `write*` keys are assumed to be siblings of `path`, not
# children of it - confirm against the code that reads `cache`.
cache:
  path: null
  write: false
  write_shard: 0
  write_num_shards: 1
# Data loading options shared by all splits, followed by per-split sample
# counts. The three `num_samples` keys were flattened into duplicates in the
# extracted text; each is restored under the split name that precedes it.
dataset:
  batch_size: 128
  num_workers: 10
  segment_duration: 30
  min_segment_ratio: 0.8
  return_info: true
  train:
    num_samples: 1000000
  valid:
    num_samples: 10000
  generate:
    num_samples: 50
# Per-metric configuration. Every metric names a `model` and carries a
# sub-mapping keyed by that same model name holding the model's settings.
# NOTE(review): the `//reference/...` paths are kept verbatim; how that prefix
# is resolved is not visible in this file - confirm.
metrics:
  fad:
    use_gt: false
    model: tf
    tf:
      bin: null
      model_path: //reference/fad/vggish_model.ckpt
  kld:
    use_gt: false
    model: passt
    passt:
      pretrained_length: 20
  text_consistency:
    use_gt: false
    model: clap
    clap:
      model_path: //reference/clap/music_audioset_epoch_15_esc_90.14.pt
      model_arch: 'HTSAT-base'
      enable_fusion: false
  chroma_cosine:
    use_gt: false
    model: chroma_base
    chroma_base:
      # Interpolates the root-level `sample_rate` of the composed config.
      sample_rate: ${sample_rate}
      n_chroma: 12
      radix2_exp: 14
      argmax: true
# Generation stage: schedule, worker count, output location, audio writing
# options, and language-model sampling options.
generate:
  every: 25
  num_workers: 5
  path: samples
  audio:
    format: wav
    strategy: loudness
    # Interpolates the root-level `sample_rate` of the composed config.
    sample_rate: ${sample_rate}
    loudness_headroom_db: 14
  lm:
    prompted_samples: true
    unprompted_samples: true
    gen_gt_samples: false
    # Both durations are unset by default.
    # NOTE(review): the fallback used when these are null is not visible
    # here - confirm against the solver.
    prompt_duration: null
    gen_duration: null
    remove_prompts: false
    # Sampling parameters.
    # NOTE(review): assumed to belong to `lm` rather than directly to
    # `generate` (nesting was lost in the extracted text) - confirm.
    use_sampling: false
    temp: 1.0
    top_k: 0
    top_p: 0.0
# Evaluation stage: schedule, worker count, and one on/off switch per metric.
# All switches are off by default; the names fad, kld, text_consistency and
# chroma_cosine match the entries of the top-level `metrics` mapping.
evaluate:
  every: 25
  num_workers: 5
  metrics:
    base: false
    fad: false
    kld: false
    text_consistency: false
    chroma_cosine: false
# Checkpoint saving and retention settings.
# NOTE(review): units (epochs vs. updates) for `save_every` / `keep_last` are
# not stated in this file - confirm.
checkpoint:
  save_last: true
  save_every: 50
  keep_last: 10
  keep_every_states: null
# Optimisation settings, with optimizer-specific values under `adam`.
# NOTE(review): `1e-4` and `1e-8` are kept as written (exponent form without a
# decimal point). OmegaConf's loader reads these as floats; a plain YAML 1.1
# parser may read them as strings - confirm if this file is ever loaded
# outside OmegaConf.
optim:
  epochs: 200
  updates_per_epoch: 2000
  lr: 1e-4
  optimizer: adamw
  max_norm: 1.0
  eager_sync: true
  adam:
    betas: [0.9, 0.95]
    weight_decay: 0.1
    eps: 1e-8
# Learning-rate schedule; no scheduler is selected by default.
schedule:
  lr_scheduler: null