File size: 356 Bytes
16717ee |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 |
{
"backbone_class": "decoder.models.VocosBackbone",
"head_class": "decoder.heads.ISTFTHead",
"backbone_config": {
"input_channels": 512,
"dim": 768,
"intermediate_dim": 2304,
"num_layers": 12,
"adanorm_num_embeddings": 4
},
"head_config": {
"dim": 768,
"n_fft": 1280,
"hop_length": 320,
"padding": "same"
}
}