Spaces:
Running
Running
{ | |
"base_config": "egs/vocoder/gan/exp_config_base.json", | |
"preprocess": { | |
// acoustic features | |
"extract_mel": true, | |
"extract_audio": true, | |
"extract_amplitude_phase": true, | |
// Features used for model training | |
"use_mel": true, | |
"use_audio": true, | |
"use_amplitude_phase": true | |
}, | |
"model": { | |
"generator": "apnet", | |
"apnet": { | |
"ASP_channel": 512, | |
"ASP_resblock_kernel_sizes": [3,7,11], | |
"ASP_resblock_dilation_sizes": [[1,3,5], [1,3,5], [1,3,5]], | |
"ASP_input_conv_kernel_size": 7, | |
"ASP_output_conv_kernel_size": 7, | |
"PSP_channel": 512, | |
"PSP_resblock_kernel_sizes": [3,7,11], | |
"PSP_resblock_dilation_sizes": [[1,3,5], [1,3,5], [1,3,5]], | |
"PSP_input_conv_kernel_size": 7, | |
"PSP_output_R_conv_kernel_size": 7, | |
"PSP_output_I_conv_kernel_size": 7, | |
} | |
}, | |
"train": { | |
"criterions": [ | |
"feature", | |
"discriminator", | |
"generator", | |
"mel", | |
"phase", | |
"amplitude", | |
"consistency" | |
] | |
}, | |
"inference": { | |
"batch_size": 1, | |
} | |
} | |