File size: 1,799 Bytes
9fb1a94 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 |
{
"feature_extraction": {
"sequence": [
{
"operation": {
"name": "audio_decoder",
"type": "AudioDecoderEx",
"attrs": {
"target_sample_rates": [
8000,
16000
]
}
}
},
{
"operation": {
"name": "phi_4_audio_embed",
"type": "Phi4AudioEmbed",
"attrs": {
"audio_compression_rate": 8,
"stft_normal/n_fft": 512,
"stft_normal/frame_length": 400,
"stft_normal/hop_length": 160,
"stft_normal/win_fn": "hamming",
"logmel/chunk_size": 30,
"logmel/hop_length": 160,
"logmel/n_fft": 512,
"logmel/n_mel": 80,
"logmel/feature_first": 0,
"logmel/no_padding": 1,
"stft_normal_8k/n_fft": 256,
"stft_normal_8k/frame_length": 200,
"stft_normal_8k/hop_length": 80,
"stft_normal_8k/win_fn": "hamming",
"logmel_8k/chunk_size": 30,
"logmel_8k/hop_length": 80,
"logmel_8k/n_fft": 512,
"logmel_8k/n_mel": 80,
"logmel_8k/feature_first": 0,
"logmel_8k/no_padding": 1
}
}
}
],
"output_aligner": "phi4-audio-aligner"
}
} |