File size: 1,799 Bytes
9fb1a94
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
{
    "feature_extraction": {
        "sequence": [
            {
                "operation": {
                    "name": "audio_decoder",
                    "type": "AudioDecoderEx",
                    "attrs": {
                        "target_sample_rates": [
                            8000,
                            16000
                        ]
                    }
                }
            },
            {
                "operation": {
                    "name": "phi_4_audio_embed",
                    "type": "Phi4AudioEmbed",
                    "attrs": {
                        "audio_compression_rate": 8,
                        "stft_normal/n_fft": 512,
                        "stft_normal/frame_length": 400,
                        "stft_normal/hop_length": 160,
                        "stft_normal/win_fn": "hamming",
                        "logmel/chunk_size": 30,
                        "logmel/hop_length": 160,
                        "logmel/n_fft": 512,
                        "logmel/n_mel": 80,
                        "logmel/feature_first": 0,
                        "logmel/no_padding": 1,
                        "stft_normal_8k/n_fft": 256,
                        "stft_normal_8k/frame_length": 200,
                        "stft_normal_8k/hop_length": 80,
                        "stft_normal_8k/win_fn": "hamming",
                        "logmel_8k/chunk_size": 30,
                        "logmel_8k/hop_length": 80,
                        "logmel_8k/n_fft": 512,
                        "logmel_8k/n_mel": 80,
                        "logmel_8k/feature_first": 0,
                        "logmel_8k/no_padding": 1
                    }
                }
            }
        ],
        "output_aligner": "phi4-audio-aligner"
    }
}