File size: 553 Bytes
e34aada
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
# Dataset / pre-processing configuration for the TH1KH_512 dataset.
# NOTE(review): the code that consumes these keys is not visible from this
# file; notes marked "presumably" are assumptions to confirm against it.

# Dataset name; also the final path component of both data directories below.
ds_name: TH1KH_512
# Absolute path to the raw dataset.
# NOTE(review): sits under a user-specific mount, so it likely has to be
# adjusted per machine — confirm.
raw_data_dir: /mnt/bn/sa-ag-data/yezhenhui/datasets/raw/TH1KH_512
# Relative path for the binarized dataset (presumably resolved against the
# working directory — confirm).
binary_data_dir: data/binary/TH1KH_512
# Disabled alternative location under /dev/shm; note that its directory name
# (TH1KH) differs from ds_name (TH1KH_512).
# binary_data_dir: /dev/shm/TH1KH
process_id: 0 # rank id when pre-processing the dataset
total_process: 1 # number of ranks when pre-processing the dataset
split_seed: 999 # random seed used to split chunks when pre-processing the dataset

# Batch limits (presumably upper bounds on sentences and tokens per batch —
# verify against the data loader).
max_sentences_per_batch: 1024
max_tokens_per_batch: 200000

# Presumably controls whether the dataset is loaded fully into RAM; disabled
# here — confirm.
load_db_to_memory: false

# Presumably the number of data-loading worker processes — confirm.
num_workers: 4
# Enabled here; the dataset backend this selects is not visible in this file.
use_kv_dataset: true

# Per-feature switches passed as binarization arguments: only `with_coeff` is
# enabled; `with_hubert` and `with_mel` are disabled.
# NOTE(review): presumably each flag decides whether that feature is produced
# during binarization — confirm.
binarization_args:
  with_hubert: false
  with_mel: false
  with_coeff: true