# Dataset configuration for TH1KH_512.
# One key per line: a plain scalar may not contain ": ", and " #" starts a
# comment that runs to the end of the line, so these entries must not share
# a physical line.

# Dataset name and data locations.
ds_name: TH1KH_512
raw_data_dir: /mnt/bn/sa-ag-data/yezhenhui/datasets/raw/TH1KH_512
binary_data_dir: data/binary/TH1KH_512
# Alternative binary_data_dir, currently disabled:
# binary_data_dir: /dev/shm/TH1KH

# Pre-processing sharding and chunk splitting.
process_id: 0  # rank id when pre-processing the dataset
total_process: 1  # number of ranks when pre-processing the dataset
split_seed: 999  # random seed used to split chunks during dataset pre-processing

# Per-batch limits.
max_sentences_per_batch: 1024
max_tokens_per_batch: 200000

# Data loading.
load_db_to_memory: false
num_workers: 4
use_kv_dataset: true

# Binarization switches.
# NOTE(review): presumably each flag selects whether that feature is produced
# during binarization -- confirm against the binarizer that reads this file.
binarization_args:
  with_hubert: false
  with_mel: false
  with_coeff: true