# Hugging Face file-view residue (page metadata, not configuration):
# ameerazam08's picture
# Upload folder using huggingface_hub
# e34aada verified
# raw
# history blame
# 553 Bytes
# Dataset configuration for TH1KH_512.

# Dataset name and storage locations.
ds_name: TH1KH_512
# NOTE(review): absolute, machine-specific path — confirm it exists in the
# target environment before running pre-processing.
raw_data_dir: /mnt/bn/sa-ag-data/yezhenhui/datasets/raw/TH1KH_512
binary_data_dir: data/binary/TH1KH_512
# binary_data_dir: /dev/shm/TH1KH

# Pre-processing sharding.
process_id: 0  # rank id when pre-processing the dataset
total_process: 1  # number of ranks when pre-processing the dataset
split_seed: 999  # random seed used to split chunks during pre-processing

# Batching and data-loading settings.
max_sentences_per_batch: 1024
max_tokens_per_batch: 200000
load_db_to_memory: false
num_workers: 4
use_kv_dataset: true

# Binarization options.
# NOTE(review): the with_* flags are nested here on the assumption that the
# flat layout (an empty `binarization_args:` followed by top-level with_* keys)
# came from lost indentation — confirm against the code that reads this file.
binarization_args:
  with_hubert: false
  with_mel: false
  with_coeff: true