File size: 1,251 Bytes
9742bb8 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 |
#!/bin/bash
# Launch a fairseq mr_hubert run via fairseq_cli/hydra_train.py.
#
# Edit the settings below before running. The training command is started in
# the background (trailing '&'), so this script returns without waiting for it.

FAIRSEQ= # Setup your fairseq directory
if [[ -z "${FAIRSEQ}" ]]; then
  # Warn rather than abort so the launch behaviour itself is unchanged; with
  # an empty value the paths below resolve relative to the filesystem root.
  printf 'warning: FAIRSEQ is empty; set it to your fairseq directory\n' >&2
fi

config_dir="${FAIRSEQ}/examples/mr_hubert/config"
config_name=mr_hubert_base_librispeech

# Override configs if needed
max_tokens=3200000
max_sample_size=1000000
max_update=50000

# Prepared Data Directory
data_dir=librispeech
# -- data_dir
#    -- train.tsv
#    -- train.ltr
#    -- valid.tsv
#    -- valid.ltr
#    -- dict.ltr.txt

exp_dir=exp      # Target experiments directory
ratios="[1, 2]"  # Default label rate ratios
hubert_path=/path/of/your/hubert.pt

# Extra overrides, kept as an array so each one stays a single argument.
_opts=()

# If using Slurm, uncomment this line and adjust the job-submission settings
# (e.g. the partition) to match your cluster.
# _opts+=(hydra/launcher=submitit_slurm "+hydra.launcher.partition=${your_slurm_partition}" +run=submitit_reg)

# If you want to set an additional experiment tag, uncomment this line.
# _opts+=("hydra.sweep.subdir=${your_experiment_tag}")

# Each override is one quoted array element. In particular the label-rate
# ratios must be expanded by the shell (double quotes, not single quotes) and
# passed as a single word even though the value contains a space.
train_args=(
  -m
  --config-dir "${config_dir}"
  --config-name "${config_name}"
  "${_opts[@]}"
  "task.data=${data_dir}"
  "+task.max_sample_size=${max_sample_size}"
  "task.label_dir=${data_dir}"
  "task.label_rate_ratios=${ratios}"
  "dataset.max_tokens=${max_tokens}"
  "optimization.max_update=${max_update}"
  "model.multires_hubert_path=${hubert_path}"
  "hydra.sweep.dir=${exp_dir}"
)

python "${FAIRSEQ}/fairseq_cli/hydra_train.py" "${train_args[@]}" &
|