|
#!/usr/bin/env bash |
|
|
|
|
|
|
|
|
|
export GPUS_PER_NODE=8 |
|
|
|
export NUM_NODES=$SLURM_NNODES |
|
|
|
master_addr=$(scontrol show hostnames "$SLURM_JOB_NODELIST" | head -n 1) |
|
export MASTER_ADDR=$master_addr |
|
|
|
|
|
export MASTER_PORT=12350 |
|
|
|
export RANK=$SLURM_NODEID |
|
|
|
echo "MASTER_ADDR: $MASTER_ADDR" |
|
echo "RANK :$RANK" |
|
echo "NUM_NODES :$NUM_NODES" |
|
echo "GPUS_PER_NODE :$GPUS_PER_NODE" |
|
|
|
export MIOPEN_USER_DB_PATH=/lus/home/NAT/gda2204/mshukor/.config/miopen_${MASTER_ADDR}_${SLURM_PROCID}/ |
|
|
|
echo "MIOPEN_USER_DB_PATH :$MIOPEN_USER_DB_PATH" |
|
|
|
num_workers=0 |
|
|
|
|
|
|
|
|
|
|
|
|
|
ofa_dir=/lus/home/NAT/gda2204/mshukor/code/unival |
|
base_data_dir=/lus/scratch/NAT/gda2204/SHARED/data |
|
base_log_dir=/work/NAT/gda2204/mshukor/logs |
|
|
|
|
|
|
|
|
|
bpe_dir=${ofa_dir}/utils/BPE |
|
user_dir=${ofa_dir}/ofa_module |
|
|
|
|
|
|
|
|
|
selected_cols=0,4,2,3 |
|
|
|
|
|
image_encoder_name=resnet |
|
|
|
|
|
|
|
|
|
exp_name=eval_refcocoplus_base_best_refcocoplus_ratacapsnlivqagroundofapt |
|
path=${base_log_dir}/ofa/pretrained_models/average_models/refcocoplus_ratacapsnlivqagroundofapt.pt |
|
|
|
echo ${path} |
|
result_path=${base_log_dir}/ofa/results/refcocoplus/${exp_name} |
|
mkdir ${result_path} |
|
|
|
|
|
|
|
|
|
data=${base_data_dir}/ofa/refcocoplus_data/refcocoplus_val.tsv |
|
split='refcocoplus_val' |
|
|
|
python3 -m torch.distributed.launch \ |
|
--nnodes=${NUM_NODES} \ |
|
--nproc_per_node=${GPUS_PER_NODE} \ |
|
--master_port=${MASTER_PORT} \ |
|
--node_rank=${RANK} \ |
|
--master_addr=${MASTER_ADDR} \ |
|
--use_env ${ofa_dir}/evaluate.py \ |
|
${data} \ |
|
--path=${path} \ |
|
--user-dir=${user_dir} \ |
|
--task=refcoco \ |
|
--batch-size=16 \ |
|
--log-format=simple --log-interval=10 \ |
|
--seed=7 \ |
|
--gen-subset=${split} \ |
|
--results-path=${result_path} \ |
|
--beam=5 \ |
|
--min-len=4 \ |
|
--max-len-a=0 \ |
|
--max-len-b=4 \ |
|
--no-repeat-ngram-size=3 \ |
|
--fp16 \ |
|
--num-workers=0 \ |
|
--model-overrides="{\"data\":\"${data}\",\"bpe_dir\":\"${bpe_dir}\",\"selected_cols\":\"${selected_cols}\"}" |
|
|
|
data=${base_data_dir}/ofa/refcocoplus_data/refcocoplus_testA.tsv |
|
split='refcocoplus_testA' |
|
python3 -m torch.distributed.launch \ |
|
--nnodes=${NUM_NODES} \ |
|
--nproc_per_node=${GPUS_PER_NODE} \ |
|
--master_port=${MASTER_PORT} \ |
|
--node_rank=${RANK} \ |
|
--master_addr=${MASTER_ADDR} \ |
|
--use_env ${ofa_dir}/evaluate.py \ |
|
${data} \ |
|
--path=${path} \ |
|
--user-dir=${user_dir} \ |
|
--task=refcoco \ |
|
--batch-size=16 \ |
|
--log-format=simple --log-interval=10 \ |
|
--seed=7 \ |
|
--gen-subset=${split} \ |
|
--results-path=${result_path} \ |
|
--beam=5 \ |
|
--min-len=4 \ |
|
--max-len-a=0 \ |
|
--max-len-b=4 \ |
|
--no-repeat-ngram-size=3 \ |
|
--fp16 \ |
|
--num-workers=0 \ |
|
--model-overrides="{\"data\":\"${data}\",\"bpe_dir\":\"${bpe_dir}\",\"selected_cols\":\"${selected_cols}\"}" |
|
|
|
|
|
data=${base_data_dir}/ofa/refcocoplus_data/refcocoplus_testB.tsv |
|
split='refcocoplus_testB' |
|
|
|
python3 -m torch.distributed.launch \ |
|
--nnodes=${NUM_NODES} \ |
|
--nproc_per_node=${GPUS_PER_NODE} \ |
|
--master_port=${MASTER_PORT} \ |
|
--node_rank=${RANK} \ |
|
--master_addr=${MASTER_ADDR} \ |
|
--use_env ${ofa_dir}/evaluate.py \ |
|
${data} \ |
|
--path=${path} \ |
|
--user-dir=${user_dir} \ |
|
--task=refcoco \ |
|
--batch-size=16 \ |
|
--log-format=simple --log-interval=10 \ |
|
--seed=7 \ |
|
--gen-subset=${split} \ |
|
--results-path=${result_path} \ |
|
--beam=5 \ |
|
--min-len=4 \ |
|
--max-len-a=0 \ |
|
--max-len-b=4 \ |
|
--no-repeat-ngram-size=3 \ |
|
--fp16 \ |
|
--num-workers=0 \ |
|
--model-overrides="{\"data\":\"${data}\",\"bpe_dir\":\"${bpe_dir}\",\"selected_cols\":\"${selected_cols}\"}" |
|
|