# Launch one run_tulu_eval.sh job per benchmark against the same checkpoint
# directory. Each launch must be its own command: the `BEAKER=1 WEKA=1`
# prefix only acts as a per-command environment assignment when it appears
# at the very start of a command. When several launches share one line
# without a separator, everything after the first script path is passed to
# that first invocation as extra positional arguments and only one job runs.
#
# Argument order appears to be <run_name> <checkpoint_mount>
# <eval_dataset_name>, judging by the positional assignments at the bottom
# of this section -- TODO confirm against run_tulu_eval.sh.
#
# NOTE(review): the assignments below look like the argument handling of
# the very script being invoked here. If these launch lines were meant as
# usage examples rather than live commands, they should be commented out
# instead -- confirm with the author.
BEAKER=1 WEKA=1 ./shell_scripts/run_tulu_eval.sh \
  eval_gsm8k_v3_check_v3_v3 \
  /weka/oe-adapt-default/hamishi/simplex-diffusion/tulu_v3_mistral_v3 \
  gsm8k

BEAKER=1 WEKA=1 ./shell_scripts/run_tulu_eval.sh \
  eval_bbh_v3_check_v3_v3 \
  /weka/oe-adapt-default/hamishi/simplex-diffusion/tulu_v3_mistral_v3 \
  bbh

BEAKER=1 WEKA=1 ./shell_scripts/run_tulu_eval.sh \
  eval_alpaca_eval_v3_check_v3_v3 \
  /weka/oe-adapt-default/hamishi/simplex-diffusion/tulu_v3_mistral_v3 \
  alpaca_eval

BEAKER=1 WEKA=1 ./shell_scripts/run_tulu_eval.sh \
  eval_ifeval_v3_check_v3_v3 \
  /weka/oe-adapt-default/hamishi/simplex-diffusion/tulu_v3_mistral_v3 \
  ifeval

BEAKER=1 WEKA=1 ./shell_scripts/run_tulu_eval.sh \
  eval_triviaqa_v3_check_v3_v3 \
  /weka/oe-adapt-default/hamishi/simplex-diffusion/tulu_v3_mistral_v3 \
  triviaqa

BEAKER=1 WEKA=1 ./shell_scripts/run_tulu_eval.sh \
  eval_squad_v3_check_v3_v3 \
  /weka/oe-adapt-default/hamishi/simplex-diffusion/tulu_v3_mistral_v3 \
  squad

# Capture this script's own first three positional parameters. Nothing in
# the visible portion of the file reads these variables; presumably they
# are consumed further down -- verify.
run_name=$1
checkpoint_mount=$2
eval_dataset_name=$3