# Example: ./sub.sh tmp_proj 0,1,2,3 3 --> Use 0,1,2,3 for training, release GPUs, use GPU:3 for inference. | |
module load gcc/11.2.0 cuda/11.8 cudnn/8.6.0_cu11x && cpu_core_num=6 | |
# module load compilers/cuda/11.8 compilers/gcc/12.2.0 cudnn/8.4.0.27_cuda11.x && cpu_core_num=32 | |
export PYTHONUNBUFFERED=1 | |
method=${1:-"BSL"} | |
devices=${2:-0} | |
gpu_num=$(($(echo ${devices%%,} | grep -o "," | wc -l)+1)) | |
sbatch --nodes=1 -p vip_gpu_ailab -A ai4bio \ | |
--gres=gpu:${gpu_num} --ntasks-per-node=1 --cpus-per-task=$((gpu_num*cpu_core_num)) \ | |
./train_test.sh ${method} ${devices} | |
hostname | |