#!/usr/bin/env bash
#
# Launch a full DPO training run of CKIP-Mistral-7B-Instruct with
# `accelerate launch` using the DeepSpeed ZeRO-3 accelerate config.
#
# Behavior:
#   1. Refuses to run (non-zero exit) if the output directory already exists,
#      so a previous run's results are never overwritten.
#   2. Creates the output directory and stores a copy of this script in it,
#      so the exact launch settings are kept next to the results.
#   3. Starts training and mirrors the trainer's stdout into a log file
#      inside the output directory.
#
# Exit status: non-zero if the output directory already exists, if any setup
# step fails, or if the training pipeline fails.

# Abort on command failure (-e) and on unset variables (-u); make a pipeline
# fail when any stage fails (pipefail), so a crashed training run is not
# hidden behind the successful exit status of `tee`.
set -euo pipefail

# Optional NCCL toggles, left disabled; uncomment to enable.
# export NCCL_P2P_DISABLE="1"
# export NCCL_IB_DISABLE="1"
export OMP_NUM_THREADS=1
export ACCELERATE_LOG_LEVEL=info
export WANDB_PROJECT='Mistral-DPO'
export WANDB_ENTITY="ckip"

# Alternative output location used for test runs:
# output_dir="DPO/DPO-test"
output_dir="DPO/dpo-full-0715"

# Stop if the output directory already exists, to avoid clobbering an earlier
# run. This is an error condition: report on stderr and exit non-zero so that
# calling scripts or schedulers do not treat the refusal as a success.
if [[ -d "${output_dir}" ]]; then
  echo "The directory already exists." >&2
  exit 1
fi
mkdir -p -- "${output_dir}"

# Keep a snapshot of this launch script alongside the run outputs.
current_script=$0
cp -- "${current_script}" "${output_dir}"

# NOTE: only stdout is piped into the log; stderr still goes to the terminal.
# NOTE(review): the log name "trainin.log" looks like a typo for
# "training.log"; it is kept unchanged in case other tooling expects it.
accelerate launch \
  --config_file alignment-handbook/recipes/accelerate_configs/deepspeed_zero3.yaml \
  --num_processes 4 \
  test_dpo.py \
  "dpo_config_full.yaml" \
  --load_in_4bit=false \
  --logging_steps=1 \
  --model_name_or_path="/share/home/models/ckiplab/CKIP-Mistral-7B-Instruct-v1/" \
  --train_file="data/training_ptt_dpo-include_id-converted.jsonl" \
  --validation_file="data/testing_ptt_dpo_include_id-converted.jsonl" \
  --cache_dir="cache_dir" \
  --output_dir="${output_dir}" \
  | tee "${output_dir}/trainin.log"

# Config path pattern noted by the original author:
# recipes/{model_name}/{task}/config_full.yaml