multitensor committed on
Commit
681e79d
·
verified ·
1 Parent(s): ce7766c

Upload folder using huggingface_hub

Browse files
Files changed (1) hide show
  1. pretrain_all.sh +42 -0
pretrain_all.sh ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
# pretrain_all.sh as shown in a rendered diff: the bare numbers are the diff
# viewer's line numbers and the leading "+" marks an added line; neither is
# part of the script. Strip both to recover the runnable file.
#
# The script is a single backslash-continued command that runs
# `deepspeed llava/train/train_mem.py` with CUDA_VISIBLE_DEVICES=0,1:
#   - DeepSpeed config:  ./scripts/zero2.json
#   - base model:        ./Meta-Llama-3.1-8B-Instruct (--version plain)
#   - training data:     train_json/video_image_asr_caption_pre.json
#   - modalities (--X):  Audio_asr, Audio_caption, Video, Image; each has its
#                        own *_tower and data-folder argument below
#   - projector:         --mm_projector_type mlp2x_gelu, --tune_mm_mlp_adapter True
#   - precision:         --bf16 True, --tf32 True
#   - schedule:          1 epoch, learning rate 1e-3, cosine scheduler,
#                        warmup ratio 0.03, weight decay 0
#   - batching:          per-device train batch size 1 with 32
#                        gradient-accumulation steps
#   - checkpoints:       --save_strategy steps, --save_steps 2000,
#                        --save_total_limit 20, written to --output_dir
#   - logging:           every step, reported to tensorboard
#
# NOTE(review): --output_dir is named "Video-LLaVA-Pretrain-7B" while the base
#   model path is Meta-Llama-3.1-8B-Instruct — confirm the name is intentional.
# NOTE(review): --tokenizer_model_max_length (3072) is larger than
#   --model_max_length (2048) — confirm this is intended by train_mem.py.
# NOTE(review): --audio_asr_folder, --audio_caption_folder and --image_folder
#   are absolute paths under /home/yu and /media/yu; they are machine-specific
#   and must be adjusted before running elsewhere.
1
+ CUDA_VISIBLE_DEVICES=0,1 deepspeed llava/train/train_mem.py \
2
+ --deepspeed ./scripts/zero2.json \
3
+ --model_name_or_path ./Meta-Llama-3.1-8B-Instruct \
4
+ --version plain \
5
+ --data_path train_json/video_image_asr_caption_pre.json \
6
+ --audio_asr_folder /home/yu/Downloads \
7
+ --audio_caption_folder /media/yu/33da5c9f-d06a-4b18-acc4-b4e1c20292471/0818 \
8
+ --video_folder video_data \
9
+ --image_folder /media/yu/33da5c9f-d06a-4b18-acc4-b4e1c20292471 \
10
+ --X "Audio_asr" "Audio_caption" "Video" "Image" \
11
+ --audio_tower ./LanguageBind_Audio_Asr \
12
+ --audio_caption_tower LanguageBind/LanguageBind_Audio \
13
+ --video_tower LanguageBind/LanguageBind_Video_merge \
14
+ --image_tower LanguageBind/LanguageBind_Image \
15
+ --mm_projector_type mlp2x_gelu \
16
+ --tune_mm_mlp_adapter True \
17
+ --mm_vision_select_layer -2 \
18
+ --mm_use_x_start_end False \
19
+ --mm_use_x_patch_token False \
20
+ --bf16 True \
21
+ --output_dir ./checkpoints/Video-LLaVA-Pretrain-7B \
22
+ --num_train_epochs 1 \
23
+ --per_device_train_batch_size 1 \
24
+ --per_device_eval_batch_size 16 \
25
+ --gradient_accumulation_steps 32 \
26
+ --evaluation_strategy "no" \
27
+ --save_strategy "steps" \
28
+ --save_steps 2000 \
29
+ --save_total_limit 20 \
30
+ --learning_rate 1e-3 \
31
+ --weight_decay 0. \
32
+ --warmup_ratio 0.03 \
33
+ --lr_scheduler_type "cosine" \
34
+ --logging_steps 1 \
35
+ --tf32 True \
36
+ --model_max_length 2048 \
37
+ --tokenizer_model_max_length 3072 \
38
+ --gradient_checkpointing True \
39
+ --dataloader_num_workers 8 \
40
+ --lazy_preprocess True \
41
+ --report_to tensorboard \
42
+ --cache_dir "./cache_dir"