stash
/

llava-v1.5-13b-task-lora-20240803_110435

Model card Files Files and versions Community

stash commited on Aug 3, 2024

Commit

ea3765e

·

verified ·

1 Parent(s): 84ad8c0

Update README.md

Files changed (1) hide show

README.md +35 -1

README.md CHANGED Viewed

@@ -7,7 +7,41 @@ library_name: peft
 <!-- Provide a quick summary of what the model is/does. -->
 ## Model Details

 <!-- Provide a quick summary of what the model is/does. -->
+echo "Starting LoRA fine-tuning..."
+deepspeed LLaVA/llava/train/train_mem.py \
+    --lora_enable True --lora_r 128 --lora_alpha 256 --mm_projector_lr 2e-5 \
+    --deepspeed ./LLaVA/scripts/zero3.json \
+    --model_name_or_path liuhaotian/llava-v1.5-7b \
+    --version v1 \
+    --data_path "${output_dir}/processed_dataset_correct_path.json" \
+    --image_folder "${image_dir}" \
+    --vision_tower openai/clip-vit-large-patch14-336 \
+    --mm_projector_type mlp2x_gelu \
+    --mm_vision_select_layer -2 \
+    --mm_use_im_start_end False \
+    --mm_use_im_patch_token False \
+    --image_aspect_ratio pad \
+    --group_by_modality_length True \
+    --bf16 True \
+    --output_dir "${output_dir}/checkpoints/${model_name}" \
+    --num_train_epochs 1 \
+    --per_device_train_batch_size 2 \
+    --per_device_eval_batch_size 2 \
+    --gradient_accumulation_steps 5 \
+    --evaluation_strategy "no" \
+    --save_strategy "steps" \
+    --save_steps 50000 \
+    --save_total_limit 1 \
+    --learning_rate 2e-6 \
+    --weight_decay 0. \
+    --warmup_ratio 0.03 \
+    --lr_scheduler_type "cosine" \
+    --logging_steps 1 \
+    --tf32 True \
+    --model_max_length 2048 \
+    --gradient_checkpointing True \
+    --dataloader_num_workers 1 \
+    --lazy_preprocess True
 ## Model Details