#!/bin/bash
#
# Configuration for a LoRA fine-tuning run of the hunyuan_video model.
#
# This section only defines plain variables and space-separated argument
# strings (model_cmd, dataset_cmd, dataloader_cmd, training_cmd,
# optimizer_cmd). The code that consumes them is not visible in this part of
# the file; presumably they are expanded unquoted into a launch command
# further down -- TODO confirm.
#
# Inside double quotes a backslash-newline pair is removed by the shell, so
# every *_cmd value below ends up as a single line of flags separated by
# whitespace.

GPU_IDS="0,1"

# NOTE(review): ROOT_DIR is not assigned anywhere in the visible part of this
# script; presumably it is exported by the caller. If it is unset, DATA_ROOT
# silently becomes "/video-dataset-disney" -- confirm this is intended.
DATA_ROOT="$ROOT_DIR/video-dataset-disney"
CAPTION_COLUMN="prompt.txt"
VIDEO_COLUMN="videos.txt"
OUTPUT_DIR="hunyuan-video"
ID_TOKEN="BW_STYLE"

# Model arguments
model_cmd="--model_name hunyuan_video \
  --pretrained_model_name_or_path hunyuanvideo-community/HunyuanVideo"

# Dataset arguments
dataset_cmd="--data_root $DATA_ROOT \
  --video_column $VIDEO_COLUMN \
  --caption_column $CAPTION_COLUMN \
  --id_token $ID_TOKEN \
  --video_resolution_buckets 24x512x768 \
  --caption_dropout_p 0.05"

# Dataloader arguments
dataloader_cmd="--dataloader_num_workers 0 --precompute_conditions"

# Training arguments
training_cmd="--training_type lora \
  --seed 42 \
  --batch_size 1 \
  --train_steps 10 \
  --rank 16 \
  --lora_alpha 16 \
  --target_modules to_q to_k to_v to_out.0 \
  --gradient_accumulation_steps 1 \
  --gradient_checkpointing \
  --checkpointing_steps 5 \
  --checkpointing_limit 2 \
  --enable_slicing \
  --enable_tiling"

# Optimizer arguments
optimizer_cmd="--optimizer adamw \
  --lr 3e-5 \
  --beta1 0.9 \
  --beta2 0.95 \
  --weight_decay 1e-4 \
  --epsilon 1e-8 \
  --max_grad_norm 1.0"

# Validation arguments
# NOTE(review): the statement below is cut off in the available source -- the
# here-document that supplied the validation prompts is missing. It is kept
# verbatim but commented out so the script remains syntactically valid;
# restore the full definition from the original file before relying on
# validation_prompts.
# validation_prompts=$(cat <