#!/usr/bin/env bash
#
# Launches training/prepare_dataset.py under torchrun to build a preprocessed
# video dataset from the configuration values below.
#
# Usage: edit the configuration values, then run this script from the directory
# that contains training/ (the script path passed to torchrun is relative).
#
# Exit status: non-zero if the torchrun command fails.

# Abort on the first failing command, on use of an unset variable, and on a
# failure in any pipeline stage, so a failed run is never reported as finished.
set -euo pipefail

MODEL_ID="THUDM/CogVideoX-2b"

# Passed to torchrun as --nproc_per_node.
NUM_GPUS=8

# For more details on the expected data format, please refer to the README.
DATA_ROOT="/path/to/my/datasets/video-dataset"  # This needs to be the path to the base directory where your videos are located.
CAPTION_COLUMN="prompt.txt"
VIDEO_COLUMN="videos.txt"

OUTPUT_DIR="/path/to/my/datasets/preprocessed-dataset"

# The bucket options accept several values. They are stored as arrays so each
# value is passed as its own argument without relying on word splitting.
HEIGHT_BUCKETS=(480 720)
WIDTH_BUCKETS=(720 960)
FRAME_BUCKETS=(49)

MAX_NUM_FRAMES="49"
MAX_SEQUENCE_LENGTH=226
TARGET_FPS=8
BATCH_SIZE=1
DTYPE=fp32

# To create a folder-style dataset structure without pre-encoding videos and captions
# For Image-to-Video finetuning, make sure to pass `--save_image_latents`
#
# The command is kept as an array (one element per argument) and executed
# directly instead of through `eval`, so values containing spaces or shell
# metacharacters reach the Python script unchanged.
CMD_WITHOUT_PRE_ENCODING=(
  torchrun --nproc_per_node="$NUM_GPUS"
  training/prepare_dataset.py
  --model_id "$MODEL_ID"
  --data_root "$DATA_ROOT"
  --caption_column "$CAPTION_COLUMN"
  --video_column "$VIDEO_COLUMN"
  --output_dir "$OUTPUT_DIR"
  --height_buckets "${HEIGHT_BUCKETS[@]}"
  --width_buckets "${WIDTH_BUCKETS[@]}"
  --frame_buckets "${FRAME_BUCKETS[@]}"
  --max_num_frames "$MAX_NUM_FRAMES"
  --max_sequence_length "$MAX_SEQUENCE_LENGTH"
  --target_fps "$TARGET_FPS"
  --batch_size "$BATCH_SIZE"
  --dtype "$DTYPE"
)

# Same command with --save_latents_and_embeddings appended.
CMD_WITH_PRE_ENCODING=("${CMD_WITHOUT_PRE_ENCODING[@]}" --save_latents_and_embeddings)

# Select which you'd like to run
CMD=("${CMD_WITH_PRE_ENCODING[@]}")

# "${CMD[*]}" joins the arguments with spaces for display only; the command
# itself is run from the array on the next line.
printf '===== Running `%s` =====\n' "${CMD[*]}"
"${CMD[@]}"
printf '===== Finished running script =====\n'