# Dataset mix: each key under `datasets` names one dataset entry and holds
# that entry's settings.
# NOTE(review): `sample_ratio` presumably weights how often an entry is
# sampled relative to the others — confirm against the data loader.
datasets:

  llava_pretrain:
    data_type: image
    sample_ratio: 1

  # Disabled entry, kept for reference; uncomment all three lines to enable.
  # internvid:
  #   data_type: frames
  #   sample_ratio: 10

  gpt4v_public:
    data_type: frames
    sample_ratio: 1
    task_types: ['summary']
    # NOTE(review): presumably the frame-sampling rate in frames per second
    # for `frames` data — confirm against the consumer.
    fps: 1.0
    conv_type: single
    # NOTE(review): absolute, environment-specific path; presumably must be
    # reachable from the training host — verify before running elsewhere.
    train_data_path: /mnt/bn/algo-masp-nas-2/xiangchen/data/shared_gpt4v_data/data_500k_filtered.json