# Registry of dataset configurations, keyed by dataset name.
#
# Every entry is a dict with a 'data_type' field whose value is one of
# 'images', 'video', 'frames' or 'text'. Most entries also carry a
# 'train_data_path'; individual entries add further keys such as
# 'val_data_path', 'fps', 'task_types', 'conv_type', 'sample_method',
# 'select_datasets', 'default_tasks' or per-source directory roots.
#
# NOTE(review): how each key is interpreted is decided by the code that
# consumes this dict, which is not visible here -- e.g. 'fps' is presumably a
# frame sampling rate; confirm against the loader before relying on it.
# NOTE(review): all paths are absolute mount points and are kept verbatim.
data_configs = {
    'llava_pretrain': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/blip_laion_cc_sbu_558k/meta_data.json',
    },
    'llava_instruct': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/llava_instruct_150k/meta_data.json',
    },
    'lrv_instruct': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/lrv_instructions/meta_data.json',
    },
    'coco_caption': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/data-tns-algo-masp/baiyi.by/data/coco_caption/train.json',
    },
    'cc_sbu': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/baiyi-arnold-nas/data/masp/vlm_data/cc_sbu/meta_data.json',
    },
    'laion': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/data-tns-algo-masp/baiyi.by/data/laion/train.json',
    },
    # The only entry that also declares a validation split.
    'webvid': {
        'data_type': 'video',
        'train_data_path': '/mnt/bn/baiyi-arnold-nas/data/masp/vlm_data/webvid_10M_video/train.json',
        'val_data_path': '/mnt/bn/baiyi-arnold-nas/data/masp/vlm_data/webvid_10M_video/val.json',
    },
    'internvid': {
        'data_type': 'frames',
        'fps': 0.5,
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/InternVid/meta_data.json',
    },
    'video_chatgpt_instruct_single': {
        'data_type': 'video',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/VideoChatGPT_Instruct_100K_single/train.json',
    },
    'video_chatgpt_instruct_multi': {
        'data_type': 'video',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/VideoChatGPT_Instruct_100K_multi/train.json',
    },
    'video_chatgpt': {
        'data_type': 'frames',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/video_chatgpt_instruct/meta_data.json',
    },
    # No data path here; the entry only lists task names under 'default_tasks'.
    'm3it': {
        'data_type': 'images',
        'default_tasks': [
            'coco',
            'textcap',
            'image-paragraph-captioning',
            'coco-goi',
            'coco-itm',
            'vqa-v2',
            'shapes',
            'docvqa',
            'ocr-vqa',
            'st-vqa',
            'text-vqa',
            'gqa',
            'okvqa',
            'a-okvqa',
            'viquae',
            'clevr',
            'nlvr',
            'vcr',
            'visual-mrc',
            'visual-dialog',
            'multi30k',
        ],
    },
    'tt_vqa': {
        'data_type': 'frames',
        'fps': 2,
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/ADSO_Anno_Data/batch_20231128/meta_data_single_60k_caption_170k_QA.json',
    },
    'gpt4v_tt_vqa': {
        'data_type': 'frames',
        'fps': 0.5,
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/masp/20231222_120k_multi_filtered.json',
        'task_types': ['caption', 'qas'],
        'conv_type': 'single',
    },
    # Uses three directory roots instead of a single 'train_data_path'.
    'sharegpt4v': {
        'data_type': 'images',
        'coco_dir': '/mnt/bn/data-tns-algo-masp/data',
        'llava_dir': '/mnt/bn/data-tns-algo-masp/baiyi.by/data/blip_laion_cc_sbu_558k',
        'other_dir': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/sharegpt4v',
    },
    'gpt4v_public': {
        'data_type': 'frames',
        'fps': 1,
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/data/shared_gpt4v_data/data_130k.json',
        'task_types': ['summary', 'detail', 'qa_pairs'],
        'conv_type': 'single',
        'sample_method': 'uniform',
    },
    'gpt4v_internal': {
        'data_type': 'frames',
        'fps': 2,
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/masp/gpt4v_internal_28k.json',
        'task_types': ['summary', 'detail', 'qa_pairs'],
        'conv_type': 'single',
    },
    # NOTE(review): no data path configured; presumably resolved by the
    # consuming code -- confirm.
    'synthdog': {
        'data_type': 'images',
    },
    'ocr_vqa': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/OCR-VQA/training_meta.json',
    },
    # NOTE(review): no data path configured; presumably resolved by the
    # consuming code -- confirm.
    'sharegpt': {
        'data_type': 'text',
    },
    'text_caps': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/TextCaps/TextCaps_0.1_train.json',
    },
    'synthetic_ocr': {
        'data_type': 'frames',
        'fps': 0.5,
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/masp/synthetic_ocr/train_filtered.json',
    },
    'lk_image': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/liangkeg/data/xiangchen/finetune_all_detail_vidal200k_videollava_images_im.json',
    },
    'lk_video': {
        'data_type': 'frames',
        'fps': 1,
        'train_data_path': '/mnt/bn/liangkeg/data/xiangchen/finetune_all_detail_vidal200k_videollava_images_vid.json',
        'select_datasets': ['webvid10m', 'webvid2m', 'activitynet', 'vidal', 'hdvila'],
    },
    'promptv1_2_internal': {
        'data_type': 'frames',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/kaili.zhao/data/masp_data/train/gpt4v_annotation/202400401week_gpt4v_all_videos_unique_ids.json',
        'task_types': ['caption'],
    },
}