# Registry of dataset configurations, keyed by dataset name.
#
# Every entry carries a 'data_type' (the values used in this table are
# 'images', 'video', 'frames' and 'text'). All other keys are optional and
# vary per dataset:
#   train_data_path / val_data_path    - annotation / metadata JSON files
#   fps                                - set only on some 'frames' datasets
#   task_types, conv_type,
#   sample_method, select_datasets,
#   default_tasks                      - dataset-specific options
#   coco_dir / llava_dir / other_dir   - directories used by 'sharegpt4v'
# NOTE(review): how each optional key is interpreted is decided by the
# dataset loaders, which are not part of this table - confirm there.
#
# Trailing size notes such as "# 500k" are carried over from the original
# file (presumably approximate sample counts - TODO confirm).
#
# Keep one key per line: a '#' comment runs to the end of its physical line,
# so a comment sharing a line with further entries silently removes them.
data_configs = {
    # ------------------------------------------------------------------
    # Image datasets
    # ------------------------------------------------------------------
    'llava_pretrain': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/blip_laion_cc_sbu_558k/meta_data.json'
    },
    'llava_instruct': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/llava_instruct_150k/meta_data.json'
    },
    'lrv_instruct': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/lrv_instructions/meta_data.json'
    },
    'coco_caption': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/data-tns-algo-masp/baiyi.by/data/coco_caption/train.json'
    },
    'cc_sbu': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/baiyi-arnold-nas/data/masp/vlm_data/cc_sbu/meta_data.json'
    },
    'laion': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/data-tns-algo-masp/baiyi.by/data/laion/train.json'
    },

    # ------------------------------------------------------------------
    # Video / frame datasets
    # ------------------------------------------------------------------
    'webvid': {
        'data_type': 'video',
        'train_data_path': '/mnt/bn/baiyi-arnold-nas/data/masp/vlm_data/webvid_10M_video/train.json',
        # The only entry in this table that also declares a validation split.
        'val_data_path': '/mnt/bn/baiyi-arnold-nas/data/masp/vlm_data/webvid_10M_video/val.json'
    },
    'internvid': {
        'data_type': 'frames',
        'fps': 0.5,
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/InternVid/meta_data.json'
    },
    'video_chatgpt_instruct_single': {
        'data_type': 'video',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/VideoChatGPT_Instruct_100K_single/train.json'
    },
    'video_chatgpt_instruct_multi': {
        'data_type': 'video',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/VideoChatGPT_Instruct_100K_multi/train.json'
    },
    'video_chatgpt': {
        # 'frames' entry without an 'fps' key.
        'data_type': 'frames',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/video_chatgpt_instruct/meta_data.json'
    },

    # ------------------------------------------------------------------
    # M3IT: no data path here, only the list of default task names.
    # ------------------------------------------------------------------
    'm3it': {
        'data_type': 'images',
        'default_tasks': [
            'coco',
            'textcap',
            'image-paragraph-captioning',
            'coco-goi',
            'coco-itm',
            'vqa-v2',
            'shapes',
            'docvqa',
            'ocr-vqa',
            'st-vqa',
            'text-vqa',
            'gqa',
            'okvqa',
            'a-okvqa',
            'viquae',
            'clevr',
            'nlvr',
            'vcr',
            'visual-mrc',
            'visual-dialog',
            'multi30k'
        ]
    },

    # ------------------------------------------------------------------
    # Internal / GPT-4V annotated datasets
    # ------------------------------------------------------------------
    'tt_vqa': {
        'data_type': 'frames',
        'fps': 2,
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/ADSO_Anno_Data/batch_20231128/meta_data_single_60k_caption_170k_QA.json'
        # Alternative metadata files (disabled):
        # 'train_data_path': '/mnt/bn/yukunfeng-nasdrive/xiangchen/dataset/masp/20240208_meta_data_single_135k_caption_160k_QA.json'
        # 'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/ADSO_Anno_Data/batch_20231128/meta_data_final_single_non_empty.json'
    },
    'gpt4v_tt_vqa': {
        'data_type': 'frames',
        'fps': 0.5,
        # Alternative metadata files (disabled):
        # 'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/GPT4V_Negs/20231127_81k_single.json'
        # 'train_data_path': '/mnt/bn/yukunfeng-nasdrive/xiangchen/dataset/masp/20231127_81k_25k_filtered_single_non_empty.json'
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/masp/20231222_120k_multi_filtered.json',
        'task_types': ['caption', 'qas'],
        'conv_type': 'single'
    },
    'sharegpt4v': {
        # Uses three directories instead of a single train_data_path.
        'data_type': 'images',
        'coco_dir': '/mnt/bn/data-tns-algo-masp/data',
        'llava_dir': '/mnt/bn/data-tns-algo-masp/baiyi.by/data/blip_laion_cc_sbu_558k',
        'other_dir': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/sharegpt4v',
    },
    'gpt4v_public': {
        'data_type': 'frames',
        'fps': 1,
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/data/shared_gpt4v_data/data_130k.json',
        # Alternative metadata file (disabled):
        # 'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/data/shared_gpt4v_data/data_500k_filtered.json',
        'task_types': ['summary', 'detail', 'qa_pairs'],
        'conv_type': 'single',
        'sample_method': 'uniform'
    },
    'gpt4v_internal': {
        'data_type': 'frames',
        'fps': 2,
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/masp/gpt4v_internal_28k.json',
        'task_types': ['summary', 'detail', 'qa_pairs'],
        'conv_type': 'single'
    },

    # ------------------------------------------------------------------
    # OCR / text datasets
    # ------------------------------------------------------------------
    'synthdog': {  # 500k
        # No train_data_path is configured for this entry.
        'data_type': 'images',
    },
    'ocr_vqa': {  # 200k
        'data_type': 'images',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/OCR-VQA/training_meta.json'
    },
    'sharegpt': {  # 50k
        # Text-only entry; no train_data_path is configured here.
        'data_type': 'text'
    },
    'text_caps': {  # 100k
        'data_type': 'images',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/TextCaps/TextCaps_0.1_train.json'
    },
    'synthetic_ocr': {  # 50k
        'data_type': 'frames',
        'fps': 0.5,  # total 10 frames for each video
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/masp/synthetic_ocr/train_filtered.json'
    },

    # ------------------------------------------------------------------
    # "lk" image / video mixtures
    # ------------------------------------------------------------------
    'lk_image': {  # 600k
        'data_type': 'images',
        'train_data_path': '/mnt/bn/liangkeg/data/xiangchen/finetune_all_detail_vidal200k_videollava_images_im.json'
    },
    'lk_video': {  # 850k
        'data_type': 'frames',
        'fps': 1,
        'train_data_path': '/mnt/bn/liangkeg/data/xiangchen/finetune_all_detail_vidal200k_videollava_images_vid.json',
        'select_datasets': ['webvid10m', 'webvid2m', 'activitynet', 'vidal', 'hdvila'],
    },
    'promptv1_2_internal': {  # 210k
        # 'frames' entry without an 'fps' key.
        'data_type': 'frames',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/kaili.zhao/data/masp_data/train/gpt4v_annotation/202400401week_gpt4v_all_videos_unique_ids.json',
        'task_types': ['caption']
    }
}