model1 / llava /datasets /data_cfgs.py
multitensor's picture
Upload folder using huggingface_hub
bbfa6f6 verified
# Registry of dataset configurations, keyed by dataset name.
#
# Every entry carries a "data_type" (the values used in this file are
# "images", "video", "frames" and "text").  Depending on the dataset an entry
# may also provide:
#   - "train_data_path" / "val_data_path": annotation / metadata JSON files
#   - "fps": a frame-rate value for frame-based datasets
#   - "task_types", "conv_type", "sample_method", "select_datasets",
#     "default_tasks", "*_dir": dataset-specific options
# NOTE(review): how each option is interpreted is decided by the dataset
# classes that read this table; they are not visible from this file.
#
# Insertion order of the entries is preserved from the original definition.
data_configs = {
    # ------------------------------------------------------------------
    # Image / caption datasets
    # ------------------------------------------------------------------
    "llava_pretrain": {
        "data_type": "images",
        "train_data_path": "/mnt/bn/algo-masp-nas-2/baiyi.by/data/blip_laion_cc_sbu_558k/meta_data.json",
    },
    "llava_instruct": {
        "data_type": "images",
        "train_data_path": "/mnt/bn/algo-masp-nas-2/baiyi.by/data/llava_instruct_150k/meta_data.json",
    },
    "lrv_instruct": {
        "data_type": "images",
        "train_data_path": "/mnt/bn/algo-masp-nas-2/baiyi.by/data/lrv_instructions/meta_data.json",
    },
    "coco_caption": {
        "data_type": "images",
        "train_data_path": "/mnt/bn/data-tns-algo-masp/baiyi.by/data/coco_caption/train.json",
    },
    "cc_sbu": {
        "data_type": "images",
        "train_data_path": "/mnt/bn/baiyi-arnold-nas/data/masp/vlm_data/cc_sbu/meta_data.json",
    },
    "laion": {
        "data_type": "images",
        "train_data_path": "/mnt/bn/data-tns-algo-masp/baiyi.by/data/laion/train.json",
    },

    # ------------------------------------------------------------------
    # Video / frame datasets
    # ------------------------------------------------------------------
    "webvid": {
        "data_type": "video",
        "train_data_path": "/mnt/bn/baiyi-arnold-nas/data/masp/vlm_data/webvid_10M_video/train.json",
        "val_data_path": "/mnt/bn/baiyi-arnold-nas/data/masp/vlm_data/webvid_10M_video/val.json",
    },
    "internvid": {
        "data_type": "frames",
        "fps": 0.5,
        "train_data_path": "/mnt/bn/algo-masp-nas-2/baiyi.by/data/InternVid/meta_data.json",
    },
    "video_chatgpt_instruct_single": {
        "data_type": "video",
        "train_data_path": "/mnt/bn/algo-masp-nas-2/baiyi.by/data/VideoChatGPT_Instruct_100K_single/train.json",
    },
    "video_chatgpt_instruct_multi": {
        "data_type": "video",
        "train_data_path": "/mnt/bn/algo-masp-nas-2/baiyi.by/data/VideoChatGPT_Instruct_100K_multi/train.json",
    },
    "video_chatgpt": {
        "data_type": "frames",
        "train_data_path": "/mnt/bn/algo-masp-nas-2/baiyi.by/data/video_chatgpt_instruct/meta_data.json",
    },

    # ------------------------------------------------------------------
    # M3IT: no data path here, only the list of default task names
    # ------------------------------------------------------------------
    "m3it": {
        "data_type": "images",
        "default_tasks": [
            "coco",
            "textcap",
            "image-paragraph-captioning",
            "coco-goi",
            "coco-itm",
            "vqa-v2",
            "shapes",
            "docvqa",
            "ocr-vqa",
            "st-vqa",
            "text-vqa",
            "gqa",
            "okvqa",
            "a-okvqa",
            "viquae",
            "clevr",
            "nlvr",
            "vcr",
            "visual-mrc",
            "visual-dialog",
            "multi30k",
        ],
    },

    # ------------------------------------------------------------------
    # Internal / GPT-4V annotated datasets
    # ------------------------------------------------------------------
    "tt_vqa": {
        "data_type": "frames",
        "fps": 2,
        "train_data_path": "/mnt/bn/algo-masp-nas-2/baiyi.by/data/ADSO_Anno_Data/batch_20231128/meta_data_single_60k_caption_170k_QA.json",
        # Disabled alternatives kept for reference:
        # 'train_data_path': '/mnt/bn/yukunfeng-nasdrive/xiangchen/dataset/masp/20240208_meta_data_single_135k_caption_160k_QA.json'
        # 'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/ADSO_Anno_Data/batch_20231128/meta_data_final_single_non_empty.json'
    },
    "gpt4v_tt_vqa": {
        "data_type": "frames",
        "fps": 0.5,
        # Disabled alternatives kept for reference:
        # 'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/GPT4V_Negs/20231127_81k_single.json'
        # 'train_data_path': '/mnt/bn/yukunfeng-nasdrive/xiangchen/dataset/masp/20231127_81k_25k_filtered_single_non_empty.json'
        "train_data_path": "/mnt/bn/algo-masp-nas-2/xiangchen/dataset/masp/20231222_120k_multi_filtered.json",
        "task_types": ["caption", "qas"],
        "conv_type": "single",
    },
    "sharegpt4v": {
        # Uses three source directories instead of a single train_data_path.
        "data_type": "images",
        "coco_dir": "/mnt/bn/data-tns-algo-masp/data",
        "llava_dir": "/mnt/bn/data-tns-algo-masp/baiyi.by/data/blip_laion_cc_sbu_558k",
        "other_dir": "/mnt/bn/algo-masp-nas-2/xiangchen/dataset/sharegpt4v",
    },
    "gpt4v_public": {
        "data_type": "frames",
        "fps": 1,
        "train_data_path": "/mnt/bn/algo-masp-nas-2/xiangchen/data/shared_gpt4v_data/data_130k.json",
        # Disabled alternative kept for reference:
        # 'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/data/shared_gpt4v_data/data_500k_filtered.json',
        "task_types": ["summary", "detail", "qa_pairs"],
        "conv_type": "single",
        "sample_method": "uniform",
    },
    "gpt4v_internal": {
        "data_type": "frames",
        "fps": 2,
        "train_data_path": "/mnt/bn/algo-masp-nas-2/xiangchen/dataset/masp/gpt4v_internal_28k.json",
        "task_types": ["summary", "detail", "qa_pairs"],
        "conv_type": "single",
    },

    # ------------------------------------------------------------------
    # OCR / text datasets (size notes carried over from the original)
    # ------------------------------------------------------------------
    "synthdog": {  # 500k
        "data_type": "images",
    },
    "ocr_vqa": {  # 200k
        "data_type": "images",
        "train_data_path": "/mnt/bn/algo-masp-nas-2/xiangchen/dataset/OCR-VQA/training_meta.json",
    },
    "sharegpt": {  # 50k
        "data_type": "text",
    },
    "text_caps": {  # 100k
        "data_type": "images",
        "train_data_path": "/mnt/bn/algo-masp-nas-2/xiangchen/dataset/TextCaps/TextCaps_0.1_train.json",
    },
    "synthetic_ocr": {  # 50k
        "data_type": "frames",
        "fps": 0.5,  # total 10 frames for each video
        "train_data_path": "/mnt/bn/algo-masp-nas-2/xiangchen/dataset/masp/synthetic_ocr/train_filtered.json",
    },

    # ------------------------------------------------------------------
    # "lk_*" mixtures and prompt-v1.2 internal captions
    # ------------------------------------------------------------------
    "lk_image": {  # 600k
        "data_type": "images",
        "train_data_path": "/mnt/bn/liangkeg/data/xiangchen/finetune_all_detail_vidal200k_videollava_images_im.json",
    },
    "lk_video": {  # 850k
        "data_type": "frames",
        "fps": 1,
        "train_data_path": "/mnt/bn/liangkeg/data/xiangchen/finetune_all_detail_vidal200k_videollava_images_vid.json",
        "select_datasets": ["webvid10m", "webvid2m", "activitynet", "vidal", "hdvila"],
    },
    "promptv1_2_internal": {  # 210k
        "data_type": "frames",
        "train_data_path": "/mnt/bn/algo-masp-nas-2/kaili.zhao/data/masp_data/train/gpt4v_annotation/202400401week_gpt4v_all_videos_unique_ids.json",
        "task_types": ["caption"],
    },
}