# Registry of dataset configurations, keyed by dataset name.
#
# Every entry carries a 'data_type' (one of 'images', 'video', 'frames',
# 'text'). Depending on the dataset, an entry may additionally carry:
#   - 'train_data_path' / 'val_data_path': annotation/metadata JSON paths
#   - 'fps': numeric value attached to 'frames' datasets
#   - 'task_types', 'conv_type', 'sample_method': per-dataset options
#   - 'default_tasks', 'select_datasets': lists of sub-task / sub-dataset names
#   - 'coco_dir', 'llava_dir', 'other_dir': directories (sharegpt4v only)
# NOTE(review): how each optional key is interpreted is decided by the dataset
# loaders, which are not visible here -- confirm before relying on a key.
data_configs = {
    'llava_pretrain': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/blip_laion_cc_sbu_558k/meta_data.json',
    },
    'llava_instruct': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/llava_instruct_150k/meta_data.json',
    },
    'lrv_instruct': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/lrv_instructions/meta_data.json',
    },
    'coco_caption': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/data-tns-algo-masp/baiyi.by/data/coco_caption/train.json',
    },
    'cc_sbu': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/baiyi-arnold-nas/data/masp/vlm_data/cc_sbu/meta_data.json',
    },
    'laion': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/data-tns-algo-masp/baiyi.by/data/laion/train.json',
    },
    # The only entry that also declares a validation split.
    'webvid': {
        'data_type': 'video',
        'train_data_path': '/mnt/bn/baiyi-arnold-nas/data/masp/vlm_data/webvid_10M_video/train.json',
        'val_data_path': '/mnt/bn/baiyi-arnold-nas/data/masp/vlm_data/webvid_10M_video/val.json',
    },
    'internvid': {
        'data_type': 'frames',
        'fps': 0.5,
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/InternVid/meta_data.json',
    },
    'video_chatgpt_instruct_single': {
        'data_type': 'video',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/VideoChatGPT_Instruct_100K_single/train.json',
    },
    'video_chatgpt_instruct_multi': {
        'data_type': 'video',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/VideoChatGPT_Instruct_100K_multi/train.json',
    },
    # 'frames' entry without an 'fps' key.
    # NOTE(review): presumably the loader applies its own default -- confirm.
    'video_chatgpt': {
        'data_type': 'frames',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/video_chatgpt_instruct/meta_data.json',
    },
    # No 'train_data_path'; only a list of task names is configured.
    'm3it': {
        'data_type': 'images',
        'default_tasks': [
            'coco',
            'textcap',
            'image-paragraph-captioning',
            'coco-goi',
            'coco-itm',
            'vqa-v2',
            'shapes',
            'docvqa',
            'ocr-vqa',
            'st-vqa',
            'text-vqa',
            'gqa',
            'okvqa',
            'a-okvqa',
            'viquae',
            'clevr',
            'nlvr',
            'vcr',
            'visual-mrc',
            'visual-dialog',
            'multi30k',
        ],
    },
    'tt_vqa': {
        'data_type': 'frames',
        'fps': 2,
        'train_data_path': '/mnt/bn/algo-masp-nas-2/baiyi.by/data/ADSO_Anno_Data/batch_20231128/meta_data_single_60k_caption_170k_QA.json',
    },
    'gpt4v_tt_vqa': {
        'data_type': 'frames',
        'fps': 0.5,
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/masp/20231222_120k_multi_filtered.json',
        'task_types': ['caption', 'qas'],
        'conv_type': 'single',
    },
    # Configured through three directories instead of a 'train_data_path'.
    'sharegpt4v': {
        'data_type': 'images',
        'coco_dir': '/mnt/bn/data-tns-algo-masp/data',
        'llava_dir': '/mnt/bn/data-tns-algo-masp/baiyi.by/data/blip_laion_cc_sbu_558k',
        'other_dir': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/sharegpt4v',
    },
    'gpt4v_public': {
        'data_type': 'frames',
        'fps': 1,
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/data/shared_gpt4v_data/data_130k.json',
        'task_types': ['summary', 'detail', 'qa_pairs'],
        'conv_type': 'single',
        'sample_method': 'uniform',
    },
    'gpt4v_internal': {
        'data_type': 'frames',
        'fps': 2,
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/masp/gpt4v_internal_28k.json',
        'task_types': ['summary', 'detail', 'qa_pairs'],
        'conv_type': 'single',
    },
    # No path configured here.
    # NOTE(review): presumably the loader locates the data itself -- confirm.
    'synthdog': {
        'data_type': 'images',
    },
    'ocr_vqa': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/OCR-VQA/training_meta.json',
    },
    # The only 'text' entry; no path configured here.
    'sharegpt': {
        'data_type': 'text',
    },
    'text_caps': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/TextCaps/TextCaps_0.1_train.json',
    },
    'synthetic_ocr': {
        'data_type': 'frames',
        'fps': 0.5,
        'train_data_path': '/mnt/bn/algo-masp-nas-2/xiangchen/dataset/masp/synthetic_ocr/train_filtered.json',
    },
    'lk_image': {
        'data_type': 'images',
        'train_data_path': '/mnt/bn/liangkeg/data/xiangchen/finetune_all_detail_vidal200k_videollava_images_im.json',
    },
    'lk_video': {
        'data_type': 'frames',
        'fps': 1,
        'train_data_path': '/mnt/bn/liangkeg/data/xiangchen/finetune_all_detail_vidal200k_videollava_images_vid.json',
        'select_datasets': ['webvid10m', 'webvid2m', 'activitynet', 'vidal', 'hdvila'],
    },
    # 'frames' entry without an 'fps' key.
    # NOTE(review): presumably the loader applies its own default -- confirm.
    'promptv1_2_internal': {
        'data_type': 'frames',
        'train_data_path': '/mnt/bn/algo-masp-nas-2/kaili.zhao/data/masp_data/train/gpt4v_annotation/202400401week_gpt4v_all_videos_unique_ids.json',
        'task_types': ['caption'],
    },
}