| { |
| "run": { |
| "task": "video_text_pretrain", |
| "lr_sched": "linear_warmup_cosine_lr", |
| "init_lr": 3e-05, |
| "min_lr": 1e-05, |
| "warmup_lr": 1e-06, |
| "weight_decay": 0.05, |
| "max_epoch": 3, |
| "iters_per_epoch": 51377, |
| "batch_size_train": 2, |
| "batch_size_eval": 4, |
| "num_workers": 4, |
| "warmup_steps": 25688, |
| "accum_grad_iters": 8, |
| "seed": 42, |
| "output_dir": "/data/mjjung/timechat/activitynet_vtune", |
| "amp": true, |
| "resume_ckpt_path": null, |
| "evaluate": false, |
| "train_splits": [ |
| "train" |
| ], |
| "device": "cuda", |
| "world_size": 4, |
| "dist_url": "env://", |
| "distributed": true, |
| "rank": 0, |
| "gpu": 0, |
| "dist_backend": "nccl" |
| }, |
| "model": { |
| "arch": "timechat", |
| "image_size": 224, |
| "drop_path_rate": 0, |
| "use_grad_checkpoint": true, |
| "vit_precision": "fp16", |
| "freeze_vit": true, |
| "freeze_qformer": false, |
| "num_query_token": 32, |
| "llama_model": "/data/mjjung/Video-LLaMA/Video-LLaMA-2-7B-Finetuned/llama-2-7b-chat-hf/", |
| "prompt": "", |
| "model_type": "pretrain_llama_v2", |
| "vit_model": "/data/mjjung/timechat/eva_vit_g.pth", |
| "q_former_model": "/data/mjjung/timechat/instruct_blip_vicuna7b_trimmed.pth", |
| "ckpt": "/data/mjjung/timechat/timechat_7b.pth", |
| "frozen_llama_proj": false, |
| "frozen_video_Qformer": false, |
| "fusion_head_layers": 2, |
| "max_frame_pos": 96, |
| "fusion_header_type": "seqTransf", |
| "max_txt_len": 2048, |
| "end_sym": "</s>", |
| "prompt_path": "", |
| "prompt_template": "[INST] <<SYS>>\\n \\n<</SYS>>\\n\\n{} [/INST] ", |
| "lora": true, |
| "lora_inference_mode": false, |
| "qformer_text_input": true, |
| "window_size": 32, |
| "stride": 32 |
| }, |
| "preprocess": { |
| "vis_processor": { |
| "train": { |
| "name": "alpro_video_train", |
| "image_size": 224, |
| "n_frms": 8 |
| }, |
| "eval": { |
| "name": "alpro_video_eval", |
| "image_size": 224, |
| "n_frms": 8 |
| } |
| }, |
| "text_processor": { |
| "train": { |
| "name": "blip_caption" |
| }, |
| "eval": { |
| "name": "blip_caption" |
| } |
| } |
| }, |
| "datasets": { |
| "charades_instruct": { |
| "data_type": "video", |
| "build_info": { |
| "anno_dir": "data/activitynet_filtered_qa_grounding.json", |
| "videos_dir": "/data/video_datasets/" |
| }, |
| "vis_processor": { |
| "train": { |
| "name": "alpro_video_train", |
| "n_frms": 96, |
| "image_size": 224 |
| } |
| }, |
| "text_processor": { |
| "train": { |
| "name": "blip_caption" |
| } |
| }, |
| "num_video_query_token": 32, |
| "tokenizer_name": "/data/mjjung/Video-LLaMA/Video-LLaMA-2-7B-Finetuned/llama-2-7b-chat-hf/", |
| "model_type": "llama_v2", |
| "num_frm": 96, |
| "sample_type": "rand", |
| "max_txt_len": 2048, |
| "stride": 32 |
| } |
| } |
| } |
| {"train_lr": "0.000", "train_loss": "0.162"} |
|
|