MgGladys commited on
Commit
5189071
·
verified ·
1 Parent(s): 0a937d7

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +209 -0
  2. _fonts/NotoSansSC-Regular.otf +3 -0
  3. assets/example_video.mp4 +3 -0
  4. assets/mmeb_v2.png +3 -0
  5. assets/teaser.png +3 -0
  6. assets/train_vlm.png +3 -0
  7. assets/vlm2vec_results.png +3 -0
  8. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-100/model.safetensors +3 -0
  9. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-100/optimizer.pt +3 -0
  10. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-100/rng_state.pth +3 -0
  11. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-100/scheduler.pt +3 -0
  12. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-100/tokenizer.json +3 -0
  13. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-100/training_args.bin +3 -0
  14. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-200/model.safetensors +3 -0
  15. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-200/optimizer.pt +3 -0
  16. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-200/rng_state.pth +3 -0
  17. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-200/scheduler.pt +3 -0
  18. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-200/tokenizer.json +3 -0
  19. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-200/training_args.bin +3 -0
  20. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-300/model.safetensors +3 -0
  21. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-300/optimizer.pt +3 -0
  22. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-300/rng_state.pth +3 -0
  23. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-300/scheduler.pt +3 -0
  24. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-300/tokenizer.json +3 -0
  25. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-300/training_args.bin +3 -0
  26. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-400/optimizer.pt +3 -0
  27. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-400/tokenizer.json +3 -0
  28. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-500/model.safetensors +3 -0
  29. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-500/optimizer.pt +3 -0
  30. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-500/rng_state.pth +3 -0
  31. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-500/scheduler.pt +3 -0
  32. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-500/training_args.bin +3 -0
  33. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-600/model.safetensors +3 -0
  34. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-600/rng_state.pth +3 -0
  35. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-600/scheduler.pt +3 -0
  36. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-600/tokenizer.json +3 -0
  37. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-600/training_args.bin +3 -0
  38. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-700/model.safetensors +3 -0
  39. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-700/optimizer.pt +3 -0
  40. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-700/rng_state.pth +3 -0
  41. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-700/scheduler.pt +3 -0
  42. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-700/tokenizer.json +3 -0
  43. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-700/training_args.bin +3 -0
  44. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-800/model.safetensors +3 -0
  45. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-800/optimizer.pt +3 -0
  46. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-800/rng_state.pth +3 -0
  47. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-800/scheduler.pt +3 -0
  48. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-800/tokenizer.json +3 -0
  49. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-800/training_args.bin +3 -0
  50. experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode_Classifier_Layer12_V5_i_ret_bsz128/checkpoint-100/model.safetensors +3 -0
.gitattributes CHANGED
@@ -74,3 +74,212 @@ output_text_image.png filter=lfs diff=lfs merge=lfs -text
74
  ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-2200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
75
  ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-3600/tokenizer.json filter=lfs diff=lfs merge=lfs -text
76
  ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-4600/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
74
  ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-2200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
75
  ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-3600/tokenizer.json filter=lfs diff=lfs merge=lfs -text
76
  ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-4600/tokenizer.json filter=lfs diff=lfs merge=lfs -text
77
+ experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-800/tokenizer.json filter=lfs diff=lfs merge=lfs -text
78
+ experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-600/tokenizer.json filter=lfs diff=lfs merge=lfs -text
79
+ experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-400/tokenizer.json filter=lfs diff=lfs merge=lfs -text
80
+ experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-300/tokenizer.json filter=lfs diff=lfs merge=lfs -text
81
+ experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
82
+ experiments/Qwen2_5vl_3B_multilayer_distill_AOP_pooling_all_12_10_h100_4_Classifier_Layer12_V5_i_ret/checkpoint-100/tokenizer.json filter=lfs diff=lfs merge=lfs -text
83
+ experiments/Qwen2_5vl_3B_multilayer_distill_AOP_pooling_all_12_10_h100_4_Classifier_Layer12_V5_i_ret/wandb/run-20251215_064148-aq39pr89/run-aq39pr89.wandb filter=lfs diff=lfs merge=lfs -text
84
+ experiments/Qwen2_5vl_7B_multilayer_distill_AOP_pooling_all_12_10_h100_4_Classifier_Layer12_V5_i_ret_bsz512/wandb/run-20251222_084206-k6srohpe/run-k6srohpe.wandb filter=lfs diff=lfs merge=lfs -text
85
+ experiments/Qwen2_5vl_7B_multilayer_distill_AOP_pooling_all_12_10_h100_4_Classifier_Layer12_V5_i_ret_bsz512/checkpoint-500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
86
+ experiments/Qwen2_5vl_7B_multilayer_distill_AOP_pooling_all_12_10_h100_4_Classifier_Layer12_V5_i_ret_bsz512/checkpoint-800/tokenizer.json filter=lfs diff=lfs merge=lfs -text
87
+ experiments/Qwen2_5vl_7B_multilayer_distill_AOP_pooling_all_12_10_h100_4_Classifier_Layer12_V5_i_ret_bsz512/checkpoint-600/tokenizer.json filter=lfs diff=lfs merge=lfs -text
88
+ experiments/Qwen2_5vl_7B_multilayer_distill_AOP_pooling_all_12_10_h100_4_Classifier_Layer12_V5_i_ret_bsz512/checkpoint-400/tokenizer.json filter=lfs diff=lfs merge=lfs -text
89
+ experiments/Qwen2_5vl_7B_multilayer_distill_AOP_pooling_all_12_10_h100_4_Classifier_Layer12_V5_i_ret_bsz512/checkpoint-300/tokenizer.json filter=lfs diff=lfs merge=lfs -text
90
+ experiments/Qwen2_5vl_7B_multilayer_distill_AOP_pooling_all_12_10_h100_4_Classifier_Layer12_V5_i_ret_bsz512/checkpoint-200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
91
+ experiments/Qwen2_5vl_7B_multilayer_distill_aop_10_pooling_i_ret_12_30_h100_2_node_Classifier_L12_i_ret_bsz512/tokenizer.json filter=lfs diff=lfs merge=lfs -text
92
+ experiments/Qwen2_5vl_7B_multilayer_distill_aop_10_pooling_i_ret_12_30_h100_2_node_Classifier_L12_i_ret_bsz512/checkpoint-100/tokenizer.json filter=lfs diff=lfs merge=lfs -text
93
+ experiments/Qwen2_5vl_7B_multilayer_distill_aop_10_pooling_i_ret_12_30_h100_2_node_Classifier_L12_i_ret_bsz512/checkpoint-1000/tokenizer.json filter=lfs diff=lfs merge=lfs -text
94
+ experiments/Qwen2_5vl_7B_multilayer_distill_aop_10_pooling_i_ret_12_30_h100_2_node_Classifier_L12_i_ret_bsz512/checkpoint-700/tokenizer.json filter=lfs diff=lfs merge=lfs -text
95
+ experiments/Qwen2_5vl_7B_multilayer_distill_aop_10_pooling_i_ret_12_30_h100_2_node_Classifier_L12_i_ret_bsz512/checkpoint-900/tokenizer.json filter=lfs diff=lfs merge=lfs -text
96
+ experiments/Qwen2_5vl_7B_multilayer_distill_aop_10_pooling_i_ret_12_30_h100_2_node_Classifier_L12_i_ret_bsz512/checkpoint-500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
97
+ experiments/Qwen2_5vl_7B_multilayer_distill_aop_10_pooling_i_ret_12_30_h100_2_node_Classifier_L12_i_ret_bsz512/checkpoint-800/tokenizer.json filter=lfs diff=lfs merge=lfs -text
98
+ experiments/Qwen2_5vl_7B_multilayer_distill_aop_10_pooling_i_ret_12_30_h100_2_node_Classifier_L12_i_ret_bsz512/checkpoint-600/tokenizer.json filter=lfs diff=lfs merge=lfs -text
99
+ experiments/Qwen2_5vl_7B_multilayer_distill_aop_10_pooling_i_ret_12_30_h100_2_node_Classifier_L12_i_ret_bsz512/checkpoint-400/tokenizer.json filter=lfs diff=lfs merge=lfs -text
100
+ experiments/Qwen2_5vl_7B_multilayer_distill_aop_10_pooling_i_ret_12_30_h100_2_node_Classifier_L12_i_ret_bsz512/checkpoint-300/tokenizer.json filter=lfs diff=lfs merge=lfs -text
101
+ experiments/Qwen2_5vl_7B_multilayer_distill_aop_10_pooling_i_ret_12_30_h100_2_node_Classifier_L12_i_ret_bsz512/checkpoint-200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
102
+ experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-100/tokenizer.json filter=lfs diff=lfs merge=lfs -text
103
+ experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-700/tokenizer.json filter=lfs diff=lfs merge=lfs -text
104
+ experiments/Qwen2_5vl_3B_multilayer_distill_AOP_pooling_all_12_10_h100_4_Classifier_Layer12_V5_i_ret/checkpoint-700/tokenizer.json filter=lfs diff=lfs merge=lfs -text
105
+ experiments/Qwen2_5vl_3B_multilayer_distill_AOP_pooling_all_12_10_h100_4_Classifier_Layer12_V5_i_ret/checkpoint-500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
106
+ experiments/Qwen2_5vl_3B_multilayer_distill_AOP_pooling_all_12_10_h100_4_Classifier_Layer12_V5_i_ret/checkpoint-600/tokenizer.json filter=lfs diff=lfs merge=lfs -text
107
+ experiments/Qwen2_5vl_3B_multilayer_distill_AOP_pooling_all_12_10_h100_4_Classifier_Layer12_V5_i_ret/checkpoint-400/tokenizer.json filter=lfs diff=lfs merge=lfs -text
108
+ experiments/Qwen2_5vl_3B_multilayer_distill_AOP_pooling_all_12_10_h100_4_Classifier_Layer12_V5_i_ret/checkpoint-200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
109
+ experiments/Qwen2_5vl_3B_multilayer_distill_AOP_pooling_all_12_10_h100_4_Classifier_Layer12_V5_i_ret/checkpoint-300/tokenizer.json filter=lfs diff=lfs merge=lfs -text
110
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_infovqa_qry_layer12 filter=lfs diff=lfs merge=lfs -text
111
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_infovqa_score_details_both_layers.jsonl filter=lfs diff=lfs merge=lfs -text
112
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_shiftproject_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
113
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_shiftproject_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
114
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_docvqa_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
115
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_docvqa_qry_layer12 filter=lfs diff=lfs merge=lfs -text
116
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_tatdqa_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
117
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_docvqa_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
118
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_tatdqa_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
119
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_infovqa_score_details_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
120
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_shiftproject_qry_layer12 filter=lfs diff=lfs merge=lfs -text
121
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_infovqa_qry_layerlast filter=lfs diff=lfs merge=lfs -text
122
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_tabfquad_qry_layer12 filter=lfs diff=lfs merge=lfs -text
123
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_docvqa_qry_layerlast filter=lfs diff=lfs merge=lfs -text
124
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_arxivqa_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
125
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_tatdqa_qry_layer12 filter=lfs diff=lfs merge=lfs -text
126
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_arxivqa_score_details_both_layers.jsonl filter=lfs diff=lfs merge=lfs -text
127
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_tabfquad_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
128
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_infovqa_score_details_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
129
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_tabfquad_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
130
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_tatdqa_qry_layerlast filter=lfs diff=lfs merge=lfs -text
131
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_infovqa_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
132
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_arxivqa_score_details_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
133
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_arxivqa_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
134
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_docvqa_score_details_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
135
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_tabfquad_qry_layerlast filter=lfs diff=lfs merge=lfs -text
136
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_docvqa_score_details_both_layers.jsonl filter=lfs diff=lfs merge=lfs -text
137
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_arxivqa_qry_layer12 filter=lfs diff=lfs merge=lfs -text
138
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_arxivqa_score_details_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
139
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_arxivqa_qry_layerlast filter=lfs diff=lfs merge=lfs -text
140
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_shiftproject_qry_layerlast filter=lfs diff=lfs merge=lfs -text
141
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_docvqa_score_details_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
142
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_infovqa_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
143
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_tatdqa_score_details_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
144
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_tatdqa_score_details_both_layers.jsonl filter=lfs diff=lfs merge=lfs -text
145
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/visdoc_retrival/ViDoRe_tatdqa_score_details_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
146
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/OVEN_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
147
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/NIGHTS_pred_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
148
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/NIGHTS_pred_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
149
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_t2i_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
150
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/FashionIQ_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
151
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisDial_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
152
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/EDIS_pred_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
153
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_t2i_score_details_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
154
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_t2i_qry_layerlast filter=lfs diff=lfs merge=lfs -text
155
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_i2t_qry_layer12 filter=lfs diff=lfs merge=lfs -text
156
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/EDIS_score_details_both_layers.jsonl filter=lfs diff=lfs merge=lfs -text
157
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/FashionIQ_score_details_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
158
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/WebQA_score_details_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
159
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/EDIS_qry_layerlast filter=lfs diff=lfs merge=lfs -text
160
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/FashionIQ_info.jsonl filter=lfs diff=lfs merge=lfs -text
161
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/FashionIQ_pred_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
162
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_i2t_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
163
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_t2i_pred_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
164
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/FashionIQ_score_details_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
165
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_i2t_pred_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
166
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisDial_score_details_both_layers.jsonl filter=lfs diff=lfs merge=lfs -text
167
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisDial_qry_layerlast filter=lfs diff=lfs merge=lfs -text
168
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_t2i_score_details_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
169
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/NIGHTS_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
170
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/FashionIQ_score_details_both_layers.jsonl filter=lfs diff=lfs merge=lfs -text
171
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_t2i_score_details_both_layers.jsonl filter=lfs diff=lfs merge=lfs -text
172
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/NIGHTS_qry_layer12 filter=lfs diff=lfs merge=lfs -text
173
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_i2t_score_details_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
174
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/WebQA_qry_layer12 filter=lfs diff=lfs merge=lfs -text
175
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/EDIS_score_details_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
176
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/FashionIQ_qry_layerlast filter=lfs diff=lfs merge=lfs -text
177
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/Wiki-SS-NQ_info.jsonl filter=lfs diff=lfs merge=lfs -text
178
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/EDIS_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
179
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_i2t_score_details_both_layers.jsonl filter=lfs diff=lfs merge=lfs -text
180
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/WebQA_score_details_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
181
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/OVEN_score_details_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
182
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/CIRR_score_details_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
183
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/OVEN_info.jsonl filter=lfs diff=lfs merge=lfs -text
184
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/Wiki-SS-NQ_qry_layer12 filter=lfs diff=lfs merge=lfs -text
185
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/OVEN_qry_layer12 filter=lfs diff=lfs merge=lfs -text
186
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/CIRR_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
187
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/CIRR_qry_layerlast filter=lfs diff=lfs merge=lfs -text
188
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/WebQA_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
189
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisDial_pred_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
190
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_i2t_info.jsonl filter=lfs diff=lfs merge=lfs -text
191
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/FashionIQ_pred_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
192
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/EDIS_score_details_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
193
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_t2i_pred_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
194
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisDial_score_details_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
195
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/CIRR_qry_layer12 filter=lfs diff=lfs merge=lfs -text
196
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_i2t_score_details_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
197
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/CIRR_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
198
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/Wiki-SS-NQ_qry_layerlast filter=lfs diff=lfs merge=lfs -text
199
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/EDIS_pred_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
200
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_t2i_pred_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
201
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_t2i_score_details_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
202
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/EDIS_info.jsonl filter=lfs diff=lfs merge=lfs -text
203
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisDial_score_details_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
204
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/NIGHTS_info.jsonl filter=lfs diff=lfs merge=lfs -text
205
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_t2i_info.jsonl filter=lfs diff=lfs merge=lfs -text
206
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_t2i_qry_layerlast filter=lfs diff=lfs merge=lfs -text
207
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_i2t_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
208
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_t2i_qry_layer12 filter=lfs diff=lfs merge=lfs -text
209
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_i2t_qry_layerlast filter=lfs diff=lfs merge=lfs -text
210
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/WebQA_pred_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
211
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_t2i_qry_layer12 filter=lfs diff=lfs merge=lfs -text
212
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/NIGHTS_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
213
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_i2t_pred_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
214
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_t2i_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
215
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/CIRR_score_details_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
216
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_i2t_info.jsonl filter=lfs diff=lfs merge=lfs -text
217
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisDial_pred_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
218
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/Wiki-SS-NQ_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
219
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_i2t_score_details_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
220
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/OVEN_pred_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
221
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/FashionIQ_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
222
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/OVEN_qry_layerlast filter=lfs diff=lfs merge=lfs -text
223
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/WebQA_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
224
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/EDIS_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
225
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_i2t_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
226
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_t2i_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
227
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/EDIS_qry_layer12 filter=lfs diff=lfs merge=lfs -text
228
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_t2i_pred_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
229
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/NIGHTS_score_details_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
230
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_t2i_info.jsonl filter=lfs diff=lfs merge=lfs -text
231
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/WebQA_pred_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
232
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_i2t_qry_layer12 filter=lfs diff=lfs merge=lfs -text
233
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/CIRR_info.jsonl filter=lfs diff=lfs merge=lfs -text
234
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_t2i_score_details_both_layers.jsonl filter=lfs diff=lfs merge=lfs -text
235
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_i2t_tgt_layerlast filter=lfs diff=lfs merge=lfs -text
236
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_i2t_pred_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
237
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_i2t_score_details_both_layers.jsonl filter=lfs diff=lfs merge=lfs -text
238
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_i2t_score_details_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
239
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/NIGHTS_score_details_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
240
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/OVEN_pred_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
241
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/WebQA_qry_layerlast filter=lfs diff=lfs merge=lfs -text
242
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/Wiki-SS-NQ_cand_img_token_masks_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
243
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_i2t_pred_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
244
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/OVEN_score_details_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
245
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisDial_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
246
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/FashionIQ_qry_layer12 filter=lfs diff=lfs merge=lfs -text
247
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisDial_info.jsonl filter=lfs diff=lfs merge=lfs -text
248
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/CIRR_pred_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
249
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_t2i_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
250
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/OVEN_tgt_layer12 filter=lfs diff=lfs merge=lfs -text
251
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/WebQA_info.jsonl filter=lfs diff=lfs merge=lfs -text
252
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisualNews_i2t_qry_layerlast filter=lfs diff=lfs merge=lfs -text
253
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/NIGHTS_qry_layerlast filter=lfs diff=lfs merge=lfs -text
254
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/VisDial_qry_layer12 filter=lfs diff=lfs merge=lfs -text
255
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/WebQA_score_details_both_layers.jsonl filter=lfs diff=lfs merge=lfs -text
256
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/MSCOCO_t2i_score_details_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
257
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/CIRR_score_details_both_layers.jsonl filter=lfs diff=lfs merge=lfs -text
258
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/NIGHTS_score_details_both_layers.jsonl filter=lfs diff=lfs merge=lfs -text
259
+ _fonts/NotoSansSC-Regular.otf filter=lfs diff=lfs merge=lfs -text
260
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/CIRR_pred_layerlast.jsonl filter=lfs diff=lfs merge=lfs -text
261
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/Wiki-SS-NQ_cand_text_token_masks_layer12.jsonl filter=lfs diff=lfs merge=lfs -text
262
+ exps/l12_t_0.5_8_i_2000/VLM2Vec-V2.0-Qwen2VL-2B/image_retrival/OVEN_score_details_both_layers.jsonl filter=lfs diff=lfs merge=lfs -text
263
+ ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-1700/tokenizer.json filter=lfs diff=lfs merge=lfs -text
264
+ ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-5000/tokenizer.json filter=lfs diff=lfs merge=lfs -text
265
+ ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/wandb/run-20251225_171245-4tqbpvs0/run-4tqbpvs0.wandb filter=lfs diff=lfs merge=lfs -text
266
+ ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-1600/tokenizer.json filter=lfs diff=lfs merge=lfs -text
267
+ ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-1800/tokenizer.json filter=lfs diff=lfs merge=lfs -text
268
+ ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-400/tokenizer.json filter=lfs diff=lfs merge=lfs -text
269
+ ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-1900/tokenizer.json filter=lfs diff=lfs merge=lfs -text
270
+ ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-4800/tokenizer.json filter=lfs diff=lfs merge=lfs -text
271
+ ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-4500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
272
+ ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/train.log filter=lfs diff=lfs merge=lfs -text
273
+ ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-300/tokenizer.json filter=lfs diff=lfs merge=lfs -text
274
+ ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-3700/tokenizer.json filter=lfs diff=lfs merge=lfs -text
275
+ ~/experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode/checkpoint-200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
276
+ assets/train_vlm.png filter=lfs diff=lfs merge=lfs -text
277
+ assets/example_video.mp4 filter=lfs diff=lfs merge=lfs -text
278
+ assets/mmeb_v2.png filter=lfs diff=lfs merge=lfs -text
279
+ assets/teaser.png filter=lfs diff=lfs merge=lfs -text
280
+ assets/vlm2vec_results.png filter=lfs diff=lfs merge=lfs -text
281
+ experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode_Classifier_Layer12_V5_i_ret_bsz128/checkpoint-600/tokenizer.json filter=lfs diff=lfs merge=lfs -text
282
+ experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode_Classifier_Layer12_V5_i_ret_bsz128/checkpoint-400/tokenizer.json filter=lfs diff=lfs merge=lfs -text
283
+ experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode_Classifier_Layer12_V5_i_ret_bsz128/checkpoint-300/tokenizer.json filter=lfs diff=lfs merge=lfs -text
284
+ experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode_Classifier_Layer12_V5_i_ret_bsz128/checkpoint-200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
285
+ experiments/Qwen2_5vl_3B_multilayer_distill_AOP_pooling_all_12_10_h100_4_Classifier_Layer12_V5_i_ret_bsz1024/tokenizer.json filter=lfs diff=lfs merge=lfs -text
_fonts/NotoSansSC-Regular.otf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36a6899ea83db9e0615ca12e445789dfdc0a5382d0cd15bacb1f42a2fe590e6f
3
+ size 2318796
assets/example_video.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8da3fb45df69e628d09809e88b3f3725568de5d094a45361dea2a54d3e205f17
3
+ size 608283
assets/mmeb_v2.png ADDED

Git LFS Details

  • SHA256: 079ddc416a616456ae32725ea32e758989bd6867992454a2a5fd0fa55c47a98c
  • Pointer size: 131 Bytes
  • Size of remote file: 339 kB
assets/teaser.png ADDED

Git LFS Details

  • SHA256: e1ce982d7fe118f2472669d39f807293d1964c1e7db201899605ace77539340c
  • Pointer size: 131 Bytes
  • Size of remote file: 347 kB
assets/train_vlm.png ADDED

Git LFS Details

  • SHA256: 8d69b9f62e3a962dbd60794207fb96c9afaad7f0e0b64480c13b669c262f3792
  • Pointer size: 131 Bytes
  • Size of remote file: 726 kB
assets/vlm2vec_results.png ADDED

Git LFS Details

  • SHA256: 37c8ed75cf50bf47b9460685b4ed820487c96c9858bca5a1470063366771aa4c
  • Pointer size: 131 Bytes
  • Size of remote file: 739 kB
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-100/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73daf458973717697b4cc74457dbbdef65f4e08708267bafd86be0cc8fa2579d
3
+ size 610620
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-100/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:172c79cad39433fdd3c928d7f6e9903f496563fa761b2537025a2ff6c2b87638
3
+ size 1233404
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-100/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2621e38ab5fcefc6915d35fcaa7b27d5b5892fccaa7ae5c9f7b7d4ba498321e9
3
+ size 14709
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-100/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3222e0bb19d7f9cf6eb8a496a9297573dc0b270b4c55c8e2eaa9443c5b18b442
3
+ size 1465
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-100/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
3
+ size 11421896
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-100/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92ea4c997f296f10998af2302d56fce60bc8df3b9a633845d423e218037881f8
3
+ size 6289
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-200/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25a4680b337688c3587234972703020a1492e750f8aa427d0d23eda4f82d3cd7
3
+ size 610620
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-200/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:694ca84778f20efab1125d413d633e3ba954e1c114c05f0fe7862b635d152526
3
+ size 1233404
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-200/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f361fa76441c3b1efbde41f6319a94924c7085661f8693a07ca2510716fda0ea
3
+ size 14709
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-200/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc4996496bbf363708baba32f39889a80aadbe5b598653714ed77f13a8eecaa5
3
+ size 1465
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-200/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
3
+ size 11421896
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-200/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92ea4c997f296f10998af2302d56fce60bc8df3b9a633845d423e218037881f8
3
+ size 6289
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-300/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2cc60fd8092c4a03186f53c737dbaa848af63a3a7cf6b5c3e9961215b88759b
3
+ size 610620
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-300/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3908632c49dc1058c19d651765da5dcb76eef577e9d367300b3794936f74980f
3
+ size 1233404
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-300/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a82c339d5618f51a6eaa4ce5212b7a1d380d5e011d58a29553c0c43469f9346e
3
+ size 14709
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-300/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9008526ba75ad62032e440b0c008b057b115ab20ed57dfeabf0d04a531a70829
3
+ size 1465
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-300/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
3
+ size 11421896
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-300/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92ea4c997f296f10998af2302d56fce60bc8df3b9a633845d423e218037881f8
3
+ size 6289
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-400/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5489ba4fc074ff8a3dc85d4437bb0aaa25d86e2acb7553ebed4a9b384b6d5b75
3
+ size 1233404
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-400/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
3
+ size 11421896
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-500/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c45908c34c0b2ea61e62dc26f4e31f8c9bb6cfd8357ec956a597469a6e9b621e
3
+ size 610620
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-500/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65558959c8cd23a90c6cd3946c0199dd303bfe3f81a42312667cb6f06cb02b35
3
+ size 1233404
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-500/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f32c9d936626b1947211b7357e2fea06f301de933ce4914ce1b9ae00ec8aa293
3
+ size 14709
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-500/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:722558c642a49ec4ef9ed99cc7abfff13930586cde1147e66b9c12925bb52695
3
+ size 1465
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-500/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92ea4c997f296f10998af2302d56fce60bc8df3b9a633845d423e218037881f8
3
+ size 6289
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-600/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:780ff7e98ef82c2564499f93e001375da2ce49c9fb27ebb415a8a7b3776db075
3
+ size 610620
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-600/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b81d79a92f1efb5bbe5dc9a5e19acc17e196de66e6b3ac0ff6b2306ffe71c71
3
+ size 14709
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-600/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26e061621879b73539433b27b4cb7d185c26675fa608ca552f868527fe25da0f
3
+ size 1465
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-600/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
3
+ size 11421896
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-600/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92ea4c997f296f10998af2302d56fce60bc8df3b9a633845d423e218037881f8
3
+ size 6289
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-700/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0090bd8e0b61dd6a52acb1b89994945ca61ddd454dcfbacee79e6eb053931f65
3
+ size 610620
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-700/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9cb3f07a3444711f501dacf5587b26ac22df9d2f4148729d5bcdf149dfa671e
3
+ size 1233404
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-700/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c05b43259dbbddb8ff60eedd2a5bda8741bec334675fa80f610092cebf24936
3
+ size 14709
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-700/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba0f6f25405a7159eff6ef362532d600a82fb1edaf96938dfe9d5b6ab51e5995
3
+ size 1465
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-700/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
3
+ size 11421896
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-700/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92ea4c997f296f10998af2302d56fce60bc8df3b9a633845d423e218037881f8
3
+ size 6289
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-800/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:423de7e9ec1e416d3ce1cc68b4bc3466d7c8e720ef37ce0ded443809c0cdb76e
3
+ size 610620
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-800/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3305ae01c42962d0ebb8bbbf209e813275ba88e56d7c1bae09b335f330ea33d7
3
+ size 1233404
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-800/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8af55f04e98ebbb30c150c2e6b577eb3aa22db26ea54c90b247c4f06f7e7001
3
+ size 14709
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-800/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83beb3128052f974860ed5a9840c49f4725edca47579a2e1cf084edb206e08cc
3
+ size 1465
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-800/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
3
+ size 11421896
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_DISTILL_FLOOR_0_12_3_h100_3_Classifier_Layer12_V5_i_ret/checkpoint-800/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92ea4c997f296f10998af2302d56fce60bc8df3b9a633845d423e218037881f8
3
+ size 6289
experiments/Qwen2_5vl_3B_multilayer_distill_AOP_10_pooling_12_26_a100_multinode_Classifier_Layer12_V5_i_ret_bsz128/checkpoint-100/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01628a6d0c8e456c004b0c7cd547bd58efa36d3bbe5d1453f7dcc9afbd67a283
3
+ size 610620