MgGladys commited on
Commit
4e3e79a
·
verified ·
1 Parent(s): 3902497

Add files using upload-large-folder tool

Browse files
Files changed (20) hide show
  1. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-100/added_tokens.json +24 -0
  2. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-100/chat_template.jinja +7 -0
  3. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-100/preprocessor_config.json +29 -0
  4. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-100/special_tokens_map.json +31 -0
  5. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-100/tokenizer_config.json +208 -0
  6. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-100/trainer_state.json +734 -0
  7. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-100/vocab.json +0 -0
  8. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-500/added_tokens.json +24 -0
  9. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-500/chat_template.jinja +7 -0
  10. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-500/preprocessor_config.json +29 -0
  11. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-500/special_tokens_map.json +31 -0
  12. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-500/tokenizer_config.json +208 -0
  13. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-500/trainer_state.json +3534 -0
  14. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/train_cls.log +0 -0
  15. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/wandb/debug-internal.log +6 -0
  16. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/wandb/debug.log +22 -0
  17. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/wandb/run-20251208_155605-ooq67cso/logs/debug-internal.log +6 -0
  18. experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/wandb/run-20251208_155605-ooq67cso/logs/debug.log +22 -0
  19. experiments/public/all_scores/LamRA-Ret.json +2198 -0
  20. experiments/public/all_scores/VLM2Vec-V2.0-Qwen2VL-2B.json +2198 -0
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-100/added_tokens.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "</tool_call>": 151658,
3
+ "<tool_call>": 151657,
4
+ "<|box_end|>": 151649,
5
+ "<|box_start|>": 151648,
6
+ "<|endoftext|>": 151643,
7
+ "<|file_sep|>": 151664,
8
+ "<|fim_middle|>": 151660,
9
+ "<|fim_pad|>": 151662,
10
+ "<|fim_prefix|>": 151659,
11
+ "<|fim_suffix|>": 151661,
12
+ "<|im_end|>": 151645,
13
+ "<|im_start|>": 151644,
14
+ "<|image_pad|>": 151655,
15
+ "<|object_ref_end|>": 151647,
16
+ "<|object_ref_start|>": 151646,
17
+ "<|quad_end|>": 151651,
18
+ "<|quad_start|>": 151650,
19
+ "<|repo_name|>": 151663,
20
+ "<|video_pad|>": 151656,
21
+ "<|vision_end|>": 151653,
22
+ "<|vision_pad|>": 151654,
23
+ "<|vision_start|>": 151652
24
+ }
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-100/chat_template.jinja ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system
2
+ You are a helpful assistant.<|im_end|>
3
+ {% endif %}<|im_start|>{{ message['role'] }}
4
+ {% if message['content'] is string %}{{ message['content'] }}<|im_end|>
5
+ {% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>
6
+ {% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant
7
+ {% endif %}
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-100/preprocessor_config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_convert_rgb": true,
3
+ "do_normalize": true,
4
+ "do_rescale": true,
5
+ "do_resize": true,
6
+ "image_mean": [
7
+ 0.48145466,
8
+ 0.4578275,
9
+ 0.40821073
10
+ ],
11
+ "image_processor_type": "Qwen2_5_VLImageProcessor",
12
+ "image_std": [
13
+ 0.26862954,
14
+ 0.26130258,
15
+ 0.27577711
16
+ ],
17
+ "max_pixels": 1003520,
18
+ "merge_size": 2,
19
+ "min_pixels": 3136,
20
+ "patch_size": 14,
21
+ "processor_class": "Qwen2_5_VLProcessor",
22
+ "resample": 3,
23
+ "rescale_factor": 0.00392156862745098,
24
+ "size": {
25
+ "max_pixels": 1003520,
26
+ "min_pixels": 3136
27
+ },
28
+ "temporal_patch_size": 2
29
+ }
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-100/special_tokens_map.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<|im_start|>",
4
+ "<|im_end|>",
5
+ "<|object_ref_start|>",
6
+ "<|object_ref_end|>",
7
+ "<|box_start|>",
8
+ "<|box_end|>",
9
+ "<|quad_start|>",
10
+ "<|quad_end|>",
11
+ "<|vision_start|>",
12
+ "<|vision_end|>",
13
+ "<|vision_pad|>",
14
+ "<|image_pad|>",
15
+ "<|video_pad|>"
16
+ ],
17
+ "eos_token": {
18
+ "content": "<|im_end|>",
19
+ "lstrip": false,
20
+ "normalized": false,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ },
24
+ "pad_token": {
25
+ "content": "<|endoftext|>",
26
+ "lstrip": false,
27
+ "normalized": false,
28
+ "rstrip": false,
29
+ "single_word": false
30
+ }
31
+ }
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-100/tokenizer_config.json ADDED
@@ -0,0 +1,208 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": false,
3
+ "add_prefix_space": false,
4
+ "added_tokens_decoder": {
5
+ "151643": {
6
+ "content": "<|endoftext|>",
7
+ "lstrip": false,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false,
11
+ "special": true
12
+ },
13
+ "151644": {
14
+ "content": "<|im_start|>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false,
19
+ "special": true
20
+ },
21
+ "151645": {
22
+ "content": "<|im_end|>",
23
+ "lstrip": false,
24
+ "normalized": false,
25
+ "rstrip": false,
26
+ "single_word": false,
27
+ "special": true
28
+ },
29
+ "151646": {
30
+ "content": "<|object_ref_start|>",
31
+ "lstrip": false,
32
+ "normalized": false,
33
+ "rstrip": false,
34
+ "single_word": false,
35
+ "special": true
36
+ },
37
+ "151647": {
38
+ "content": "<|object_ref_end|>",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false,
43
+ "special": true
44
+ },
45
+ "151648": {
46
+ "content": "<|box_start|>",
47
+ "lstrip": false,
48
+ "normalized": false,
49
+ "rstrip": false,
50
+ "single_word": false,
51
+ "special": true
52
+ },
53
+ "151649": {
54
+ "content": "<|box_end|>",
55
+ "lstrip": false,
56
+ "normalized": false,
57
+ "rstrip": false,
58
+ "single_word": false,
59
+ "special": true
60
+ },
61
+ "151650": {
62
+ "content": "<|quad_start|>",
63
+ "lstrip": false,
64
+ "normalized": false,
65
+ "rstrip": false,
66
+ "single_word": false,
67
+ "special": true
68
+ },
69
+ "151651": {
70
+ "content": "<|quad_end|>",
71
+ "lstrip": false,
72
+ "normalized": false,
73
+ "rstrip": false,
74
+ "single_word": false,
75
+ "special": true
76
+ },
77
+ "151652": {
78
+ "content": "<|vision_start|>",
79
+ "lstrip": false,
80
+ "normalized": false,
81
+ "rstrip": false,
82
+ "single_word": false,
83
+ "special": true
84
+ },
85
+ "151653": {
86
+ "content": "<|vision_end|>",
87
+ "lstrip": false,
88
+ "normalized": false,
89
+ "rstrip": false,
90
+ "single_word": false,
91
+ "special": true
92
+ },
93
+ "151654": {
94
+ "content": "<|vision_pad|>",
95
+ "lstrip": false,
96
+ "normalized": false,
97
+ "rstrip": false,
98
+ "single_word": false,
99
+ "special": true
100
+ },
101
+ "151655": {
102
+ "content": "<|image_pad|>",
103
+ "lstrip": false,
104
+ "normalized": false,
105
+ "rstrip": false,
106
+ "single_word": false,
107
+ "special": true
108
+ },
109
+ "151656": {
110
+ "content": "<|video_pad|>",
111
+ "lstrip": false,
112
+ "normalized": false,
113
+ "rstrip": false,
114
+ "single_word": false,
115
+ "special": true
116
+ },
117
+ "151657": {
118
+ "content": "<tool_call>",
119
+ "lstrip": false,
120
+ "normalized": false,
121
+ "rstrip": false,
122
+ "single_word": false,
123
+ "special": false
124
+ },
125
+ "151658": {
126
+ "content": "</tool_call>",
127
+ "lstrip": false,
128
+ "normalized": false,
129
+ "rstrip": false,
130
+ "single_word": false,
131
+ "special": false
132
+ },
133
+ "151659": {
134
+ "content": "<|fim_prefix|>",
135
+ "lstrip": false,
136
+ "normalized": false,
137
+ "rstrip": false,
138
+ "single_word": false,
139
+ "special": false
140
+ },
141
+ "151660": {
142
+ "content": "<|fim_middle|>",
143
+ "lstrip": false,
144
+ "normalized": false,
145
+ "rstrip": false,
146
+ "single_word": false,
147
+ "special": false
148
+ },
149
+ "151661": {
150
+ "content": "<|fim_suffix|>",
151
+ "lstrip": false,
152
+ "normalized": false,
153
+ "rstrip": false,
154
+ "single_word": false,
155
+ "special": false
156
+ },
157
+ "151662": {
158
+ "content": "<|fim_pad|>",
159
+ "lstrip": false,
160
+ "normalized": false,
161
+ "rstrip": false,
162
+ "single_word": false,
163
+ "special": false
164
+ },
165
+ "151663": {
166
+ "content": "<|repo_name|>",
167
+ "lstrip": false,
168
+ "normalized": false,
169
+ "rstrip": false,
170
+ "single_word": false,
171
+ "special": false
172
+ },
173
+ "151664": {
174
+ "content": "<|file_sep|>",
175
+ "lstrip": false,
176
+ "normalized": false,
177
+ "rstrip": false,
178
+ "single_word": false,
179
+ "special": false
180
+ }
181
+ },
182
+ "additional_special_tokens": [
183
+ "<|im_start|>",
184
+ "<|im_end|>",
185
+ "<|object_ref_start|>",
186
+ "<|object_ref_end|>",
187
+ "<|box_start|>",
188
+ "<|box_end|>",
189
+ "<|quad_start|>",
190
+ "<|quad_end|>",
191
+ "<|vision_start|>",
192
+ "<|vision_end|>",
193
+ "<|vision_pad|>",
194
+ "<|image_pad|>",
195
+ "<|video_pad|>"
196
+ ],
197
+ "bos_token": null,
198
+ "clean_up_tokenization_spaces": false,
199
+ "eos_token": "<|im_end|>",
200
+ "errors": "replace",
201
+ "extra_special_tokens": {},
202
+ "model_max_length": 131072,
203
+ "pad_token": "<|endoftext|>",
204
+ "processor_class": "Qwen2_5_VLProcessor",
205
+ "split_special_tokens": false,
206
+ "tokenizer_class": "Qwen2Tokenizer",
207
+ "unk_token": null
208
+ }
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-100/trainer_state.json ADDED
@@ -0,0 +1,734 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 0.1040582726326743,
6
+ "eval_steps": 500,
7
+ "global_step": 100,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.001040582726326743,
14
+ "grad_norm": 3.268874406814575,
15
+ "learning_rate": 0.0,
16
+ "loss": 0.6993,
17
+ "step": 1
18
+ },
19
+ {
20
+ "epoch": 0.002081165452653486,
21
+ "grad_norm": 3.8206846714019775,
22
+ "learning_rate": 5e-06,
23
+ "loss": 0.815,
24
+ "step": 2
25
+ },
26
+ {
27
+ "epoch": 0.003121748178980229,
28
+ "grad_norm": 3.077709436416626,
29
+ "learning_rate": 1e-05,
30
+ "loss": 0.758,
31
+ "step": 3
32
+ },
33
+ {
34
+ "epoch": 0.004162330905306972,
35
+ "grad_norm": 2.903688430786133,
36
+ "learning_rate": 1.5e-05,
37
+ "loss": 0.6332,
38
+ "step": 4
39
+ },
40
+ {
41
+ "epoch": 0.005202913631633715,
42
+ "grad_norm": 2.8597545623779297,
43
+ "learning_rate": 2e-05,
44
+ "loss": 0.7086,
45
+ "step": 5
46
+ },
47
+ {
48
+ "epoch": 0.006243496357960458,
49
+ "grad_norm": 3.6181485652923584,
50
+ "learning_rate": 2.5e-05,
51
+ "loss": 0.8511,
52
+ "step": 6
53
+ },
54
+ {
55
+ "epoch": 0.007284079084287201,
56
+ "grad_norm": 5.016982555389404,
57
+ "learning_rate": 3e-05,
58
+ "loss": 1.0901,
59
+ "step": 7
60
+ },
61
+ {
62
+ "epoch": 0.008324661810613945,
63
+ "grad_norm": 2.217885971069336,
64
+ "learning_rate": 3.5000000000000004e-05,
65
+ "loss": 0.5426,
66
+ "step": 8
67
+ },
68
+ {
69
+ "epoch": 0.009365244536940686,
70
+ "grad_norm": 2.0818731784820557,
71
+ "learning_rate": 4e-05,
72
+ "loss": 0.4986,
73
+ "step": 9
74
+ },
75
+ {
76
+ "epoch": 0.01040582726326743,
77
+ "grad_norm": 1.9352552890777588,
78
+ "learning_rate": 4.4999999999999996e-05,
79
+ "loss": 0.5358,
80
+ "step": 10
81
+ },
82
+ {
83
+ "epoch": 0.011446409989594173,
84
+ "grad_norm": 3.7815799713134766,
85
+ "learning_rate": 5e-05,
86
+ "loss": 0.877,
87
+ "step": 11
88
+ },
89
+ {
90
+ "epoch": 0.012486992715920915,
91
+ "grad_norm": 2.989179849624634,
92
+ "learning_rate": 5.5e-05,
93
+ "loss": 0.6389,
94
+ "step": 12
95
+ },
96
+ {
97
+ "epoch": 0.013527575442247659,
98
+ "grad_norm": 3.6533756256103516,
99
+ "learning_rate": 6e-05,
100
+ "loss": 0.7697,
101
+ "step": 13
102
+ },
103
+ {
104
+ "epoch": 0.014568158168574402,
105
+ "grad_norm": 2.5273356437683105,
106
+ "learning_rate": 6.500000000000001e-05,
107
+ "loss": 0.4582,
108
+ "step": 14
109
+ },
110
+ {
111
+ "epoch": 0.015608740894901144,
112
+ "grad_norm": 2.0315494537353516,
113
+ "learning_rate": 7.000000000000001e-05,
114
+ "loss": 0.4683,
115
+ "step": 15
116
+ },
117
+ {
118
+ "epoch": 0.01664932362122789,
119
+ "grad_norm": 1.3862802982330322,
120
+ "learning_rate": 7.5e-05,
121
+ "loss": 0.401,
122
+ "step": 16
123
+ },
124
+ {
125
+ "epoch": 0.01768990634755463,
126
+ "grad_norm": 3.2270781993865967,
127
+ "learning_rate": 8e-05,
128
+ "loss": 0.6733,
129
+ "step": 17
130
+ },
131
+ {
132
+ "epoch": 0.018730489073881373,
133
+ "grad_norm": 2.966115713119507,
134
+ "learning_rate": 8.5e-05,
135
+ "loss": 0.6105,
136
+ "step": 18
137
+ },
138
+ {
139
+ "epoch": 0.019771071800208116,
140
+ "grad_norm": 2.720820188522339,
141
+ "learning_rate": 8.999999999999999e-05,
142
+ "loss": 0.5462,
143
+ "step": 19
144
+ },
145
+ {
146
+ "epoch": 0.02081165452653486,
147
+ "grad_norm": 2.2214956283569336,
148
+ "learning_rate": 9.5e-05,
149
+ "loss": 0.5125,
150
+ "step": 20
151
+ },
152
+ {
153
+ "epoch": 0.021852237252861603,
154
+ "grad_norm": 2.2020890712738037,
155
+ "learning_rate": 0.0001,
156
+ "loss": 0.4953,
157
+ "step": 21
158
+ },
159
+ {
160
+ "epoch": 0.022892819979188347,
161
+ "grad_norm": 2.2625033855438232,
162
+ "learning_rate": 0.000105,
163
+ "loss": 0.5628,
164
+ "step": 22
165
+ },
166
+ {
167
+ "epoch": 0.023933402705515087,
168
+ "grad_norm": 2.223475933074951,
169
+ "learning_rate": 0.00011,
170
+ "loss": 0.5667,
171
+ "step": 23
172
+ },
173
+ {
174
+ "epoch": 0.02497398543184183,
175
+ "grad_norm": 2.982874631881714,
176
+ "learning_rate": 0.000115,
177
+ "loss": 0.6645,
178
+ "step": 24
179
+ },
180
+ {
181
+ "epoch": 0.026014568158168574,
182
+ "grad_norm": 2.5550947189331055,
183
+ "learning_rate": 0.00012,
184
+ "loss": 0.4668,
185
+ "step": 25
186
+ },
187
+ {
188
+ "epoch": 0.027055150884495317,
189
+ "grad_norm": 2.805063486099243,
190
+ "learning_rate": 0.000125,
191
+ "loss": 0.5205,
192
+ "step": 26
193
+ },
194
+ {
195
+ "epoch": 0.02809573361082206,
196
+ "grad_norm": 1.7745788097381592,
197
+ "learning_rate": 0.00013000000000000002,
198
+ "loss": 0.3622,
199
+ "step": 27
200
+ },
201
+ {
202
+ "epoch": 0.029136316337148804,
203
+ "grad_norm": 1.6776342391967773,
204
+ "learning_rate": 0.000135,
205
+ "loss": 0.3641,
206
+ "step": 28
207
+ },
208
+ {
209
+ "epoch": 0.030176899063475548,
210
+ "grad_norm": 2.4569647312164307,
211
+ "learning_rate": 0.00014000000000000001,
212
+ "loss": 0.5263,
213
+ "step": 29
214
+ },
215
+ {
216
+ "epoch": 0.031217481789802288,
217
+ "grad_norm": 1.2685638666152954,
218
+ "learning_rate": 0.000145,
219
+ "loss": 0.3199,
220
+ "step": 30
221
+ },
222
+ {
223
+ "epoch": 0.03225806451612903,
224
+ "grad_norm": 1.3093715906143188,
225
+ "learning_rate": 0.00015,
226
+ "loss": 0.4389,
227
+ "step": 31
228
+ },
229
+ {
230
+ "epoch": 0.03329864724245578,
231
+ "grad_norm": 1.643606185913086,
232
+ "learning_rate": 0.000155,
233
+ "loss": 0.3973,
234
+ "step": 32
235
+ },
236
+ {
237
+ "epoch": 0.03433922996878252,
238
+ "grad_norm": 1.27973473072052,
239
+ "learning_rate": 0.00016,
240
+ "loss": 0.3601,
241
+ "step": 33
242
+ },
243
+ {
244
+ "epoch": 0.03537981269510926,
245
+ "grad_norm": 1.3652054071426392,
246
+ "learning_rate": 0.000165,
247
+ "loss": 0.4557,
248
+ "step": 34
249
+ },
250
+ {
251
+ "epoch": 0.036420395421436005,
252
+ "grad_norm": 1.2647119760513306,
253
+ "learning_rate": 0.00017,
254
+ "loss": 0.3723,
255
+ "step": 35
256
+ },
257
+ {
258
+ "epoch": 0.037460978147762745,
259
+ "grad_norm": 1.2717779874801636,
260
+ "learning_rate": 0.000175,
261
+ "loss": 0.3429,
262
+ "step": 36
263
+ },
264
+ {
265
+ "epoch": 0.03850156087408949,
266
+ "grad_norm": 1.7270296812057495,
267
+ "learning_rate": 0.00017999999999999998,
268
+ "loss": 0.4089,
269
+ "step": 37
270
+ },
271
+ {
272
+ "epoch": 0.03954214360041623,
273
+ "grad_norm": 1.5404200553894043,
274
+ "learning_rate": 0.000185,
275
+ "loss": 0.3764,
276
+ "step": 38
277
+ },
278
+ {
279
+ "epoch": 0.04058272632674298,
280
+ "grad_norm": 1.1958752870559692,
281
+ "learning_rate": 0.00019,
282
+ "loss": 0.375,
283
+ "step": 39
284
+ },
285
+ {
286
+ "epoch": 0.04162330905306972,
287
+ "grad_norm": 1.4304900169372559,
288
+ "learning_rate": 0.00019500000000000002,
289
+ "loss": 0.3802,
290
+ "step": 40
291
+ },
292
+ {
293
+ "epoch": 0.04266389177939646,
294
+ "grad_norm": 1.654426097869873,
295
+ "learning_rate": 0.0002,
296
+ "loss": 0.2566,
297
+ "step": 41
298
+ },
299
+ {
300
+ "epoch": 0.043704474505723206,
301
+ "grad_norm": 1.7565494775772095,
302
+ "learning_rate": 0.000205,
303
+ "loss": 0.3105,
304
+ "step": 42
305
+ },
306
+ {
307
+ "epoch": 0.044745057232049947,
308
+ "grad_norm": 2.055324077606201,
309
+ "learning_rate": 0.00021,
310
+ "loss": 0.3233,
311
+ "step": 43
312
+ },
313
+ {
314
+ "epoch": 0.045785639958376693,
315
+ "grad_norm": 1.283117651939392,
316
+ "learning_rate": 0.000215,
317
+ "loss": 0.3023,
318
+ "step": 44
319
+ },
320
+ {
321
+ "epoch": 0.046826222684703434,
322
+ "grad_norm": 1.292840838432312,
323
+ "learning_rate": 0.00022,
324
+ "loss": 0.2821,
325
+ "step": 45
326
+ },
327
+ {
328
+ "epoch": 0.047866805411030174,
329
+ "grad_norm": 1.0345746278762817,
330
+ "learning_rate": 0.00022500000000000002,
331
+ "loss": 0.2539,
332
+ "step": 46
333
+ },
334
+ {
335
+ "epoch": 0.04890738813735692,
336
+ "grad_norm": 1.0240848064422607,
337
+ "learning_rate": 0.00023,
338
+ "loss": 0.3298,
339
+ "step": 47
340
+ },
341
+ {
342
+ "epoch": 0.04994797086368366,
343
+ "grad_norm": 1.7957828044891357,
344
+ "learning_rate": 0.000235,
345
+ "loss": 0.205,
346
+ "step": 48
347
+ },
348
+ {
349
+ "epoch": 0.05098855359001041,
350
+ "grad_norm": 1.3810360431671143,
351
+ "learning_rate": 0.00024,
352
+ "loss": 0.2919,
353
+ "step": 49
354
+ },
355
+ {
356
+ "epoch": 0.05202913631633715,
357
+ "grad_norm": 0.8331364393234253,
358
+ "learning_rate": 0.000245,
359
+ "loss": 0.1943,
360
+ "step": 50
361
+ },
362
+ {
363
+ "epoch": 0.053069719042663895,
364
+ "grad_norm": 1.213149070739746,
365
+ "learning_rate": 0.00025,
366
+ "loss": 0.3011,
367
+ "step": 51
368
+ },
369
+ {
370
+ "epoch": 0.054110301768990635,
371
+ "grad_norm": 0.9544571042060852,
372
+ "learning_rate": 0.000255,
373
+ "loss": 0.3511,
374
+ "step": 52
375
+ },
376
+ {
377
+ "epoch": 0.055150884495317375,
378
+ "grad_norm": 0.9204476475715637,
379
+ "learning_rate": 0.00026000000000000003,
380
+ "loss": 0.2048,
381
+ "step": 53
382
+ },
383
+ {
384
+ "epoch": 0.05619146722164412,
385
+ "grad_norm": 1.7272144556045532,
386
+ "learning_rate": 0.00026500000000000004,
387
+ "loss": 0.2715,
388
+ "step": 54
389
+ },
390
+ {
391
+ "epoch": 0.05723204994797086,
392
+ "grad_norm": 0.891767680644989,
393
+ "learning_rate": 0.00027,
394
+ "loss": 0.2116,
395
+ "step": 55
396
+ },
397
+ {
398
+ "epoch": 0.05827263267429761,
399
+ "grad_norm": 0.8020220398902893,
400
+ "learning_rate": 0.000275,
401
+ "loss": 0.2101,
402
+ "step": 56
403
+ },
404
+ {
405
+ "epoch": 0.05931321540062435,
406
+ "grad_norm": 1.2897636890411377,
407
+ "learning_rate": 0.00028000000000000003,
408
+ "loss": 0.242,
409
+ "step": 57
410
+ },
411
+ {
412
+ "epoch": 0.060353798126951096,
413
+ "grad_norm": 2.2333452701568604,
414
+ "learning_rate": 0.000285,
415
+ "loss": 0.3461,
416
+ "step": 58
417
+ },
418
+ {
419
+ "epoch": 0.061394380853277836,
420
+ "grad_norm": 1.124709963798523,
421
+ "learning_rate": 0.00029,
422
+ "loss": 0.1709,
423
+ "step": 59
424
+ },
425
+ {
426
+ "epoch": 0.062434963579604576,
427
+ "grad_norm": 0.7170735001564026,
428
+ "learning_rate": 0.000295,
429
+ "loss": 0.1954,
430
+ "step": 60
431
+ },
432
+ {
433
+ "epoch": 0.06347554630593132,
434
+ "grad_norm": 1.3257620334625244,
435
+ "learning_rate": 0.0003,
436
+ "loss": 0.2816,
437
+ "step": 61
438
+ },
439
+ {
440
+ "epoch": 0.06451612903225806,
441
+ "grad_norm": 0.7642104029655457,
442
+ "learning_rate": 0.000305,
443
+ "loss": 0.1788,
444
+ "step": 62
445
+ },
446
+ {
447
+ "epoch": 0.06555671175858481,
448
+ "grad_norm": 0.9636558890342712,
449
+ "learning_rate": 0.00031,
450
+ "loss": 0.2138,
451
+ "step": 63
452
+ },
453
+ {
454
+ "epoch": 0.06659729448491156,
455
+ "grad_norm": 0.7231699228286743,
456
+ "learning_rate": 0.000315,
457
+ "loss": 0.19,
458
+ "step": 64
459
+ },
460
+ {
461
+ "epoch": 0.06763787721123829,
462
+ "grad_norm": 0.9044433236122131,
463
+ "learning_rate": 0.00032,
464
+ "loss": 0.1863,
465
+ "step": 65
466
+ },
467
+ {
468
+ "epoch": 0.06867845993756504,
469
+ "grad_norm": 0.6787164807319641,
470
+ "learning_rate": 0.00032500000000000004,
471
+ "loss": 0.1615,
472
+ "step": 66
473
+ },
474
+ {
475
+ "epoch": 0.06971904266389178,
476
+ "grad_norm": 0.6610997915267944,
477
+ "learning_rate": 0.00033,
478
+ "loss": 0.1777,
479
+ "step": 67
480
+ },
481
+ {
482
+ "epoch": 0.07075962539021852,
483
+ "grad_norm": 0.8359801173210144,
484
+ "learning_rate": 0.000335,
485
+ "loss": 0.238,
486
+ "step": 68
487
+ },
488
+ {
489
+ "epoch": 0.07180020811654526,
490
+ "grad_norm": 0.7294996976852417,
491
+ "learning_rate": 0.00034,
492
+ "loss": 0.2018,
493
+ "step": 69
494
+ },
495
+ {
496
+ "epoch": 0.07284079084287201,
497
+ "grad_norm": 0.7325947880744934,
498
+ "learning_rate": 0.000345,
499
+ "loss": 0.1372,
500
+ "step": 70
501
+ },
502
+ {
503
+ "epoch": 0.07388137356919876,
504
+ "grad_norm": 0.7132765650749207,
505
+ "learning_rate": 0.00035,
506
+ "loss": 0.1951,
507
+ "step": 71
508
+ },
509
+ {
510
+ "epoch": 0.07492195629552549,
511
+ "grad_norm": 1.1800177097320557,
512
+ "learning_rate": 0.000355,
513
+ "loss": 0.2546,
514
+ "step": 72
515
+ },
516
+ {
517
+ "epoch": 0.07596253902185224,
518
+ "grad_norm": 1.0050599575042725,
519
+ "learning_rate": 0.00035999999999999997,
520
+ "loss": 0.189,
521
+ "step": 73
522
+ },
523
+ {
524
+ "epoch": 0.07700312174817898,
525
+ "grad_norm": 0.7532162070274353,
526
+ "learning_rate": 0.000365,
527
+ "loss": 0.1276,
528
+ "step": 74
529
+ },
530
+ {
531
+ "epoch": 0.07804370447450572,
532
+ "grad_norm": 0.8199287056922913,
533
+ "learning_rate": 0.00037,
534
+ "loss": 0.2116,
535
+ "step": 75
536
+ },
537
+ {
538
+ "epoch": 0.07908428720083246,
539
+ "grad_norm": 0.8740005493164062,
540
+ "learning_rate": 0.000375,
541
+ "loss": 0.1754,
542
+ "step": 76
543
+ },
544
+ {
545
+ "epoch": 0.08012486992715921,
546
+ "grad_norm": 0.6971861124038696,
547
+ "learning_rate": 0.00038,
548
+ "loss": 0.1799,
549
+ "step": 77
550
+ },
551
+ {
552
+ "epoch": 0.08116545265348596,
553
+ "grad_norm": 0.6992635726928711,
554
+ "learning_rate": 0.00038500000000000003,
555
+ "loss": 0.1663,
556
+ "step": 78
557
+ },
558
+ {
559
+ "epoch": 0.08220603537981269,
560
+ "grad_norm": 0.8527954816818237,
561
+ "learning_rate": 0.00039000000000000005,
562
+ "loss": 0.1676,
563
+ "step": 79
564
+ },
565
+ {
566
+ "epoch": 0.08324661810613944,
567
+ "grad_norm": 0.7233165502548218,
568
+ "learning_rate": 0.000395,
569
+ "loss": 0.1635,
570
+ "step": 80
571
+ },
572
+ {
573
+ "epoch": 0.08428720083246619,
574
+ "grad_norm": 1.2006125450134277,
575
+ "learning_rate": 0.0004,
576
+ "loss": 0.1902,
577
+ "step": 81
578
+ },
579
+ {
580
+ "epoch": 0.08532778355879292,
581
+ "grad_norm": 0.6341950297355652,
582
+ "learning_rate": 0.00040500000000000003,
583
+ "loss": 0.1396,
584
+ "step": 82
585
+ },
586
+ {
587
+ "epoch": 0.08636836628511967,
588
+ "grad_norm": 0.670028030872345,
589
+ "learning_rate": 0.00041,
590
+ "loss": 0.162,
591
+ "step": 83
592
+ },
593
+ {
594
+ "epoch": 0.08740894901144641,
595
+ "grad_norm": 0.6362585425376892,
596
+ "learning_rate": 0.000415,
597
+ "loss": 0.155,
598
+ "step": 84
599
+ },
600
+ {
601
+ "epoch": 0.08844953173777315,
602
+ "grad_norm": 0.7975156307220459,
603
+ "learning_rate": 0.00042,
604
+ "loss": 0.1264,
605
+ "step": 85
606
+ },
607
+ {
608
+ "epoch": 0.08949011446409989,
609
+ "grad_norm": 0.5603007078170776,
610
+ "learning_rate": 0.000425,
611
+ "loss": 0.1505,
612
+ "step": 86
613
+ },
614
+ {
615
+ "epoch": 0.09053069719042664,
616
+ "grad_norm": 0.515308141708374,
617
+ "learning_rate": 0.00043,
618
+ "loss": 0.1364,
619
+ "step": 87
620
+ },
621
+ {
622
+ "epoch": 0.09157127991675339,
623
+ "grad_norm": 0.6081110239028931,
624
+ "learning_rate": 0.000435,
625
+ "loss": 0.1428,
626
+ "step": 88
627
+ },
628
+ {
629
+ "epoch": 0.09261186264308012,
630
+ "grad_norm": 0.5383463501930237,
631
+ "learning_rate": 0.00044,
632
+ "loss": 0.1293,
633
+ "step": 89
634
+ },
635
+ {
636
+ "epoch": 0.09365244536940687,
637
+ "grad_norm": 0.659436047077179,
638
+ "learning_rate": 0.00044500000000000003,
639
+ "loss": 0.1475,
640
+ "step": 90
641
+ },
642
+ {
643
+ "epoch": 0.09469302809573361,
644
+ "grad_norm": 0.5411190390586853,
645
+ "learning_rate": 0.00045000000000000004,
646
+ "loss": 0.1408,
647
+ "step": 91
648
+ },
649
+ {
650
+ "epoch": 0.09573361082206035,
651
+ "grad_norm": 0.6518479585647583,
652
+ "learning_rate": 0.000455,
653
+ "loss": 0.1576,
654
+ "step": 92
655
+ },
656
+ {
657
+ "epoch": 0.0967741935483871,
658
+ "grad_norm": 0.5494299530982971,
659
+ "learning_rate": 0.00046,
660
+ "loss": 0.1099,
661
+ "step": 93
662
+ },
663
+ {
664
+ "epoch": 0.09781477627471384,
665
+ "grad_norm": 0.8132746815681458,
666
+ "learning_rate": 0.000465,
667
+ "loss": 0.1636,
668
+ "step": 94
669
+ },
670
+ {
671
+ "epoch": 0.09885535900104059,
672
+ "grad_norm": 0.5652503371238708,
673
+ "learning_rate": 0.00047,
674
+ "loss": 0.1595,
675
+ "step": 95
676
+ },
677
+ {
678
+ "epoch": 0.09989594172736732,
679
+ "grad_norm": 0.61795973777771,
680
+ "learning_rate": 0.000475,
681
+ "loss": 0.0745,
682
+ "step": 96
683
+ },
684
+ {
685
+ "epoch": 0.10093652445369407,
686
+ "grad_norm": 0.4944301247596741,
687
+ "learning_rate": 0.00048,
688
+ "loss": 0.1406,
689
+ "step": 97
690
+ },
691
+ {
692
+ "epoch": 0.10197710718002082,
693
+ "grad_norm": 0.5052417516708374,
694
+ "learning_rate": 0.00048499999999999997,
695
+ "loss": 0.104,
696
+ "step": 98
697
+ },
698
+ {
699
+ "epoch": 0.10301768990634755,
700
+ "grad_norm": 0.46198371052742004,
701
+ "learning_rate": 0.00049,
702
+ "loss": 0.0883,
703
+ "step": 99
704
+ },
705
+ {
706
+ "epoch": 0.1040582726326743,
707
+ "grad_norm": 0.6346387267112732,
708
+ "learning_rate": 0.000495,
709
+ "loss": 0.154,
710
+ "step": 100
711
+ }
712
+ ],
713
+ "logging_steps": 1,
714
+ "max_steps": 1000,
715
+ "num_input_tokens_seen": 0,
716
+ "num_train_epochs": 2,
717
+ "save_steps": 100,
718
+ "stateful_callbacks": {
719
+ "TrainerControl": {
720
+ "args": {
721
+ "should_epoch_stop": false,
722
+ "should_evaluate": false,
723
+ "should_log": false,
724
+ "should_save": true,
725
+ "should_training_stop": false
726
+ },
727
+ "attributes": {}
728
+ }
729
+ },
730
+ "total_flos": 0.0,
731
+ "train_batch_size": 256,
732
+ "trial_name": null,
733
+ "trial_params": null
734
+ }
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-100/vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-500/added_tokens.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "</tool_call>": 151658,
3
+ "<tool_call>": 151657,
4
+ "<|box_end|>": 151649,
5
+ "<|box_start|>": 151648,
6
+ "<|endoftext|>": 151643,
7
+ "<|file_sep|>": 151664,
8
+ "<|fim_middle|>": 151660,
9
+ "<|fim_pad|>": 151662,
10
+ "<|fim_prefix|>": 151659,
11
+ "<|fim_suffix|>": 151661,
12
+ "<|im_end|>": 151645,
13
+ "<|im_start|>": 151644,
14
+ "<|image_pad|>": 151655,
15
+ "<|object_ref_end|>": 151647,
16
+ "<|object_ref_start|>": 151646,
17
+ "<|quad_end|>": 151651,
18
+ "<|quad_start|>": 151650,
19
+ "<|repo_name|>": 151663,
20
+ "<|video_pad|>": 151656,
21
+ "<|vision_end|>": 151653,
22
+ "<|vision_pad|>": 151654,
23
+ "<|vision_start|>": 151652
24
+ }
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-500/chat_template.jinja ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system
2
+ You are a helpful assistant.<|im_end|>
3
+ {% endif %}<|im_start|>{{ message['role'] }}
4
+ {% if message['content'] is string %}{{ message['content'] }}<|im_end|>
5
+ {% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>
6
+ {% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant
7
+ {% endif %}
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-500/preprocessor_config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_convert_rgb": true,
3
+ "do_normalize": true,
4
+ "do_rescale": true,
5
+ "do_resize": true,
6
+ "image_mean": [
7
+ 0.48145466,
8
+ 0.4578275,
9
+ 0.40821073
10
+ ],
11
+ "image_processor_type": "Qwen2_5_VLImageProcessor",
12
+ "image_std": [
13
+ 0.26862954,
14
+ 0.26130258,
15
+ 0.27577711
16
+ ],
17
+ "max_pixels": 1003520,
18
+ "merge_size": 2,
19
+ "min_pixels": 3136,
20
+ "patch_size": 14,
21
+ "processor_class": "Qwen2_5_VLProcessor",
22
+ "resample": 3,
23
+ "rescale_factor": 0.00392156862745098,
24
+ "size": {
25
+ "max_pixels": 1003520,
26
+ "min_pixels": 3136
27
+ },
28
+ "temporal_patch_size": 2
29
+ }
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-500/special_tokens_map.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<|im_start|>",
4
+ "<|im_end|>",
5
+ "<|object_ref_start|>",
6
+ "<|object_ref_end|>",
7
+ "<|box_start|>",
8
+ "<|box_end|>",
9
+ "<|quad_start|>",
10
+ "<|quad_end|>",
11
+ "<|vision_start|>",
12
+ "<|vision_end|>",
13
+ "<|vision_pad|>",
14
+ "<|image_pad|>",
15
+ "<|video_pad|>"
16
+ ],
17
+ "eos_token": {
18
+ "content": "<|im_end|>",
19
+ "lstrip": false,
20
+ "normalized": false,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ },
24
+ "pad_token": {
25
+ "content": "<|endoftext|>",
26
+ "lstrip": false,
27
+ "normalized": false,
28
+ "rstrip": false,
29
+ "single_word": false
30
+ }
31
+ }
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-500/tokenizer_config.json ADDED
@@ -0,0 +1,208 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": false,
3
+ "add_prefix_space": false,
4
+ "added_tokens_decoder": {
5
+ "151643": {
6
+ "content": "<|endoftext|>",
7
+ "lstrip": false,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false,
11
+ "special": true
12
+ },
13
+ "151644": {
14
+ "content": "<|im_start|>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false,
19
+ "special": true
20
+ },
21
+ "151645": {
22
+ "content": "<|im_end|>",
23
+ "lstrip": false,
24
+ "normalized": false,
25
+ "rstrip": false,
26
+ "single_word": false,
27
+ "special": true
28
+ },
29
+ "151646": {
30
+ "content": "<|object_ref_start|>",
31
+ "lstrip": false,
32
+ "normalized": false,
33
+ "rstrip": false,
34
+ "single_word": false,
35
+ "special": true
36
+ },
37
+ "151647": {
38
+ "content": "<|object_ref_end|>",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false,
43
+ "special": true
44
+ },
45
+ "151648": {
46
+ "content": "<|box_start|>",
47
+ "lstrip": false,
48
+ "normalized": false,
49
+ "rstrip": false,
50
+ "single_word": false,
51
+ "special": true
52
+ },
53
+ "151649": {
54
+ "content": "<|box_end|>",
55
+ "lstrip": false,
56
+ "normalized": false,
57
+ "rstrip": false,
58
+ "single_word": false,
59
+ "special": true
60
+ },
61
+ "151650": {
62
+ "content": "<|quad_start|>",
63
+ "lstrip": false,
64
+ "normalized": false,
65
+ "rstrip": false,
66
+ "single_word": false,
67
+ "special": true
68
+ },
69
+ "151651": {
70
+ "content": "<|quad_end|>",
71
+ "lstrip": false,
72
+ "normalized": false,
73
+ "rstrip": false,
74
+ "single_word": false,
75
+ "special": true
76
+ },
77
+ "151652": {
78
+ "content": "<|vision_start|>",
79
+ "lstrip": false,
80
+ "normalized": false,
81
+ "rstrip": false,
82
+ "single_word": false,
83
+ "special": true
84
+ },
85
+ "151653": {
86
+ "content": "<|vision_end|>",
87
+ "lstrip": false,
88
+ "normalized": false,
89
+ "rstrip": false,
90
+ "single_word": false,
91
+ "special": true
92
+ },
93
+ "151654": {
94
+ "content": "<|vision_pad|>",
95
+ "lstrip": false,
96
+ "normalized": false,
97
+ "rstrip": false,
98
+ "single_word": false,
99
+ "special": true
100
+ },
101
+ "151655": {
102
+ "content": "<|image_pad|>",
103
+ "lstrip": false,
104
+ "normalized": false,
105
+ "rstrip": false,
106
+ "single_word": false,
107
+ "special": true
108
+ },
109
+ "151656": {
110
+ "content": "<|video_pad|>",
111
+ "lstrip": false,
112
+ "normalized": false,
113
+ "rstrip": false,
114
+ "single_word": false,
115
+ "special": true
116
+ },
117
+ "151657": {
118
+ "content": "<tool_call>",
119
+ "lstrip": false,
120
+ "normalized": false,
121
+ "rstrip": false,
122
+ "single_word": false,
123
+ "special": false
124
+ },
125
+ "151658": {
126
+ "content": "</tool_call>",
127
+ "lstrip": false,
128
+ "normalized": false,
129
+ "rstrip": false,
130
+ "single_word": false,
131
+ "special": false
132
+ },
133
+ "151659": {
134
+ "content": "<|fim_prefix|>",
135
+ "lstrip": false,
136
+ "normalized": false,
137
+ "rstrip": false,
138
+ "single_word": false,
139
+ "special": false
140
+ },
141
+ "151660": {
142
+ "content": "<|fim_middle|>",
143
+ "lstrip": false,
144
+ "normalized": false,
145
+ "rstrip": false,
146
+ "single_word": false,
147
+ "special": false
148
+ },
149
+ "151661": {
150
+ "content": "<|fim_suffix|>",
151
+ "lstrip": false,
152
+ "normalized": false,
153
+ "rstrip": false,
154
+ "single_word": false,
155
+ "special": false
156
+ },
157
+ "151662": {
158
+ "content": "<|fim_pad|>",
159
+ "lstrip": false,
160
+ "normalized": false,
161
+ "rstrip": false,
162
+ "single_word": false,
163
+ "special": false
164
+ },
165
+ "151663": {
166
+ "content": "<|repo_name|>",
167
+ "lstrip": false,
168
+ "normalized": false,
169
+ "rstrip": false,
170
+ "single_word": false,
171
+ "special": false
172
+ },
173
+ "151664": {
174
+ "content": "<|file_sep|>",
175
+ "lstrip": false,
176
+ "normalized": false,
177
+ "rstrip": false,
178
+ "single_word": false,
179
+ "special": false
180
+ }
181
+ },
182
+ "additional_special_tokens": [
183
+ "<|im_start|>",
184
+ "<|im_end|>",
185
+ "<|object_ref_start|>",
186
+ "<|object_ref_end|>",
187
+ "<|box_start|>",
188
+ "<|box_end|>",
189
+ "<|quad_start|>",
190
+ "<|quad_end|>",
191
+ "<|vision_start|>",
192
+ "<|vision_end|>",
193
+ "<|vision_pad|>",
194
+ "<|image_pad|>",
195
+ "<|video_pad|>"
196
+ ],
197
+ "bos_token": null,
198
+ "clean_up_tokenization_spaces": false,
199
+ "eos_token": "<|im_end|>",
200
+ "errors": "replace",
201
+ "extra_special_tokens": {},
202
+ "model_max_length": 131072,
203
+ "pad_token": "<|endoftext|>",
204
+ "processor_class": "Qwen2_5_VLProcessor",
205
+ "split_special_tokens": false,
206
+ "tokenizer_class": "Qwen2Tokenizer",
207
+ "unk_token": null
208
+ }
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/checkpoint-500/trainer_state.json ADDED
@@ -0,0 +1,3534 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 0.5202913631633714,
6
+ "eval_steps": 500,
7
+ "global_step": 500,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.001040582726326743,
14
+ "grad_norm": 3.268874406814575,
15
+ "learning_rate": 0.0,
16
+ "loss": 0.6993,
17
+ "step": 1
18
+ },
19
+ {
20
+ "epoch": 0.002081165452653486,
21
+ "grad_norm": 3.8206846714019775,
22
+ "learning_rate": 5e-06,
23
+ "loss": 0.815,
24
+ "step": 2
25
+ },
26
+ {
27
+ "epoch": 0.003121748178980229,
28
+ "grad_norm": 3.077709436416626,
29
+ "learning_rate": 1e-05,
30
+ "loss": 0.758,
31
+ "step": 3
32
+ },
33
+ {
34
+ "epoch": 0.004162330905306972,
35
+ "grad_norm": 2.903688430786133,
36
+ "learning_rate": 1.5e-05,
37
+ "loss": 0.6332,
38
+ "step": 4
39
+ },
40
+ {
41
+ "epoch": 0.005202913631633715,
42
+ "grad_norm": 2.8597545623779297,
43
+ "learning_rate": 2e-05,
44
+ "loss": 0.7086,
45
+ "step": 5
46
+ },
47
+ {
48
+ "epoch": 0.006243496357960458,
49
+ "grad_norm": 3.6181485652923584,
50
+ "learning_rate": 2.5e-05,
51
+ "loss": 0.8511,
52
+ "step": 6
53
+ },
54
+ {
55
+ "epoch": 0.007284079084287201,
56
+ "grad_norm": 5.016982555389404,
57
+ "learning_rate": 3e-05,
58
+ "loss": 1.0901,
59
+ "step": 7
60
+ },
61
+ {
62
+ "epoch": 0.008324661810613945,
63
+ "grad_norm": 2.217885971069336,
64
+ "learning_rate": 3.5000000000000004e-05,
65
+ "loss": 0.5426,
66
+ "step": 8
67
+ },
68
+ {
69
+ "epoch": 0.009365244536940686,
70
+ "grad_norm": 2.0818731784820557,
71
+ "learning_rate": 4e-05,
72
+ "loss": 0.4986,
73
+ "step": 9
74
+ },
75
+ {
76
+ "epoch": 0.01040582726326743,
77
+ "grad_norm": 1.9352552890777588,
78
+ "learning_rate": 4.4999999999999996e-05,
79
+ "loss": 0.5358,
80
+ "step": 10
81
+ },
82
+ {
83
+ "epoch": 0.011446409989594173,
84
+ "grad_norm": 3.7815799713134766,
85
+ "learning_rate": 5e-05,
86
+ "loss": 0.877,
87
+ "step": 11
88
+ },
89
+ {
90
+ "epoch": 0.012486992715920915,
91
+ "grad_norm": 2.989179849624634,
92
+ "learning_rate": 5.5e-05,
93
+ "loss": 0.6389,
94
+ "step": 12
95
+ },
96
+ {
97
+ "epoch": 0.013527575442247659,
98
+ "grad_norm": 3.6533756256103516,
99
+ "learning_rate": 6e-05,
100
+ "loss": 0.7697,
101
+ "step": 13
102
+ },
103
+ {
104
+ "epoch": 0.014568158168574402,
105
+ "grad_norm": 2.5273356437683105,
106
+ "learning_rate": 6.500000000000001e-05,
107
+ "loss": 0.4582,
108
+ "step": 14
109
+ },
110
+ {
111
+ "epoch": 0.015608740894901144,
112
+ "grad_norm": 2.0315494537353516,
113
+ "learning_rate": 7.000000000000001e-05,
114
+ "loss": 0.4683,
115
+ "step": 15
116
+ },
117
+ {
118
+ "epoch": 0.01664932362122789,
119
+ "grad_norm": 1.3862802982330322,
120
+ "learning_rate": 7.5e-05,
121
+ "loss": 0.401,
122
+ "step": 16
123
+ },
124
+ {
125
+ "epoch": 0.01768990634755463,
126
+ "grad_norm": 3.2270781993865967,
127
+ "learning_rate": 8e-05,
128
+ "loss": 0.6733,
129
+ "step": 17
130
+ },
131
+ {
132
+ "epoch": 0.018730489073881373,
133
+ "grad_norm": 2.966115713119507,
134
+ "learning_rate": 8.5e-05,
135
+ "loss": 0.6105,
136
+ "step": 18
137
+ },
138
+ {
139
+ "epoch": 0.019771071800208116,
140
+ "grad_norm": 2.720820188522339,
141
+ "learning_rate": 8.999999999999999e-05,
142
+ "loss": 0.5462,
143
+ "step": 19
144
+ },
145
+ {
146
+ "epoch": 0.02081165452653486,
147
+ "grad_norm": 2.2214956283569336,
148
+ "learning_rate": 9.5e-05,
149
+ "loss": 0.5125,
150
+ "step": 20
151
+ },
152
+ {
153
+ "epoch": 0.021852237252861603,
154
+ "grad_norm": 2.2020890712738037,
155
+ "learning_rate": 0.0001,
156
+ "loss": 0.4953,
157
+ "step": 21
158
+ },
159
+ {
160
+ "epoch": 0.022892819979188347,
161
+ "grad_norm": 2.2625033855438232,
162
+ "learning_rate": 0.000105,
163
+ "loss": 0.5628,
164
+ "step": 22
165
+ },
166
+ {
167
+ "epoch": 0.023933402705515087,
168
+ "grad_norm": 2.223475933074951,
169
+ "learning_rate": 0.00011,
170
+ "loss": 0.5667,
171
+ "step": 23
172
+ },
173
+ {
174
+ "epoch": 0.02497398543184183,
175
+ "grad_norm": 2.982874631881714,
176
+ "learning_rate": 0.000115,
177
+ "loss": 0.6645,
178
+ "step": 24
179
+ },
180
+ {
181
+ "epoch": 0.026014568158168574,
182
+ "grad_norm": 2.5550947189331055,
183
+ "learning_rate": 0.00012,
184
+ "loss": 0.4668,
185
+ "step": 25
186
+ },
187
+ {
188
+ "epoch": 0.027055150884495317,
189
+ "grad_norm": 2.805063486099243,
190
+ "learning_rate": 0.000125,
191
+ "loss": 0.5205,
192
+ "step": 26
193
+ },
194
+ {
195
+ "epoch": 0.02809573361082206,
196
+ "grad_norm": 1.7745788097381592,
197
+ "learning_rate": 0.00013000000000000002,
198
+ "loss": 0.3622,
199
+ "step": 27
200
+ },
201
+ {
202
+ "epoch": 0.029136316337148804,
203
+ "grad_norm": 1.6776342391967773,
204
+ "learning_rate": 0.000135,
205
+ "loss": 0.3641,
206
+ "step": 28
207
+ },
208
+ {
209
+ "epoch": 0.030176899063475548,
210
+ "grad_norm": 2.4569647312164307,
211
+ "learning_rate": 0.00014000000000000001,
212
+ "loss": 0.5263,
213
+ "step": 29
214
+ },
215
+ {
216
+ "epoch": 0.031217481789802288,
217
+ "grad_norm": 1.2685638666152954,
218
+ "learning_rate": 0.000145,
219
+ "loss": 0.3199,
220
+ "step": 30
221
+ },
222
+ {
223
+ "epoch": 0.03225806451612903,
224
+ "grad_norm": 1.3093715906143188,
225
+ "learning_rate": 0.00015,
226
+ "loss": 0.4389,
227
+ "step": 31
228
+ },
229
+ {
230
+ "epoch": 0.03329864724245578,
231
+ "grad_norm": 1.643606185913086,
232
+ "learning_rate": 0.000155,
233
+ "loss": 0.3973,
234
+ "step": 32
235
+ },
236
+ {
237
+ "epoch": 0.03433922996878252,
238
+ "grad_norm": 1.27973473072052,
239
+ "learning_rate": 0.00016,
240
+ "loss": 0.3601,
241
+ "step": 33
242
+ },
243
+ {
244
+ "epoch": 0.03537981269510926,
245
+ "grad_norm": 1.3652054071426392,
246
+ "learning_rate": 0.000165,
247
+ "loss": 0.4557,
248
+ "step": 34
249
+ },
250
+ {
251
+ "epoch": 0.036420395421436005,
252
+ "grad_norm": 1.2647119760513306,
253
+ "learning_rate": 0.00017,
254
+ "loss": 0.3723,
255
+ "step": 35
256
+ },
257
+ {
258
+ "epoch": 0.037460978147762745,
259
+ "grad_norm": 1.2717779874801636,
260
+ "learning_rate": 0.000175,
261
+ "loss": 0.3429,
262
+ "step": 36
263
+ },
264
+ {
265
+ "epoch": 0.03850156087408949,
266
+ "grad_norm": 1.7270296812057495,
267
+ "learning_rate": 0.00017999999999999998,
268
+ "loss": 0.4089,
269
+ "step": 37
270
+ },
271
+ {
272
+ "epoch": 0.03954214360041623,
273
+ "grad_norm": 1.5404200553894043,
274
+ "learning_rate": 0.000185,
275
+ "loss": 0.3764,
276
+ "step": 38
277
+ },
278
+ {
279
+ "epoch": 0.04058272632674298,
280
+ "grad_norm": 1.1958752870559692,
281
+ "learning_rate": 0.00019,
282
+ "loss": 0.375,
283
+ "step": 39
284
+ },
285
+ {
286
+ "epoch": 0.04162330905306972,
287
+ "grad_norm": 1.4304900169372559,
288
+ "learning_rate": 0.00019500000000000002,
289
+ "loss": 0.3802,
290
+ "step": 40
291
+ },
292
+ {
293
+ "epoch": 0.04266389177939646,
294
+ "grad_norm": 1.654426097869873,
295
+ "learning_rate": 0.0002,
296
+ "loss": 0.2566,
297
+ "step": 41
298
+ },
299
+ {
300
+ "epoch": 0.043704474505723206,
301
+ "grad_norm": 1.7565494775772095,
302
+ "learning_rate": 0.000205,
303
+ "loss": 0.3105,
304
+ "step": 42
305
+ },
306
+ {
307
+ "epoch": 0.044745057232049947,
308
+ "grad_norm": 2.055324077606201,
309
+ "learning_rate": 0.00021,
310
+ "loss": 0.3233,
311
+ "step": 43
312
+ },
313
+ {
314
+ "epoch": 0.045785639958376693,
315
+ "grad_norm": 1.283117651939392,
316
+ "learning_rate": 0.000215,
317
+ "loss": 0.3023,
318
+ "step": 44
319
+ },
320
+ {
321
+ "epoch": 0.046826222684703434,
322
+ "grad_norm": 1.292840838432312,
323
+ "learning_rate": 0.00022,
324
+ "loss": 0.2821,
325
+ "step": 45
326
+ },
327
+ {
328
+ "epoch": 0.047866805411030174,
329
+ "grad_norm": 1.0345746278762817,
330
+ "learning_rate": 0.00022500000000000002,
331
+ "loss": 0.2539,
332
+ "step": 46
333
+ },
334
+ {
335
+ "epoch": 0.04890738813735692,
336
+ "grad_norm": 1.0240848064422607,
337
+ "learning_rate": 0.00023,
338
+ "loss": 0.3298,
339
+ "step": 47
340
+ },
341
+ {
342
+ "epoch": 0.04994797086368366,
343
+ "grad_norm": 1.7957828044891357,
344
+ "learning_rate": 0.000235,
345
+ "loss": 0.205,
346
+ "step": 48
347
+ },
348
+ {
349
+ "epoch": 0.05098855359001041,
350
+ "grad_norm": 1.3810360431671143,
351
+ "learning_rate": 0.00024,
352
+ "loss": 0.2919,
353
+ "step": 49
354
+ },
355
+ {
356
+ "epoch": 0.05202913631633715,
357
+ "grad_norm": 0.8331364393234253,
358
+ "learning_rate": 0.000245,
359
+ "loss": 0.1943,
360
+ "step": 50
361
+ },
362
+ {
363
+ "epoch": 0.053069719042663895,
364
+ "grad_norm": 1.213149070739746,
365
+ "learning_rate": 0.00025,
366
+ "loss": 0.3011,
367
+ "step": 51
368
+ },
369
+ {
370
+ "epoch": 0.054110301768990635,
371
+ "grad_norm": 0.9544571042060852,
372
+ "learning_rate": 0.000255,
373
+ "loss": 0.3511,
374
+ "step": 52
375
+ },
376
+ {
377
+ "epoch": 0.055150884495317375,
378
+ "grad_norm": 0.9204476475715637,
379
+ "learning_rate": 0.00026000000000000003,
380
+ "loss": 0.2048,
381
+ "step": 53
382
+ },
383
+ {
384
+ "epoch": 0.05619146722164412,
385
+ "grad_norm": 1.7272144556045532,
386
+ "learning_rate": 0.00026500000000000004,
387
+ "loss": 0.2715,
388
+ "step": 54
389
+ },
390
+ {
391
+ "epoch": 0.05723204994797086,
392
+ "grad_norm": 0.891767680644989,
393
+ "learning_rate": 0.00027,
394
+ "loss": 0.2116,
395
+ "step": 55
396
+ },
397
+ {
398
+ "epoch": 0.05827263267429761,
399
+ "grad_norm": 0.8020220398902893,
400
+ "learning_rate": 0.000275,
401
+ "loss": 0.2101,
402
+ "step": 56
403
+ },
404
+ {
405
+ "epoch": 0.05931321540062435,
406
+ "grad_norm": 1.2897636890411377,
407
+ "learning_rate": 0.00028000000000000003,
408
+ "loss": 0.242,
409
+ "step": 57
410
+ },
411
+ {
412
+ "epoch": 0.060353798126951096,
413
+ "grad_norm": 2.2333452701568604,
414
+ "learning_rate": 0.000285,
415
+ "loss": 0.3461,
416
+ "step": 58
417
+ },
418
+ {
419
+ "epoch": 0.061394380853277836,
420
+ "grad_norm": 1.124709963798523,
421
+ "learning_rate": 0.00029,
422
+ "loss": 0.1709,
423
+ "step": 59
424
+ },
425
+ {
426
+ "epoch": 0.062434963579604576,
427
+ "grad_norm": 0.7170735001564026,
428
+ "learning_rate": 0.000295,
429
+ "loss": 0.1954,
430
+ "step": 60
431
+ },
432
+ {
433
+ "epoch": 0.06347554630593132,
434
+ "grad_norm": 1.3257620334625244,
435
+ "learning_rate": 0.0003,
436
+ "loss": 0.2816,
437
+ "step": 61
438
+ },
439
+ {
440
+ "epoch": 0.06451612903225806,
441
+ "grad_norm": 0.7642104029655457,
442
+ "learning_rate": 0.000305,
443
+ "loss": 0.1788,
444
+ "step": 62
445
+ },
446
+ {
447
+ "epoch": 0.06555671175858481,
448
+ "grad_norm": 0.9636558890342712,
449
+ "learning_rate": 0.00031,
450
+ "loss": 0.2138,
451
+ "step": 63
452
+ },
453
+ {
454
+ "epoch": 0.06659729448491156,
455
+ "grad_norm": 0.7231699228286743,
456
+ "learning_rate": 0.000315,
457
+ "loss": 0.19,
458
+ "step": 64
459
+ },
460
+ {
461
+ "epoch": 0.06763787721123829,
462
+ "grad_norm": 0.9044433236122131,
463
+ "learning_rate": 0.00032,
464
+ "loss": 0.1863,
465
+ "step": 65
466
+ },
467
+ {
468
+ "epoch": 0.06867845993756504,
469
+ "grad_norm": 0.6787164807319641,
470
+ "learning_rate": 0.00032500000000000004,
471
+ "loss": 0.1615,
472
+ "step": 66
473
+ },
474
+ {
475
+ "epoch": 0.06971904266389178,
476
+ "grad_norm": 0.6610997915267944,
477
+ "learning_rate": 0.00033,
478
+ "loss": 0.1777,
479
+ "step": 67
480
+ },
481
+ {
482
+ "epoch": 0.07075962539021852,
483
+ "grad_norm": 0.8359801173210144,
484
+ "learning_rate": 0.000335,
485
+ "loss": 0.238,
486
+ "step": 68
487
+ },
488
+ {
489
+ "epoch": 0.07180020811654526,
490
+ "grad_norm": 0.7294996976852417,
491
+ "learning_rate": 0.00034,
492
+ "loss": 0.2018,
493
+ "step": 69
494
+ },
495
+ {
496
+ "epoch": 0.07284079084287201,
497
+ "grad_norm": 0.7325947880744934,
498
+ "learning_rate": 0.000345,
499
+ "loss": 0.1372,
500
+ "step": 70
501
+ },
502
+ {
503
+ "epoch": 0.07388137356919876,
504
+ "grad_norm": 0.7132765650749207,
505
+ "learning_rate": 0.00035,
506
+ "loss": 0.1951,
507
+ "step": 71
508
+ },
509
+ {
510
+ "epoch": 0.07492195629552549,
511
+ "grad_norm": 1.1800177097320557,
512
+ "learning_rate": 0.000355,
513
+ "loss": 0.2546,
514
+ "step": 72
515
+ },
516
+ {
517
+ "epoch": 0.07596253902185224,
518
+ "grad_norm": 1.0050599575042725,
519
+ "learning_rate": 0.00035999999999999997,
520
+ "loss": 0.189,
521
+ "step": 73
522
+ },
523
+ {
524
+ "epoch": 0.07700312174817898,
525
+ "grad_norm": 0.7532162070274353,
526
+ "learning_rate": 0.000365,
527
+ "loss": 0.1276,
528
+ "step": 74
529
+ },
530
+ {
531
+ "epoch": 0.07804370447450572,
532
+ "grad_norm": 0.8199287056922913,
533
+ "learning_rate": 0.00037,
534
+ "loss": 0.2116,
535
+ "step": 75
536
+ },
537
+ {
538
+ "epoch": 0.07908428720083246,
539
+ "grad_norm": 0.8740005493164062,
540
+ "learning_rate": 0.000375,
541
+ "loss": 0.1754,
542
+ "step": 76
543
+ },
544
+ {
545
+ "epoch": 0.08012486992715921,
546
+ "grad_norm": 0.6971861124038696,
547
+ "learning_rate": 0.00038,
548
+ "loss": 0.1799,
549
+ "step": 77
550
+ },
551
+ {
552
+ "epoch": 0.08116545265348596,
553
+ "grad_norm": 0.6992635726928711,
554
+ "learning_rate": 0.00038500000000000003,
555
+ "loss": 0.1663,
556
+ "step": 78
557
+ },
558
+ {
559
+ "epoch": 0.08220603537981269,
560
+ "grad_norm": 0.8527954816818237,
561
+ "learning_rate": 0.00039000000000000005,
562
+ "loss": 0.1676,
563
+ "step": 79
564
+ },
565
+ {
566
+ "epoch": 0.08324661810613944,
567
+ "grad_norm": 0.7233165502548218,
568
+ "learning_rate": 0.000395,
569
+ "loss": 0.1635,
570
+ "step": 80
571
+ },
572
+ {
573
+ "epoch": 0.08428720083246619,
574
+ "grad_norm": 1.2006125450134277,
575
+ "learning_rate": 0.0004,
576
+ "loss": 0.1902,
577
+ "step": 81
578
+ },
579
+ {
580
+ "epoch": 0.08532778355879292,
581
+ "grad_norm": 0.6341950297355652,
582
+ "learning_rate": 0.00040500000000000003,
583
+ "loss": 0.1396,
584
+ "step": 82
585
+ },
586
+ {
587
+ "epoch": 0.08636836628511967,
588
+ "grad_norm": 0.670028030872345,
589
+ "learning_rate": 0.00041,
590
+ "loss": 0.162,
591
+ "step": 83
592
+ },
593
+ {
594
+ "epoch": 0.08740894901144641,
595
+ "grad_norm": 0.6362585425376892,
596
+ "learning_rate": 0.000415,
597
+ "loss": 0.155,
598
+ "step": 84
599
+ },
600
+ {
601
+ "epoch": 0.08844953173777315,
602
+ "grad_norm": 0.7975156307220459,
603
+ "learning_rate": 0.00042,
604
+ "loss": 0.1264,
605
+ "step": 85
606
+ },
607
+ {
608
+ "epoch": 0.08949011446409989,
609
+ "grad_norm": 0.5603007078170776,
610
+ "learning_rate": 0.000425,
611
+ "loss": 0.1505,
612
+ "step": 86
613
+ },
614
+ {
615
+ "epoch": 0.09053069719042664,
616
+ "grad_norm": 0.515308141708374,
617
+ "learning_rate": 0.00043,
618
+ "loss": 0.1364,
619
+ "step": 87
620
+ },
621
+ {
622
+ "epoch": 0.09157127991675339,
623
+ "grad_norm": 0.6081110239028931,
624
+ "learning_rate": 0.000435,
625
+ "loss": 0.1428,
626
+ "step": 88
627
+ },
628
+ {
629
+ "epoch": 0.09261186264308012,
630
+ "grad_norm": 0.5383463501930237,
631
+ "learning_rate": 0.00044,
632
+ "loss": 0.1293,
633
+ "step": 89
634
+ },
635
+ {
636
+ "epoch": 0.09365244536940687,
637
+ "grad_norm": 0.659436047077179,
638
+ "learning_rate": 0.00044500000000000003,
639
+ "loss": 0.1475,
640
+ "step": 90
641
+ },
642
+ {
643
+ "epoch": 0.09469302809573361,
644
+ "grad_norm": 0.5411190390586853,
645
+ "learning_rate": 0.00045000000000000004,
646
+ "loss": 0.1408,
647
+ "step": 91
648
+ },
649
+ {
650
+ "epoch": 0.09573361082206035,
651
+ "grad_norm": 0.6518479585647583,
652
+ "learning_rate": 0.000455,
653
+ "loss": 0.1576,
654
+ "step": 92
655
+ },
656
+ {
657
+ "epoch": 0.0967741935483871,
658
+ "grad_norm": 0.5494299530982971,
659
+ "learning_rate": 0.00046,
660
+ "loss": 0.1099,
661
+ "step": 93
662
+ },
663
+ {
664
+ "epoch": 0.09781477627471384,
665
+ "grad_norm": 0.8132746815681458,
666
+ "learning_rate": 0.000465,
667
+ "loss": 0.1636,
668
+ "step": 94
669
+ },
670
+ {
671
+ "epoch": 0.09885535900104059,
672
+ "grad_norm": 0.5652503371238708,
673
+ "learning_rate": 0.00047,
674
+ "loss": 0.1595,
675
+ "step": 95
676
+ },
677
+ {
678
+ "epoch": 0.09989594172736732,
679
+ "grad_norm": 0.61795973777771,
680
+ "learning_rate": 0.000475,
681
+ "loss": 0.0745,
682
+ "step": 96
683
+ },
684
+ {
685
+ "epoch": 0.10093652445369407,
686
+ "grad_norm": 0.4944301247596741,
687
+ "learning_rate": 0.00048,
688
+ "loss": 0.1406,
689
+ "step": 97
690
+ },
691
+ {
692
+ "epoch": 0.10197710718002082,
693
+ "grad_norm": 0.5052417516708374,
694
+ "learning_rate": 0.00048499999999999997,
695
+ "loss": 0.104,
696
+ "step": 98
697
+ },
698
+ {
699
+ "epoch": 0.10301768990634755,
700
+ "grad_norm": 0.46198371052742004,
701
+ "learning_rate": 0.00049,
702
+ "loss": 0.0883,
703
+ "step": 99
704
+ },
705
+ {
706
+ "epoch": 0.1040582726326743,
707
+ "grad_norm": 0.6346387267112732,
708
+ "learning_rate": 0.000495,
709
+ "loss": 0.154,
710
+ "step": 100
711
+ },
712
+ {
713
+ "epoch": 0.10509885535900104,
714
+ "grad_norm": 0.4819563925266266,
715
+ "learning_rate": 0.0005,
716
+ "loss": 0.1454,
717
+ "step": 101
718
+ },
719
+ {
720
+ "epoch": 0.10613943808532779,
721
+ "grad_norm": 0.44754841923713684,
722
+ "learning_rate": 0.0004994444444444445,
723
+ "loss": 0.0742,
724
+ "step": 102
725
+ },
726
+ {
727
+ "epoch": 0.10718002081165452,
728
+ "grad_norm": 0.3852291703224182,
729
+ "learning_rate": 0.0004988888888888889,
730
+ "loss": 0.063,
731
+ "step": 103
732
+ },
733
+ {
734
+ "epoch": 0.10822060353798127,
735
+ "grad_norm": 0.572284460067749,
736
+ "learning_rate": 0.0004983333333333334,
737
+ "loss": 0.1434,
738
+ "step": 104
739
+ },
740
+ {
741
+ "epoch": 0.10926118626430802,
742
+ "grad_norm": 0.402413934469223,
743
+ "learning_rate": 0.0004977777777777778,
744
+ "loss": 0.0897,
745
+ "step": 105
746
+ },
747
+ {
748
+ "epoch": 0.11030176899063475,
749
+ "grad_norm": 0.5178724527359009,
750
+ "learning_rate": 0.0004972222222222222,
751
+ "loss": 0.0991,
752
+ "step": 106
753
+ },
754
+ {
755
+ "epoch": 0.1113423517169615,
756
+ "grad_norm": 0.5298802852630615,
757
+ "learning_rate": 0.0004966666666666666,
758
+ "loss": 0.1265,
759
+ "step": 107
760
+ },
761
+ {
762
+ "epoch": 0.11238293444328824,
763
+ "grad_norm": 0.5106524229049683,
764
+ "learning_rate": 0.0004961111111111111,
765
+ "loss": 0.076,
766
+ "step": 108
767
+ },
768
+ {
769
+ "epoch": 0.11342351716961499,
770
+ "grad_norm": 0.4718921482563019,
771
+ "learning_rate": 0.0004955555555555556,
772
+ "loss": 0.0927,
773
+ "step": 109
774
+ },
775
+ {
776
+ "epoch": 0.11446409989594172,
777
+ "grad_norm": 0.4144158661365509,
778
+ "learning_rate": 0.000495,
779
+ "loss": 0.1075,
780
+ "step": 110
781
+ },
782
+ {
783
+ "epoch": 0.11550468262226847,
784
+ "grad_norm": 0.44835594296455383,
785
+ "learning_rate": 0.0004944444444444445,
786
+ "loss": 0.1093,
787
+ "step": 111
788
+ },
789
+ {
790
+ "epoch": 0.11654526534859522,
791
+ "grad_norm": 0.6650722622871399,
792
+ "learning_rate": 0.0004938888888888889,
793
+ "loss": 0.1082,
794
+ "step": 112
795
+ },
796
+ {
797
+ "epoch": 0.11758584807492195,
798
+ "grad_norm": 0.40712565183639526,
799
+ "learning_rate": 0.0004933333333333334,
800
+ "loss": 0.0622,
801
+ "step": 113
802
+ },
803
+ {
804
+ "epoch": 0.1186264308012487,
805
+ "grad_norm": 0.5961405634880066,
806
+ "learning_rate": 0.0004927777777777777,
807
+ "loss": 0.1041,
808
+ "step": 114
809
+ },
810
+ {
811
+ "epoch": 0.11966701352757544,
812
+ "grad_norm": 0.4379814863204956,
813
+ "learning_rate": 0.0004922222222222222,
814
+ "loss": 0.1172,
815
+ "step": 115
816
+ },
817
+ {
818
+ "epoch": 0.12070759625390219,
819
+ "grad_norm": 0.4038859009742737,
820
+ "learning_rate": 0.0004916666666666666,
821
+ "loss": 0.083,
822
+ "step": 116
823
+ },
824
+ {
825
+ "epoch": 0.12174817898022892,
826
+ "grad_norm": 0.49663108587265015,
827
+ "learning_rate": 0.0004911111111111111,
828
+ "loss": 0.0732,
829
+ "step": 117
830
+ },
831
+ {
832
+ "epoch": 0.12278876170655567,
833
+ "grad_norm": 0.34757199883461,
834
+ "learning_rate": 0.0004905555555555556,
835
+ "loss": 0.0946,
836
+ "step": 118
837
+ },
838
+ {
839
+ "epoch": 0.12382934443288242,
840
+ "grad_norm": 0.421332448720932,
841
+ "learning_rate": 0.00049,
842
+ "loss": 0.0856,
843
+ "step": 119
844
+ },
845
+ {
846
+ "epoch": 0.12486992715920915,
847
+ "grad_norm": 0.41452690958976746,
848
+ "learning_rate": 0.0004894444444444445,
849
+ "loss": 0.1235,
850
+ "step": 120
851
+ },
852
+ {
853
+ "epoch": 0.1259105098855359,
854
+ "grad_norm": 0.6133429408073425,
855
+ "learning_rate": 0.0004888888888888889,
856
+ "loss": 0.1004,
857
+ "step": 121
858
+ },
859
+ {
860
+ "epoch": 0.12695109261186263,
861
+ "grad_norm": 0.4711684286594391,
862
+ "learning_rate": 0.0004883333333333333,
863
+ "loss": 0.0944,
864
+ "step": 122
865
+ },
866
+ {
867
+ "epoch": 0.1279916753381894,
868
+ "grad_norm": 0.4512624144554138,
869
+ "learning_rate": 0.0004877777777777778,
870
+ "loss": 0.1027,
871
+ "step": 123
872
+ },
873
+ {
874
+ "epoch": 0.12903225806451613,
875
+ "grad_norm": 0.42018765211105347,
876
+ "learning_rate": 0.0004872222222222222,
877
+ "loss": 0.1185,
878
+ "step": 124
879
+ },
880
+ {
881
+ "epoch": 0.13007284079084286,
882
+ "grad_norm": 0.49484384059906006,
883
+ "learning_rate": 0.0004866666666666667,
884
+ "loss": 0.0782,
885
+ "step": 125
886
+ },
887
+ {
888
+ "epoch": 0.13111342351716962,
889
+ "grad_norm": 0.4003879427909851,
890
+ "learning_rate": 0.0004861111111111111,
891
+ "loss": 0.087,
892
+ "step": 126
893
+ },
894
+ {
895
+ "epoch": 0.13215400624349635,
896
+ "grad_norm": 0.5285933017730713,
897
+ "learning_rate": 0.0004855555555555556,
898
+ "loss": 0.078,
899
+ "step": 127
900
+ },
901
+ {
902
+ "epoch": 0.1331945889698231,
903
+ "grad_norm": 0.3752761781215668,
904
+ "learning_rate": 0.00048499999999999997,
905
+ "loss": 0.0792,
906
+ "step": 128
907
+ },
908
+ {
909
+ "epoch": 0.13423517169614985,
910
+ "grad_norm": 0.3410363495349884,
911
+ "learning_rate": 0.00048444444444444446,
912
+ "loss": 0.1107,
913
+ "step": 129
914
+ },
915
+ {
916
+ "epoch": 0.13527575442247658,
917
+ "grad_norm": 0.38146358728408813,
918
+ "learning_rate": 0.0004838888888888889,
919
+ "loss": 0.0894,
920
+ "step": 130
921
+ },
922
+ {
923
+ "epoch": 0.13631633714880334,
924
+ "grad_norm": 0.5861756801605225,
925
+ "learning_rate": 0.00048333333333333334,
926
+ "loss": 0.1187,
927
+ "step": 131
928
+ },
929
+ {
930
+ "epoch": 0.13735691987513007,
931
+ "grad_norm": 0.7138178944587708,
932
+ "learning_rate": 0.0004827777777777778,
933
+ "loss": 0.1242,
934
+ "step": 132
935
+ },
936
+ {
937
+ "epoch": 0.1383975026014568,
938
+ "grad_norm": 0.3060092031955719,
939
+ "learning_rate": 0.0004822222222222222,
940
+ "loss": 0.0721,
941
+ "step": 133
942
+ },
943
+ {
944
+ "epoch": 0.13943808532778357,
945
+ "grad_norm": 0.32948216795921326,
946
+ "learning_rate": 0.0004816666666666667,
947
+ "loss": 0.0814,
948
+ "step": 134
949
+ },
950
+ {
951
+ "epoch": 0.1404786680541103,
952
+ "grad_norm": 0.2897670865058899,
953
+ "learning_rate": 0.0004811111111111111,
954
+ "loss": 0.0728,
955
+ "step": 135
956
+ },
957
+ {
958
+ "epoch": 0.14151925078043703,
959
+ "grad_norm": 0.32715317606925964,
960
+ "learning_rate": 0.0004805555555555556,
961
+ "loss": 0.083,
962
+ "step": 136
963
+ },
964
+ {
965
+ "epoch": 0.1425598335067638,
966
+ "grad_norm": 0.28751736879348755,
967
+ "learning_rate": 0.00048,
968
+ "loss": 0.0619,
969
+ "step": 137
970
+ },
971
+ {
972
+ "epoch": 0.14360041623309053,
973
+ "grad_norm": 0.3826645612716675,
974
+ "learning_rate": 0.00047944444444444445,
975
+ "loss": 0.1057,
976
+ "step": 138
977
+ },
978
+ {
979
+ "epoch": 0.14464099895941726,
980
+ "grad_norm": 0.4589000642299652,
981
+ "learning_rate": 0.0004788888888888889,
982
+ "loss": 0.1138,
983
+ "step": 139
984
+ },
985
+ {
986
+ "epoch": 0.14568158168574402,
987
+ "grad_norm": 0.4404071569442749,
988
+ "learning_rate": 0.0004783333333333333,
989
+ "loss": 0.0824,
990
+ "step": 140
991
+ },
992
+ {
993
+ "epoch": 0.14672216441207075,
994
+ "grad_norm": 0.4857710301876068,
995
+ "learning_rate": 0.0004777777777777778,
996
+ "loss": 0.0744,
997
+ "step": 141
998
+ },
999
+ {
1000
+ "epoch": 0.14776274713839752,
1001
+ "grad_norm": 0.34489718079566956,
1002
+ "learning_rate": 0.00047722222222222225,
1003
+ "loss": 0.0556,
1004
+ "step": 142
1005
+ },
1006
+ {
1007
+ "epoch": 0.14880332986472425,
1008
+ "grad_norm": 0.3448956310749054,
1009
+ "learning_rate": 0.0004766666666666667,
1010
+ "loss": 0.064,
1011
+ "step": 143
1012
+ },
1013
+ {
1014
+ "epoch": 0.14984391259105098,
1015
+ "grad_norm": 0.3096216917037964,
1016
+ "learning_rate": 0.0004761111111111111,
1017
+ "loss": 0.0816,
1018
+ "step": 144
1019
+ },
1020
+ {
1021
+ "epoch": 0.15088449531737774,
1022
+ "grad_norm": 0.4213986396789551,
1023
+ "learning_rate": 0.00047555555555555556,
1024
+ "loss": 0.1041,
1025
+ "step": 145
1026
+ },
1027
+ {
1028
+ "epoch": 0.15192507804370448,
1029
+ "grad_norm": 0.2673068046569824,
1030
+ "learning_rate": 0.000475,
1031
+ "loss": 0.0836,
1032
+ "step": 146
1033
+ },
1034
+ {
1035
+ "epoch": 0.1529656607700312,
1036
+ "grad_norm": 0.35139915347099304,
1037
+ "learning_rate": 0.00047444444444444444,
1038
+ "loss": 0.0866,
1039
+ "step": 147
1040
+ },
1041
+ {
1042
+ "epoch": 0.15400624349635797,
1043
+ "grad_norm": 0.3168632388114929,
1044
+ "learning_rate": 0.00047388888888888893,
1045
+ "loss": 0.0693,
1046
+ "step": 148
1047
+ },
1048
+ {
1049
+ "epoch": 0.1550468262226847,
1050
+ "grad_norm": 0.3259681761264801,
1051
+ "learning_rate": 0.00047333333333333336,
1052
+ "loss": 0.0525,
1053
+ "step": 149
1054
+ },
1055
+ {
1056
+ "epoch": 0.15608740894901144,
1057
+ "grad_norm": 0.44802430272102356,
1058
+ "learning_rate": 0.0004727777777777778,
1059
+ "loss": 0.0938,
1060
+ "step": 150
1061
+ },
1062
+ {
1063
+ "epoch": 0.1571279916753382,
1064
+ "grad_norm": 0.2723800241947174,
1065
+ "learning_rate": 0.00047222222222222224,
1066
+ "loss": 0.0637,
1067
+ "step": 151
1068
+ },
1069
+ {
1070
+ "epoch": 0.15816857440166493,
1071
+ "grad_norm": 0.33274656534194946,
1072
+ "learning_rate": 0.0004716666666666667,
1073
+ "loss": 0.0776,
1074
+ "step": 152
1075
+ },
1076
+ {
1077
+ "epoch": 0.15920915712799166,
1078
+ "grad_norm": 0.41862592101097107,
1079
+ "learning_rate": 0.0004711111111111111,
1080
+ "loss": 0.0979,
1081
+ "step": 153
1082
+ },
1083
+ {
1084
+ "epoch": 0.16024973985431842,
1085
+ "grad_norm": 0.35577768087387085,
1086
+ "learning_rate": 0.00047055555555555555,
1087
+ "loss": 0.0414,
1088
+ "step": 154
1089
+ },
1090
+ {
1091
+ "epoch": 0.16129032258064516,
1092
+ "grad_norm": 0.32270193099975586,
1093
+ "learning_rate": 0.00047,
1094
+ "loss": 0.101,
1095
+ "step": 155
1096
+ },
1097
+ {
1098
+ "epoch": 0.16233090530697192,
1099
+ "grad_norm": 0.2666638493537903,
1100
+ "learning_rate": 0.0004694444444444445,
1101
+ "loss": 0.0689,
1102
+ "step": 156
1103
+ },
1104
+ {
1105
+ "epoch": 0.16337148803329865,
1106
+ "grad_norm": 0.20294290781021118,
1107
+ "learning_rate": 0.0004688888888888889,
1108
+ "loss": 0.0533,
1109
+ "step": 157
1110
+ },
1111
+ {
1112
+ "epoch": 0.16441207075962538,
1113
+ "grad_norm": 0.3359270989894867,
1114
+ "learning_rate": 0.00046833333333333335,
1115
+ "loss": 0.0817,
1116
+ "step": 158
1117
+ },
1118
+ {
1119
+ "epoch": 0.16545265348595214,
1120
+ "grad_norm": 0.44312432408332825,
1121
+ "learning_rate": 0.0004677777777777778,
1122
+ "loss": 0.0862,
1123
+ "step": 159
1124
+ },
1125
+ {
1126
+ "epoch": 0.16649323621227888,
1127
+ "grad_norm": 0.24581390619277954,
1128
+ "learning_rate": 0.0004672222222222222,
1129
+ "loss": 0.0585,
1130
+ "step": 160
1131
+ },
1132
+ {
1133
+ "epoch": 0.1675338189386056,
1134
+ "grad_norm": 0.25939878821372986,
1135
+ "learning_rate": 0.00046666666666666666,
1136
+ "loss": 0.0737,
1137
+ "step": 161
1138
+ },
1139
+ {
1140
+ "epoch": 0.16857440166493237,
1141
+ "grad_norm": 0.212020605802536,
1142
+ "learning_rate": 0.0004661111111111111,
1143
+ "loss": 0.0487,
1144
+ "step": 162
1145
+ },
1146
+ {
1147
+ "epoch": 0.1696149843912591,
1148
+ "grad_norm": 0.30007174611091614,
1149
+ "learning_rate": 0.0004655555555555556,
1150
+ "loss": 0.0695,
1151
+ "step": 163
1152
+ },
1153
+ {
1154
+ "epoch": 0.17065556711758584,
1155
+ "grad_norm": 0.2842208445072174,
1156
+ "learning_rate": 0.000465,
1157
+ "loss": 0.0612,
1158
+ "step": 164
1159
+ },
1160
+ {
1161
+ "epoch": 0.1716961498439126,
1162
+ "grad_norm": 0.2660129964351654,
1163
+ "learning_rate": 0.00046444444444444446,
1164
+ "loss": 0.0557,
1165
+ "step": 165
1166
+ },
1167
+ {
1168
+ "epoch": 0.17273673257023933,
1169
+ "grad_norm": 0.3331991732120514,
1170
+ "learning_rate": 0.0004638888888888889,
1171
+ "loss": 0.0676,
1172
+ "step": 166
1173
+ },
1174
+ {
1175
+ "epoch": 0.17377731529656607,
1176
+ "grad_norm": 0.2525298297405243,
1177
+ "learning_rate": 0.00046333333333333334,
1178
+ "loss": 0.0552,
1179
+ "step": 167
1180
+ },
1181
+ {
1182
+ "epoch": 0.17481789802289283,
1183
+ "grad_norm": 0.2903599739074707,
1184
+ "learning_rate": 0.0004627777777777778,
1185
+ "loss": 0.0823,
1186
+ "step": 168
1187
+ },
1188
+ {
1189
+ "epoch": 0.17585848074921956,
1190
+ "grad_norm": 0.25501200556755066,
1191
+ "learning_rate": 0.0004622222222222222,
1192
+ "loss": 0.0529,
1193
+ "step": 169
1194
+ },
1195
+ {
1196
+ "epoch": 0.1768990634755463,
1197
+ "grad_norm": 0.27259787917137146,
1198
+ "learning_rate": 0.0004616666666666667,
1199
+ "loss": 0.0635,
1200
+ "step": 170
1201
+ },
1202
+ {
1203
+ "epoch": 0.17793964620187305,
1204
+ "grad_norm": 0.22791972756385803,
1205
+ "learning_rate": 0.00046111111111111114,
1206
+ "loss": 0.0608,
1207
+ "step": 171
1208
+ },
1209
+ {
1210
+ "epoch": 0.17898022892819979,
1211
+ "grad_norm": 0.40977853536605835,
1212
+ "learning_rate": 0.0004605555555555556,
1213
+ "loss": 0.0907,
1214
+ "step": 172
1215
+ },
1216
+ {
1217
+ "epoch": 0.18002081165452655,
1218
+ "grad_norm": 0.27355197072029114,
1219
+ "learning_rate": 0.00046,
1220
+ "loss": 0.0688,
1221
+ "step": 173
1222
+ },
1223
+ {
1224
+ "epoch": 0.18106139438085328,
1225
+ "grad_norm": 0.223897784948349,
1226
+ "learning_rate": 0.00045944444444444445,
1227
+ "loss": 0.0376,
1228
+ "step": 174
1229
+ },
1230
+ {
1231
+ "epoch": 0.18210197710718,
1232
+ "grad_norm": 0.3418944180011749,
1233
+ "learning_rate": 0.0004588888888888889,
1234
+ "loss": 0.0483,
1235
+ "step": 175
1236
+ },
1237
+ {
1238
+ "epoch": 0.18314255983350677,
1239
+ "grad_norm": 0.22283855080604553,
1240
+ "learning_rate": 0.0004583333333333333,
1241
+ "loss": 0.0602,
1242
+ "step": 176
1243
+ },
1244
+ {
1245
+ "epoch": 0.1841831425598335,
1246
+ "grad_norm": 0.260822594165802,
1247
+ "learning_rate": 0.0004577777777777778,
1248
+ "loss": 0.0681,
1249
+ "step": 177
1250
+ },
1251
+ {
1252
+ "epoch": 0.18522372528616024,
1253
+ "grad_norm": 0.2648361921310425,
1254
+ "learning_rate": 0.0004572222222222222,
1255
+ "loss": 0.064,
1256
+ "step": 178
1257
+ },
1258
+ {
1259
+ "epoch": 0.186264308012487,
1260
+ "grad_norm": 0.28108835220336914,
1261
+ "learning_rate": 0.0004566666666666667,
1262
+ "loss": 0.0664,
1263
+ "step": 179
1264
+ },
1265
+ {
1266
+ "epoch": 0.18730489073881373,
1267
+ "grad_norm": 0.3026326298713684,
1268
+ "learning_rate": 0.0004561111111111111,
1269
+ "loss": 0.0653,
1270
+ "step": 180
1271
+ },
1272
+ {
1273
+ "epoch": 0.18834547346514047,
1274
+ "grad_norm": 0.24034692347049713,
1275
+ "learning_rate": 0.00045555555555555556,
1276
+ "loss": 0.0653,
1277
+ "step": 181
1278
+ },
1279
+ {
1280
+ "epoch": 0.18938605619146723,
1281
+ "grad_norm": 0.2587687075138092,
1282
+ "learning_rate": 0.000455,
1283
+ "loss": 0.066,
1284
+ "step": 182
1285
+ },
1286
+ {
1287
+ "epoch": 0.19042663891779396,
1288
+ "grad_norm": 0.44995367527008057,
1289
+ "learning_rate": 0.00045444444444444444,
1290
+ "loss": 0.0697,
1291
+ "step": 183
1292
+ },
1293
+ {
1294
+ "epoch": 0.1914672216441207,
1295
+ "grad_norm": 0.29801756143569946,
1296
+ "learning_rate": 0.00045388888888888893,
1297
+ "loss": 0.068,
1298
+ "step": 184
1299
+ },
1300
+ {
1301
+ "epoch": 0.19250780437044746,
1302
+ "grad_norm": 0.2797435224056244,
1303
+ "learning_rate": 0.0004533333333333333,
1304
+ "loss": 0.0704,
1305
+ "step": 185
1306
+ },
1307
+ {
1308
+ "epoch": 0.1935483870967742,
1309
+ "grad_norm": 0.21289293467998505,
1310
+ "learning_rate": 0.0004527777777777778,
1311
+ "loss": 0.0476,
1312
+ "step": 186
1313
+ },
1314
+ {
1315
+ "epoch": 0.19458896982310095,
1316
+ "grad_norm": 0.2547968029975891,
1317
+ "learning_rate": 0.00045222222222222224,
1318
+ "loss": 0.0669,
1319
+ "step": 187
1320
+ },
1321
+ {
1322
+ "epoch": 0.19562955254942768,
1323
+ "grad_norm": 0.21561963856220245,
1324
+ "learning_rate": 0.0004516666666666667,
1325
+ "loss": 0.0687,
1326
+ "step": 188
1327
+ },
1328
+ {
1329
+ "epoch": 0.19667013527575442,
1330
+ "grad_norm": 0.24872778356075287,
1331
+ "learning_rate": 0.0004511111111111111,
1332
+ "loss": 0.0539,
1333
+ "step": 189
1334
+ },
1335
+ {
1336
+ "epoch": 0.19771071800208118,
1337
+ "grad_norm": 0.2251560389995575,
1338
+ "learning_rate": 0.00045055555555555555,
1339
+ "loss": 0.0631,
1340
+ "step": 190
1341
+ },
1342
+ {
1343
+ "epoch": 0.1987513007284079,
1344
+ "grad_norm": 0.3262229263782501,
1345
+ "learning_rate": 0.00045000000000000004,
1346
+ "loss": 0.0906,
1347
+ "step": 191
1348
+ },
1349
+ {
1350
+ "epoch": 0.19979188345473464,
1351
+ "grad_norm": 0.25986504554748535,
1352
+ "learning_rate": 0.0004494444444444444,
1353
+ "loss": 0.0424,
1354
+ "step": 192
1355
+ },
1356
+ {
1357
+ "epoch": 0.2008324661810614,
1358
+ "grad_norm": 0.279202938079834,
1359
+ "learning_rate": 0.0004488888888888889,
1360
+ "loss": 0.0603,
1361
+ "step": 193
1362
+ },
1363
+ {
1364
+ "epoch": 0.20187304890738814,
1365
+ "grad_norm": 0.24421726167201996,
1366
+ "learning_rate": 0.0004483333333333333,
1367
+ "loss": 0.0545,
1368
+ "step": 194
1369
+ },
1370
+ {
1371
+ "epoch": 0.20291363163371487,
1372
+ "grad_norm": 0.23044031858444214,
1373
+ "learning_rate": 0.0004477777777777778,
1374
+ "loss": 0.0582,
1375
+ "step": 195
1376
+ },
1377
+ {
1378
+ "epoch": 0.20395421436004163,
1379
+ "grad_norm": 0.3058019280433655,
1380
+ "learning_rate": 0.0004472222222222222,
1381
+ "loss": 0.071,
1382
+ "step": 196
1383
+ },
1384
+ {
1385
+ "epoch": 0.20499479708636836,
1386
+ "grad_norm": 0.32619190216064453,
1387
+ "learning_rate": 0.00044666666666666666,
1388
+ "loss": 0.0625,
1389
+ "step": 197
1390
+ },
1391
+ {
1392
+ "epoch": 0.2060353798126951,
1393
+ "grad_norm": 0.2773308753967285,
1394
+ "learning_rate": 0.00044611111111111115,
1395
+ "loss": 0.0496,
1396
+ "step": 198
1397
+ },
1398
+ {
1399
+ "epoch": 0.20707596253902186,
1400
+ "grad_norm": 0.19181455671787262,
1401
+ "learning_rate": 0.00044555555555555554,
1402
+ "loss": 0.0424,
1403
+ "step": 199
1404
+ },
1405
+ {
1406
+ "epoch": 0.2081165452653486,
1407
+ "grad_norm": 0.3275878131389618,
1408
+ "learning_rate": 0.00044500000000000003,
1409
+ "loss": 0.0505,
1410
+ "step": 200
1411
+ },
1412
+ {
1413
+ "epoch": 0.20915712799167535,
1414
+ "grad_norm": 0.2280910611152649,
1415
+ "learning_rate": 0.0004444444444444444,
1416
+ "loss": 0.0526,
1417
+ "step": 201
1418
+ },
1419
+ {
1420
+ "epoch": 0.21019771071800208,
1421
+ "grad_norm": 0.21952077746391296,
1422
+ "learning_rate": 0.0004438888888888889,
1423
+ "loss": 0.0581,
1424
+ "step": 202
1425
+ },
1426
+ {
1427
+ "epoch": 0.21123829344432882,
1428
+ "grad_norm": 0.2316325306892395,
1429
+ "learning_rate": 0.00044333333333333334,
1430
+ "loss": 0.0587,
1431
+ "step": 203
1432
+ },
1433
+ {
1434
+ "epoch": 0.21227887617065558,
1435
+ "grad_norm": 0.2537364363670349,
1436
+ "learning_rate": 0.0004427777777777778,
1437
+ "loss": 0.0557,
1438
+ "step": 204
1439
+ },
1440
+ {
1441
+ "epoch": 0.2133194588969823,
1442
+ "grad_norm": 0.24439412355422974,
1443
+ "learning_rate": 0.00044222222222222227,
1444
+ "loss": 0.0333,
1445
+ "step": 205
1446
+ },
1447
+ {
1448
+ "epoch": 0.21436004162330904,
1449
+ "grad_norm": 0.21104027330875397,
1450
+ "learning_rate": 0.00044166666666666665,
1451
+ "loss": 0.0643,
1452
+ "step": 206
1453
+ },
1454
+ {
1455
+ "epoch": 0.2154006243496358,
1456
+ "grad_norm": 0.2639058232307434,
1457
+ "learning_rate": 0.00044111111111111114,
1458
+ "loss": 0.0443,
1459
+ "step": 207
1460
+ },
1461
+ {
1462
+ "epoch": 0.21644120707596254,
1463
+ "grad_norm": 0.19854490458965302,
1464
+ "learning_rate": 0.0004405555555555555,
1465
+ "loss": 0.0402,
1466
+ "step": 208
1467
+ },
1468
+ {
1469
+ "epoch": 0.21748178980228927,
1470
+ "grad_norm": 0.49617311358451843,
1471
+ "learning_rate": 0.00044,
1472
+ "loss": 0.0668,
1473
+ "step": 209
1474
+ },
1475
+ {
1476
+ "epoch": 0.21852237252861603,
1477
+ "grad_norm": 0.2171219140291214,
1478
+ "learning_rate": 0.0004394444444444445,
1479
+ "loss": 0.0531,
1480
+ "step": 210
1481
+ },
1482
+ {
1483
+ "epoch": 0.21956295525494277,
1484
+ "grad_norm": 0.21126677095890045,
1485
+ "learning_rate": 0.0004388888888888889,
1486
+ "loss": 0.0618,
1487
+ "step": 211
1488
+ },
1489
+ {
1490
+ "epoch": 0.2206035379812695,
1491
+ "grad_norm": 0.22313550114631653,
1492
+ "learning_rate": 0.0004383333333333334,
1493
+ "loss": 0.0381,
1494
+ "step": 212
1495
+ },
1496
+ {
1497
+ "epoch": 0.22164412070759626,
1498
+ "grad_norm": 0.22066129744052887,
1499
+ "learning_rate": 0.00043777777777777776,
1500
+ "loss": 0.0516,
1501
+ "step": 213
1502
+ },
1503
+ {
1504
+ "epoch": 0.222684703433923,
1505
+ "grad_norm": 0.19753003120422363,
1506
+ "learning_rate": 0.00043722222222222225,
1507
+ "loss": 0.0472,
1508
+ "step": 214
1509
+ },
1510
+ {
1511
+ "epoch": 0.22372528616024975,
1512
+ "grad_norm": 0.20395542681217194,
1513
+ "learning_rate": 0.00043666666666666664,
1514
+ "loss": 0.0384,
1515
+ "step": 215
1516
+ },
1517
+ {
1518
+ "epoch": 0.2247658688865765,
1519
+ "grad_norm": 0.25114142894744873,
1520
+ "learning_rate": 0.00043611111111111113,
1521
+ "loss": 0.0557,
1522
+ "step": 216
1523
+ },
1524
+ {
1525
+ "epoch": 0.22580645161290322,
1526
+ "grad_norm": 0.3654433786869049,
1527
+ "learning_rate": 0.0004355555555555555,
1528
+ "loss": 0.0476,
1529
+ "step": 217
1530
+ },
1531
+ {
1532
+ "epoch": 0.22684703433922998,
1533
+ "grad_norm": 0.22211597859859467,
1534
+ "learning_rate": 0.000435,
1535
+ "loss": 0.0515,
1536
+ "step": 218
1537
+ },
1538
+ {
1539
+ "epoch": 0.2278876170655567,
1540
+ "grad_norm": 0.24841049313545227,
1541
+ "learning_rate": 0.0004344444444444445,
1542
+ "loss": 0.0662,
1543
+ "step": 219
1544
+ },
1545
+ {
1546
+ "epoch": 0.22892819979188345,
1547
+ "grad_norm": 0.2204892486333847,
1548
+ "learning_rate": 0.0004338888888888889,
1549
+ "loss": 0.0568,
1550
+ "step": 220
1551
+ },
1552
+ {
1553
+ "epoch": 0.2299687825182102,
1554
+ "grad_norm": 0.2373652160167694,
1555
+ "learning_rate": 0.00043333333333333337,
1556
+ "loss": 0.0492,
1557
+ "step": 221
1558
+ },
1559
+ {
1560
+ "epoch": 0.23100936524453694,
1561
+ "grad_norm": 0.26821693778038025,
1562
+ "learning_rate": 0.00043277777777777775,
1563
+ "loss": 0.0572,
1564
+ "step": 222
1565
+ },
1566
+ {
1567
+ "epoch": 0.23204994797086367,
1568
+ "grad_norm": 0.23499903082847595,
1569
+ "learning_rate": 0.00043222222222222224,
1570
+ "loss": 0.0443,
1571
+ "step": 223
1572
+ },
1573
+ {
1574
+ "epoch": 0.23309053069719043,
1575
+ "grad_norm": 0.2623459994792938,
1576
+ "learning_rate": 0.0004316666666666667,
1577
+ "loss": 0.0493,
1578
+ "step": 224
1579
+ },
1580
+ {
1581
+ "epoch": 0.23413111342351717,
1582
+ "grad_norm": 0.23820453882217407,
1583
+ "learning_rate": 0.0004311111111111111,
1584
+ "loss": 0.0462,
1585
+ "step": 225
1586
+ },
1587
+ {
1588
+ "epoch": 0.2351716961498439,
1589
+ "grad_norm": 0.196584090590477,
1590
+ "learning_rate": 0.0004305555555555556,
1591
+ "loss": 0.0442,
1592
+ "step": 226
1593
+ },
1594
+ {
1595
+ "epoch": 0.23621227887617066,
1596
+ "grad_norm": 0.26306819915771484,
1597
+ "learning_rate": 0.00043,
1598
+ "loss": 0.0564,
1599
+ "step": 227
1600
+ },
1601
+ {
1602
+ "epoch": 0.2372528616024974,
1603
+ "grad_norm": 0.2611851096153259,
1604
+ "learning_rate": 0.0004294444444444445,
1605
+ "loss": 0.0452,
1606
+ "step": 228
1607
+ },
1608
+ {
1609
+ "epoch": 0.23829344432882413,
1610
+ "grad_norm": 0.21443575620651245,
1611
+ "learning_rate": 0.00042888888888888886,
1612
+ "loss": 0.0543,
1613
+ "step": 229
1614
+ },
1615
+ {
1616
+ "epoch": 0.2393340270551509,
1617
+ "grad_norm": 0.30607742071151733,
1618
+ "learning_rate": 0.00042833333333333335,
1619
+ "loss": 0.0499,
1620
+ "step": 230
1621
+ },
1622
+ {
1623
+ "epoch": 0.24037460978147762,
1624
+ "grad_norm": 0.29146668314933777,
1625
+ "learning_rate": 0.0004277777777777778,
1626
+ "loss": 0.0588,
1627
+ "step": 231
1628
+ },
1629
+ {
1630
+ "epoch": 0.24141519250780438,
1631
+ "grad_norm": 0.18191011250019073,
1632
+ "learning_rate": 0.00042722222222222223,
1633
+ "loss": 0.0435,
1634
+ "step": 232
1635
+ },
1636
+ {
1637
+ "epoch": 0.24245577523413112,
1638
+ "grad_norm": 0.184339240193367,
1639
+ "learning_rate": 0.0004266666666666667,
1640
+ "loss": 0.0324,
1641
+ "step": 233
1642
+ },
1643
+ {
1644
+ "epoch": 0.24349635796045785,
1645
+ "grad_norm": 0.23122777044773102,
1646
+ "learning_rate": 0.0004261111111111111,
1647
+ "loss": 0.0343,
1648
+ "step": 234
1649
+ },
1650
+ {
1651
+ "epoch": 0.2445369406867846,
1652
+ "grad_norm": 0.20807258784770966,
1653
+ "learning_rate": 0.0004255555555555556,
1654
+ "loss": 0.0522,
1655
+ "step": 235
1656
+ },
1657
+ {
1658
+ "epoch": 0.24557752341311134,
1659
+ "grad_norm": 0.19972191751003265,
1660
+ "learning_rate": 0.000425,
1661
+ "loss": 0.0529,
1662
+ "step": 236
1663
+ },
1664
+ {
1665
+ "epoch": 0.24661810613943808,
1666
+ "grad_norm": 0.21919365227222443,
1667
+ "learning_rate": 0.00042444444444444447,
1668
+ "loss": 0.0406,
1669
+ "step": 237
1670
+ },
1671
+ {
1672
+ "epoch": 0.24765868886576484,
1673
+ "grad_norm": 0.2519589960575104,
1674
+ "learning_rate": 0.0004238888888888889,
1675
+ "loss": 0.0571,
1676
+ "step": 238
1677
+ },
1678
+ {
1679
+ "epoch": 0.24869927159209157,
1680
+ "grad_norm": 0.1512586921453476,
1681
+ "learning_rate": 0.00042333333333333334,
1682
+ "loss": 0.0368,
1683
+ "step": 239
1684
+ },
1685
+ {
1686
+ "epoch": 0.2497398543184183,
1687
+ "grad_norm": 0.20062124729156494,
1688
+ "learning_rate": 0.0004227777777777778,
1689
+ "loss": 0.0428,
1690
+ "step": 240
1691
+ },
1692
+ {
1693
+ "epoch": 0.25078043704474506,
1694
+ "grad_norm": 0.2119806557893753,
1695
+ "learning_rate": 0.0004222222222222222,
1696
+ "loss": 0.0592,
1697
+ "step": 241
1698
+ },
1699
+ {
1700
+ "epoch": 0.2518210197710718,
1701
+ "grad_norm": 0.3062295615673065,
1702
+ "learning_rate": 0.0004216666666666667,
1703
+ "loss": 0.0613,
1704
+ "step": 242
1705
+ },
1706
+ {
1707
+ "epoch": 0.25286160249739853,
1708
+ "grad_norm": 0.21827293932437897,
1709
+ "learning_rate": 0.0004211111111111111,
1710
+ "loss": 0.0531,
1711
+ "step": 243
1712
+ },
1713
+ {
1714
+ "epoch": 0.25390218522372526,
1715
+ "grad_norm": 0.2759004235267639,
1716
+ "learning_rate": 0.0004205555555555556,
1717
+ "loss": 0.0561,
1718
+ "step": 244
1719
+ },
1720
+ {
1721
+ "epoch": 0.25494276795005205,
1722
+ "grad_norm": 0.1976407915353775,
1723
+ "learning_rate": 0.00042,
1724
+ "loss": 0.0374,
1725
+ "step": 245
1726
+ },
1727
+ {
1728
+ "epoch": 0.2559833506763788,
1729
+ "grad_norm": 0.2423432171344757,
1730
+ "learning_rate": 0.00041944444444444445,
1731
+ "loss": 0.049,
1732
+ "step": 246
1733
+ },
1734
+ {
1735
+ "epoch": 0.2570239334027055,
1736
+ "grad_norm": 0.20555488765239716,
1737
+ "learning_rate": 0.0004188888888888889,
1738
+ "loss": 0.0518,
1739
+ "step": 247
1740
+ },
1741
+ {
1742
+ "epoch": 0.25806451612903225,
1743
+ "grad_norm": 0.21792030334472656,
1744
+ "learning_rate": 0.00041833333333333333,
1745
+ "loss": 0.0452,
1746
+ "step": 248
1747
+ },
1748
+ {
1749
+ "epoch": 0.259105098855359,
1750
+ "grad_norm": 0.2850765883922577,
1751
+ "learning_rate": 0.0004177777777777778,
1752
+ "loss": 0.0602,
1753
+ "step": 249
1754
+ },
1755
+ {
1756
+ "epoch": 0.2601456815816857,
1757
+ "grad_norm": 0.18359482288360596,
1758
+ "learning_rate": 0.0004172222222222222,
1759
+ "loss": 0.0331,
1760
+ "step": 250
1761
+ },
1762
+ {
1763
+ "epoch": 0.2611862643080125,
1764
+ "grad_norm": 0.2370993047952652,
1765
+ "learning_rate": 0.0004166666666666667,
1766
+ "loss": 0.0568,
1767
+ "step": 251
1768
+ },
1769
+ {
1770
+ "epoch": 0.26222684703433924,
1771
+ "grad_norm": 0.20278838276863098,
1772
+ "learning_rate": 0.00041611111111111113,
1773
+ "loss": 0.0542,
1774
+ "step": 252
1775
+ },
1776
+ {
1777
+ "epoch": 0.26326742976066597,
1778
+ "grad_norm": 0.21301935613155365,
1779
+ "learning_rate": 0.00041555555555555557,
1780
+ "loss": 0.0514,
1781
+ "step": 253
1782
+ },
1783
+ {
1784
+ "epoch": 0.2643080124869927,
1785
+ "grad_norm": 0.1811857521533966,
1786
+ "learning_rate": 0.000415,
1787
+ "loss": 0.0406,
1788
+ "step": 254
1789
+ },
1790
+ {
1791
+ "epoch": 0.26534859521331944,
1792
+ "grad_norm": 0.22240598499774933,
1793
+ "learning_rate": 0.00041444444444444444,
1794
+ "loss": 0.0558,
1795
+ "step": 255
1796
+ },
1797
+ {
1798
+ "epoch": 0.2663891779396462,
1799
+ "grad_norm": 0.19993361830711365,
1800
+ "learning_rate": 0.0004138888888888889,
1801
+ "loss": 0.0507,
1802
+ "step": 256
1803
+ },
1804
+ {
1805
+ "epoch": 0.26742976066597296,
1806
+ "grad_norm": 0.2210732102394104,
1807
+ "learning_rate": 0.0004133333333333333,
1808
+ "loss": 0.0464,
1809
+ "step": 257
1810
+ },
1811
+ {
1812
+ "epoch": 0.2684703433922997,
1813
+ "grad_norm": 0.24159833788871765,
1814
+ "learning_rate": 0.0004127777777777778,
1815
+ "loss": 0.0506,
1816
+ "step": 258
1817
+ },
1818
+ {
1819
+ "epoch": 0.2695109261186264,
1820
+ "grad_norm": 0.19818955659866333,
1821
+ "learning_rate": 0.00041222222222222224,
1822
+ "loss": 0.0583,
1823
+ "step": 259
1824
+ },
1825
+ {
1826
+ "epoch": 0.27055150884495316,
1827
+ "grad_norm": 0.34667930006980896,
1828
+ "learning_rate": 0.0004116666666666667,
1829
+ "loss": 0.0844,
1830
+ "step": 260
1831
+ },
1832
+ {
1833
+ "epoch": 0.2715920915712799,
1834
+ "grad_norm": 0.2061154991388321,
1835
+ "learning_rate": 0.0004111111111111111,
1836
+ "loss": 0.0361,
1837
+ "step": 261
1838
+ },
1839
+ {
1840
+ "epoch": 0.2726326742976067,
1841
+ "grad_norm": 0.3629634380340576,
1842
+ "learning_rate": 0.00041055555555555555,
1843
+ "loss": 0.0399,
1844
+ "step": 262
1845
+ },
1846
+ {
1847
+ "epoch": 0.2736732570239334,
1848
+ "grad_norm": 0.22805607318878174,
1849
+ "learning_rate": 0.00041,
1850
+ "loss": 0.0665,
1851
+ "step": 263
1852
+ },
1853
+ {
1854
+ "epoch": 0.27471383975026015,
1855
+ "grad_norm": 0.3538663983345032,
1856
+ "learning_rate": 0.00040944444444444443,
1857
+ "loss": 0.0564,
1858
+ "step": 264
1859
+ },
1860
+ {
1861
+ "epoch": 0.2757544224765869,
1862
+ "grad_norm": 0.21005156636238098,
1863
+ "learning_rate": 0.0004088888888888889,
1864
+ "loss": 0.0513,
1865
+ "step": 265
1866
+ },
1867
+ {
1868
+ "epoch": 0.2767950052029136,
1869
+ "grad_norm": 0.1628667265176773,
1870
+ "learning_rate": 0.00040833333333333336,
1871
+ "loss": 0.041,
1872
+ "step": 266
1873
+ },
1874
+ {
1875
+ "epoch": 0.2778355879292404,
1876
+ "grad_norm": 0.1788283884525299,
1877
+ "learning_rate": 0.0004077777777777778,
1878
+ "loss": 0.0332,
1879
+ "step": 267
1880
+ },
1881
+ {
1882
+ "epoch": 0.27887617065556713,
1883
+ "grad_norm": 0.2412905991077423,
1884
+ "learning_rate": 0.00040722222222222223,
1885
+ "loss": 0.0612,
1886
+ "step": 268
1887
+ },
1888
+ {
1889
+ "epoch": 0.27991675338189387,
1890
+ "grad_norm": 0.14978761970996857,
1891
+ "learning_rate": 0.00040666666666666667,
1892
+ "loss": 0.0313,
1893
+ "step": 269
1894
+ },
1895
+ {
1896
+ "epoch": 0.2809573361082206,
1897
+ "grad_norm": 0.1715932935476303,
1898
+ "learning_rate": 0.0004061111111111111,
1899
+ "loss": 0.0363,
1900
+ "step": 270
1901
+ },
1902
+ {
1903
+ "epoch": 0.28199791883454733,
1904
+ "grad_norm": 0.20580480992794037,
1905
+ "learning_rate": 0.00040555555555555554,
1906
+ "loss": 0.038,
1907
+ "step": 271
1908
+ },
1909
+ {
1910
+ "epoch": 0.28303850156087407,
1911
+ "grad_norm": 0.31613650918006897,
1912
+ "learning_rate": 0.00040500000000000003,
1913
+ "loss": 0.0456,
1914
+ "step": 272
1915
+ },
1916
+ {
1917
+ "epoch": 0.28407908428720086,
1918
+ "grad_norm": 0.4305758476257324,
1919
+ "learning_rate": 0.00040444444444444447,
1920
+ "loss": 0.0853,
1921
+ "step": 273
1922
+ },
1923
+ {
1924
+ "epoch": 0.2851196670135276,
1925
+ "grad_norm": 0.23432056605815887,
1926
+ "learning_rate": 0.0004038888888888889,
1927
+ "loss": 0.0565,
1928
+ "step": 274
1929
+ },
1930
+ {
1931
+ "epoch": 0.2861602497398543,
1932
+ "grad_norm": 0.19864040613174438,
1933
+ "learning_rate": 0.00040333333333333334,
1934
+ "loss": 0.0434,
1935
+ "step": 275
1936
+ },
1937
+ {
1938
+ "epoch": 0.28720083246618106,
1939
+ "grad_norm": 0.16542665660381317,
1940
+ "learning_rate": 0.0004027777777777778,
1941
+ "loss": 0.0412,
1942
+ "step": 276
1943
+ },
1944
+ {
1945
+ "epoch": 0.2882414151925078,
1946
+ "grad_norm": 0.2191186547279358,
1947
+ "learning_rate": 0.0004022222222222222,
1948
+ "loss": 0.0331,
1949
+ "step": 277
1950
+ },
1951
+ {
1952
+ "epoch": 0.2892819979188345,
1953
+ "grad_norm": 0.18664966523647308,
1954
+ "learning_rate": 0.00040166666666666665,
1955
+ "loss": 0.048,
1956
+ "step": 278
1957
+ },
1958
+ {
1959
+ "epoch": 0.2903225806451613,
1960
+ "grad_norm": 0.2270483821630478,
1961
+ "learning_rate": 0.0004011111111111111,
1962
+ "loss": 0.0377,
1963
+ "step": 279
1964
+ },
1965
+ {
1966
+ "epoch": 0.29136316337148804,
1967
+ "grad_norm": 0.24307194352149963,
1968
+ "learning_rate": 0.0004005555555555556,
1969
+ "loss": 0.0348,
1970
+ "step": 280
1971
+ },
1972
+ {
1973
+ "epoch": 0.2924037460978148,
1974
+ "grad_norm": 0.2359393984079361,
1975
+ "learning_rate": 0.0004,
1976
+ "loss": 0.0544,
1977
+ "step": 281
1978
+ },
1979
+ {
1980
+ "epoch": 0.2934443288241415,
1981
+ "grad_norm": 0.18014176189899445,
1982
+ "learning_rate": 0.00039944444444444446,
1983
+ "loss": 0.0511,
1984
+ "step": 282
1985
+ },
1986
+ {
1987
+ "epoch": 0.29448491155046824,
1988
+ "grad_norm": 0.1786079704761505,
1989
+ "learning_rate": 0.0003988888888888889,
1990
+ "loss": 0.0423,
1991
+ "step": 283
1992
+ },
1993
+ {
1994
+ "epoch": 0.29552549427679503,
1995
+ "grad_norm": 0.21372316777706146,
1996
+ "learning_rate": 0.00039833333333333333,
1997
+ "loss": 0.0376,
1998
+ "step": 284
1999
+ },
2000
+ {
2001
+ "epoch": 0.29656607700312176,
2002
+ "grad_norm": 0.18096502125263214,
2003
+ "learning_rate": 0.00039777777777777777,
2004
+ "loss": 0.0403,
2005
+ "step": 285
2006
+ },
2007
+ {
2008
+ "epoch": 0.2976066597294485,
2009
+ "grad_norm": 0.2152777463197708,
2010
+ "learning_rate": 0.0003972222222222222,
2011
+ "loss": 0.0479,
2012
+ "step": 286
2013
+ },
2014
+ {
2015
+ "epoch": 0.29864724245577523,
2016
+ "grad_norm": 0.2060365378856659,
2017
+ "learning_rate": 0.0003966666666666667,
2018
+ "loss": 0.0421,
2019
+ "step": 287
2020
+ },
2021
+ {
2022
+ "epoch": 0.29968782518210196,
2023
+ "grad_norm": 0.15571239590644836,
2024
+ "learning_rate": 0.00039611111111111113,
2025
+ "loss": 0.0358,
2026
+ "step": 288
2027
+ },
2028
+ {
2029
+ "epoch": 0.3007284079084287,
2030
+ "grad_norm": 0.16673770546913147,
2031
+ "learning_rate": 0.00039555555555555557,
2032
+ "loss": 0.0327,
2033
+ "step": 289
2034
+ },
2035
+ {
2036
+ "epoch": 0.3017689906347555,
2037
+ "grad_norm": 0.25307971239089966,
2038
+ "learning_rate": 0.000395,
2039
+ "loss": 0.0521,
2040
+ "step": 290
2041
+ },
2042
+ {
2043
+ "epoch": 0.3028095733610822,
2044
+ "grad_norm": 0.21981365978717804,
2045
+ "learning_rate": 0.00039444444444444444,
2046
+ "loss": 0.0506,
2047
+ "step": 291
2048
+ },
2049
+ {
2050
+ "epoch": 0.30385015608740895,
2051
+ "grad_norm": 0.21614228188991547,
2052
+ "learning_rate": 0.00039388888888888893,
2053
+ "loss": 0.0499,
2054
+ "step": 292
2055
+ },
2056
+ {
2057
+ "epoch": 0.3048907388137357,
2058
+ "grad_norm": 0.18407006561756134,
2059
+ "learning_rate": 0.0003933333333333333,
2060
+ "loss": 0.0401,
2061
+ "step": 293
2062
+ },
2063
+ {
2064
+ "epoch": 0.3059313215400624,
2065
+ "grad_norm": 0.17395204305648804,
2066
+ "learning_rate": 0.0003927777777777778,
2067
+ "loss": 0.043,
2068
+ "step": 294
2069
+ },
2070
+ {
2071
+ "epoch": 0.30697190426638915,
2072
+ "grad_norm": 0.21453210711479187,
2073
+ "learning_rate": 0.00039222222222222225,
2074
+ "loss": 0.0543,
2075
+ "step": 295
2076
+ },
2077
+ {
2078
+ "epoch": 0.30801248699271594,
2079
+ "grad_norm": 0.15130619704723358,
2080
+ "learning_rate": 0.0003916666666666667,
2081
+ "loss": 0.0315,
2082
+ "step": 296
2083
+ },
2084
+ {
2085
+ "epoch": 0.3090530697190427,
2086
+ "grad_norm": 0.15348005294799805,
2087
+ "learning_rate": 0.0003911111111111111,
2088
+ "loss": 0.0441,
2089
+ "step": 297
2090
+ },
2091
+ {
2092
+ "epoch": 0.3100936524453694,
2093
+ "grad_norm": 0.14079153537750244,
2094
+ "learning_rate": 0.00039055555555555556,
2095
+ "loss": 0.0408,
2096
+ "step": 298
2097
+ },
2098
+ {
2099
+ "epoch": 0.31113423517169614,
2100
+ "grad_norm": 0.20261019468307495,
2101
+ "learning_rate": 0.00039000000000000005,
2102
+ "loss": 0.0494,
2103
+ "step": 299
2104
+ },
2105
+ {
2106
+ "epoch": 0.31217481789802287,
2107
+ "grad_norm": 0.1492331326007843,
2108
+ "learning_rate": 0.00038944444444444443,
2109
+ "loss": 0.0349,
2110
+ "step": 300
2111
+ },
2112
+ {
2113
+ "epoch": 0.31321540062434966,
2114
+ "grad_norm": 0.22079823911190033,
2115
+ "learning_rate": 0.0003888888888888889,
2116
+ "loss": 0.0427,
2117
+ "step": 301
2118
+ },
2119
+ {
2120
+ "epoch": 0.3142559833506764,
2121
+ "grad_norm": 0.3576699495315552,
2122
+ "learning_rate": 0.0003883333333333333,
2123
+ "loss": 0.0523,
2124
+ "step": 302
2125
+ },
2126
+ {
2127
+ "epoch": 0.3152965660770031,
2128
+ "grad_norm": 0.2876051664352417,
2129
+ "learning_rate": 0.0003877777777777778,
2130
+ "loss": 0.0625,
2131
+ "step": 303
2132
+ },
2133
+ {
2134
+ "epoch": 0.31633714880332986,
2135
+ "grad_norm": 0.20341859757900238,
2136
+ "learning_rate": 0.00038722222222222223,
2137
+ "loss": 0.0614,
2138
+ "step": 304
2139
+ },
2140
+ {
2141
+ "epoch": 0.3173777315296566,
2142
+ "grad_norm": 0.17374646663665771,
2143
+ "learning_rate": 0.00038666666666666667,
2144
+ "loss": 0.0369,
2145
+ "step": 305
2146
+ },
2147
+ {
2148
+ "epoch": 0.3184183142559833,
2149
+ "grad_norm": 0.18767137825489044,
2150
+ "learning_rate": 0.00038611111111111116,
2151
+ "loss": 0.0499,
2152
+ "step": 306
2153
+ },
2154
+ {
2155
+ "epoch": 0.3194588969823101,
2156
+ "grad_norm": 0.19571766257286072,
2157
+ "learning_rate": 0.00038555555555555554,
2158
+ "loss": 0.0455,
2159
+ "step": 307
2160
+ },
2161
+ {
2162
+ "epoch": 0.32049947970863685,
2163
+ "grad_norm": 0.17226622998714447,
2164
+ "learning_rate": 0.00038500000000000003,
2165
+ "loss": 0.0304,
2166
+ "step": 308
2167
+ },
2168
+ {
2169
+ "epoch": 0.3215400624349636,
2170
+ "grad_norm": 0.21688619256019592,
2171
+ "learning_rate": 0.0003844444444444444,
2172
+ "loss": 0.0433,
2173
+ "step": 309
2174
+ },
2175
+ {
2176
+ "epoch": 0.3225806451612903,
2177
+ "grad_norm": 0.25550422072410583,
2178
+ "learning_rate": 0.0003838888888888889,
2179
+ "loss": 0.0492,
2180
+ "step": 310
2181
+ },
2182
+ {
2183
+ "epoch": 0.32362122788761705,
2184
+ "grad_norm": 0.30014583468437195,
2185
+ "learning_rate": 0.00038333333333333334,
2186
+ "loss": 0.0377,
2187
+ "step": 311
2188
+ },
2189
+ {
2190
+ "epoch": 0.32466181061394384,
2191
+ "grad_norm": 0.1463593989610672,
2192
+ "learning_rate": 0.0003827777777777778,
2193
+ "loss": 0.0349,
2194
+ "step": 312
2195
+ },
2196
+ {
2197
+ "epoch": 0.32570239334027057,
2198
+ "grad_norm": 0.24401473999023438,
2199
+ "learning_rate": 0.0003822222222222223,
2200
+ "loss": 0.0596,
2201
+ "step": 313
2202
+ },
2203
+ {
2204
+ "epoch": 0.3267429760665973,
2205
+ "grad_norm": 0.17971399426460266,
2206
+ "learning_rate": 0.00038166666666666666,
2207
+ "loss": 0.0418,
2208
+ "step": 314
2209
+ },
2210
+ {
2211
+ "epoch": 0.32778355879292403,
2212
+ "grad_norm": 0.19277223944664001,
2213
+ "learning_rate": 0.00038111111111111115,
2214
+ "loss": 0.0511,
2215
+ "step": 315
2216
+ },
2217
+ {
2218
+ "epoch": 0.32882414151925077,
2219
+ "grad_norm": 0.1726415902376175,
2220
+ "learning_rate": 0.00038055555555555553,
2221
+ "loss": 0.0267,
2222
+ "step": 316
2223
+ },
2224
+ {
2225
+ "epoch": 0.3298647242455775,
2226
+ "grad_norm": 0.14282868802547455,
2227
+ "learning_rate": 0.00038,
2228
+ "loss": 0.027,
2229
+ "step": 317
2230
+ },
2231
+ {
2232
+ "epoch": 0.3309053069719043,
2233
+ "grad_norm": 0.17617446184158325,
2234
+ "learning_rate": 0.0003794444444444444,
2235
+ "loss": 0.0472,
2236
+ "step": 318
2237
+ },
2238
+ {
2239
+ "epoch": 0.331945889698231,
2240
+ "grad_norm": 0.16604778170585632,
2241
+ "learning_rate": 0.0003788888888888889,
2242
+ "loss": 0.0454,
2243
+ "step": 319
2244
+ },
2245
+ {
2246
+ "epoch": 0.33298647242455776,
2247
+ "grad_norm": 0.19378170371055603,
2248
+ "learning_rate": 0.0003783333333333334,
2249
+ "loss": 0.0417,
2250
+ "step": 320
2251
+ },
2252
+ {
2253
+ "epoch": 0.3340270551508845,
2254
+ "grad_norm": 0.18169185519218445,
2255
+ "learning_rate": 0.00037777777777777777,
2256
+ "loss": 0.0414,
2257
+ "step": 321
2258
+ },
2259
+ {
2260
+ "epoch": 0.3350676378772112,
2261
+ "grad_norm": 0.33982396125793457,
2262
+ "learning_rate": 0.00037722222222222226,
2263
+ "loss": 0.0571,
2264
+ "step": 322
2265
+ },
2266
+ {
2267
+ "epoch": 0.33610822060353795,
2268
+ "grad_norm": 0.14488692581653595,
2269
+ "learning_rate": 0.00037666666666666664,
2270
+ "loss": 0.0371,
2271
+ "step": 323
2272
+ },
2273
+ {
2274
+ "epoch": 0.33714880332986474,
2275
+ "grad_norm": 0.2292122095823288,
2276
+ "learning_rate": 0.00037611111111111113,
2277
+ "loss": 0.0416,
2278
+ "step": 324
2279
+ },
2280
+ {
2281
+ "epoch": 0.3381893860561915,
2282
+ "grad_norm": 0.14065934717655182,
2283
+ "learning_rate": 0.0003755555555555555,
2284
+ "loss": 0.0384,
2285
+ "step": 325
2286
+ },
2287
+ {
2288
+ "epoch": 0.3392299687825182,
2289
+ "grad_norm": 0.17268255352973938,
2290
+ "learning_rate": 0.000375,
2291
+ "loss": 0.0389,
2292
+ "step": 326
2293
+ },
2294
+ {
2295
+ "epoch": 0.34027055150884494,
2296
+ "grad_norm": 0.19866085052490234,
2297
+ "learning_rate": 0.0003744444444444445,
2298
+ "loss": 0.0432,
2299
+ "step": 327
2300
+ },
2301
+ {
2302
+ "epoch": 0.3413111342351717,
2303
+ "grad_norm": 0.15219862759113312,
2304
+ "learning_rate": 0.0003738888888888889,
2305
+ "loss": 0.0444,
2306
+ "step": 328
2307
+ },
2308
+ {
2309
+ "epoch": 0.34235171696149846,
2310
+ "grad_norm": 0.19327589869499207,
2311
+ "learning_rate": 0.0003733333333333334,
2312
+ "loss": 0.0393,
2313
+ "step": 329
2314
+ },
2315
+ {
2316
+ "epoch": 0.3433922996878252,
2317
+ "grad_norm": 0.1899562031030655,
2318
+ "learning_rate": 0.00037277777777777776,
2319
+ "loss": 0.0477,
2320
+ "step": 330
2321
+ },
2322
+ {
2323
+ "epoch": 0.34443288241415193,
2324
+ "grad_norm": 0.15427608788013458,
2325
+ "learning_rate": 0.00037222222222222225,
2326
+ "loss": 0.0474,
2327
+ "step": 331
2328
+ },
2329
+ {
2330
+ "epoch": 0.34547346514047866,
2331
+ "grad_norm": 0.20968617498874664,
2332
+ "learning_rate": 0.00037166666666666663,
2333
+ "loss": 0.0466,
2334
+ "step": 332
2335
+ },
2336
+ {
2337
+ "epoch": 0.3465140478668054,
2338
+ "grad_norm": 0.19527389109134674,
2339
+ "learning_rate": 0.0003711111111111111,
2340
+ "loss": 0.0321,
2341
+ "step": 333
2342
+ },
2343
+ {
2344
+ "epoch": 0.34755463059313213,
2345
+ "grad_norm": 0.17147623002529144,
2346
+ "learning_rate": 0.0003705555555555556,
2347
+ "loss": 0.036,
2348
+ "step": 334
2349
+ },
2350
+ {
2351
+ "epoch": 0.3485952133194589,
2352
+ "grad_norm": 0.14404618740081787,
2353
+ "learning_rate": 0.00037,
2354
+ "loss": 0.0334,
2355
+ "step": 335
2356
+ },
2357
+ {
2358
+ "epoch": 0.34963579604578565,
2359
+ "grad_norm": 0.15034568309783936,
2360
+ "learning_rate": 0.0003694444444444445,
2361
+ "loss": 0.0282,
2362
+ "step": 336
2363
+ },
2364
+ {
2365
+ "epoch": 0.3506763787721124,
2366
+ "grad_norm": 0.15347059071063995,
2367
+ "learning_rate": 0.00036888888888888887,
2368
+ "loss": 0.0417,
2369
+ "step": 337
2370
+ },
2371
+ {
2372
+ "epoch": 0.3517169614984391,
2373
+ "grad_norm": 0.2456592172384262,
2374
+ "learning_rate": 0.00036833333333333336,
2375
+ "loss": 0.0534,
2376
+ "step": 338
2377
+ },
2378
+ {
2379
+ "epoch": 0.35275754422476585,
2380
+ "grad_norm": 0.10621064156293869,
2381
+ "learning_rate": 0.00036777777777777774,
2382
+ "loss": 0.0321,
2383
+ "step": 339
2384
+ },
2385
+ {
2386
+ "epoch": 0.3537981269510926,
2387
+ "grad_norm": 0.16830244660377502,
2388
+ "learning_rate": 0.00036722222222222223,
2389
+ "loss": 0.0317,
2390
+ "step": 340
2391
+ },
2392
+ {
2393
+ "epoch": 0.3548387096774194,
2394
+ "grad_norm": 0.12538719177246094,
2395
+ "learning_rate": 0.00036666666666666667,
2396
+ "loss": 0.0416,
2397
+ "step": 341
2398
+ },
2399
+ {
2400
+ "epoch": 0.3558792924037461,
2401
+ "grad_norm": 0.17756634950637817,
2402
+ "learning_rate": 0.0003661111111111111,
2403
+ "loss": 0.043,
2404
+ "step": 342
2405
+ },
2406
+ {
2407
+ "epoch": 0.35691987513007284,
2408
+ "grad_norm": 0.14569824934005737,
2409
+ "learning_rate": 0.0003655555555555556,
2410
+ "loss": 0.0429,
2411
+ "step": 343
2412
+ },
2413
+ {
2414
+ "epoch": 0.35796045785639957,
2415
+ "grad_norm": 0.12731237709522247,
2416
+ "learning_rate": 0.000365,
2417
+ "loss": 0.0325,
2418
+ "step": 344
2419
+ },
2420
+ {
2421
+ "epoch": 0.3590010405827263,
2422
+ "grad_norm": 0.19159571826457977,
2423
+ "learning_rate": 0.00036444444444444447,
2424
+ "loss": 0.0583,
2425
+ "step": 345
2426
+ },
2427
+ {
2428
+ "epoch": 0.3600416233090531,
2429
+ "grad_norm": 0.18616175651550293,
2430
+ "learning_rate": 0.00036388888888888886,
2431
+ "loss": 0.0465,
2432
+ "step": 346
2433
+ },
2434
+ {
2435
+ "epoch": 0.3610822060353798,
2436
+ "grad_norm": 0.15460412204265594,
2437
+ "learning_rate": 0.00036333333333333335,
2438
+ "loss": 0.0421,
2439
+ "step": 347
2440
+ },
2441
+ {
2442
+ "epoch": 0.36212278876170656,
2443
+ "grad_norm": 0.1955643892288208,
2444
+ "learning_rate": 0.0003627777777777778,
2445
+ "loss": 0.0433,
2446
+ "step": 348
2447
+ },
2448
+ {
2449
+ "epoch": 0.3631633714880333,
2450
+ "grad_norm": 0.13383328914642334,
2451
+ "learning_rate": 0.0003622222222222222,
2452
+ "loss": 0.0305,
2453
+ "step": 349
2454
+ },
2455
+ {
2456
+ "epoch": 0.36420395421436,
2457
+ "grad_norm": 0.15549112856388092,
2458
+ "learning_rate": 0.0003616666666666667,
2459
+ "loss": 0.0466,
2460
+ "step": 350
2461
+ },
2462
+ {
2463
+ "epoch": 0.36524453694068676,
2464
+ "grad_norm": 0.26684895157814026,
2465
+ "learning_rate": 0.0003611111111111111,
2466
+ "loss": 0.0595,
2467
+ "step": 351
2468
+ },
2469
+ {
2470
+ "epoch": 0.36628511966701355,
2471
+ "grad_norm": 0.20298495888710022,
2472
+ "learning_rate": 0.0003605555555555556,
2473
+ "loss": 0.0388,
2474
+ "step": 352
2475
+ },
2476
+ {
2477
+ "epoch": 0.3673257023933403,
2478
+ "grad_norm": 0.11693593859672546,
2479
+ "learning_rate": 0.00035999999999999997,
2480
+ "loss": 0.0258,
2481
+ "step": 353
2482
+ },
2483
+ {
2484
+ "epoch": 0.368366285119667,
2485
+ "grad_norm": 0.19449491798877716,
2486
+ "learning_rate": 0.00035944444444444446,
2487
+ "loss": 0.0558,
2488
+ "step": 354
2489
+ },
2490
+ {
2491
+ "epoch": 0.36940686784599375,
2492
+ "grad_norm": 0.15460844337940216,
2493
+ "learning_rate": 0.0003588888888888889,
2494
+ "loss": 0.0447,
2495
+ "step": 355
2496
+ },
2497
+ {
2498
+ "epoch": 0.3704474505723205,
2499
+ "grad_norm": 0.11926595866680145,
2500
+ "learning_rate": 0.00035833333333333333,
2501
+ "loss": 0.0265,
2502
+ "step": 356
2503
+ },
2504
+ {
2505
+ "epoch": 0.37148803329864727,
2506
+ "grad_norm": 0.14108620584011078,
2507
+ "learning_rate": 0.00035777777777777777,
2508
+ "loss": 0.0316,
2509
+ "step": 357
2510
+ },
2511
+ {
2512
+ "epoch": 0.372528616024974,
2513
+ "grad_norm": 0.15077660977840424,
2514
+ "learning_rate": 0.0003572222222222222,
2515
+ "loss": 0.0371,
2516
+ "step": 358
2517
+ },
2518
+ {
2519
+ "epoch": 0.37356919875130074,
2520
+ "grad_norm": 0.20584896206855774,
2521
+ "learning_rate": 0.0003566666666666667,
2522
+ "loss": 0.0352,
2523
+ "step": 359
2524
+ },
2525
+ {
2526
+ "epoch": 0.37460978147762747,
2527
+ "grad_norm": 0.19043448567390442,
2528
+ "learning_rate": 0.0003561111111111111,
2529
+ "loss": 0.0503,
2530
+ "step": 360
2531
+ },
2532
+ {
2533
+ "epoch": 0.3756503642039542,
2534
+ "grad_norm": 0.1698172390460968,
2535
+ "learning_rate": 0.00035555555555555557,
2536
+ "loss": 0.0473,
2537
+ "step": 361
2538
+ },
2539
+ {
2540
+ "epoch": 0.37669094693028093,
2541
+ "grad_norm": 0.13688473403453827,
2542
+ "learning_rate": 0.000355,
2543
+ "loss": 0.0346,
2544
+ "step": 362
2545
+ },
2546
+ {
2547
+ "epoch": 0.3777315296566077,
2548
+ "grad_norm": 0.15289755165576935,
2549
+ "learning_rate": 0.00035444444444444445,
2550
+ "loss": 0.0266,
2551
+ "step": 363
2552
+ },
2553
+ {
2554
+ "epoch": 0.37877211238293446,
2555
+ "grad_norm": 0.1375945657491684,
2556
+ "learning_rate": 0.0003538888888888889,
2557
+ "loss": 0.0425,
2558
+ "step": 364
2559
+ },
2560
+ {
2561
+ "epoch": 0.3798126951092612,
2562
+ "grad_norm": 0.14744621515274048,
2563
+ "learning_rate": 0.0003533333333333333,
2564
+ "loss": 0.0327,
2565
+ "step": 365
2566
+ },
2567
+ {
2568
+ "epoch": 0.3808532778355879,
2569
+ "grad_norm": 0.1553272008895874,
2570
+ "learning_rate": 0.0003527777777777778,
2571
+ "loss": 0.0349,
2572
+ "step": 366
2573
+ },
2574
+ {
2575
+ "epoch": 0.38189386056191466,
2576
+ "grad_norm": 0.13864699006080627,
2577
+ "learning_rate": 0.00035222222222222225,
2578
+ "loss": 0.0358,
2579
+ "step": 367
2580
+ },
2581
+ {
2582
+ "epoch": 0.3829344432882414,
2583
+ "grad_norm": 0.14019955694675446,
2584
+ "learning_rate": 0.0003516666666666667,
2585
+ "loss": 0.0362,
2586
+ "step": 368
2587
+ },
2588
+ {
2589
+ "epoch": 0.3839750260145682,
2590
+ "grad_norm": 0.1420709192752838,
2591
+ "learning_rate": 0.0003511111111111111,
2592
+ "loss": 0.0336,
2593
+ "step": 369
2594
+ },
2595
+ {
2596
+ "epoch": 0.3850156087408949,
2597
+ "grad_norm": 0.2503511309623718,
2598
+ "learning_rate": 0.00035055555555555556,
2599
+ "loss": 0.0708,
2600
+ "step": 370
2601
+ },
2602
+ {
2603
+ "epoch": 0.38605619146722164,
2604
+ "grad_norm": 0.15453968942165375,
2605
+ "learning_rate": 0.00035,
2606
+ "loss": 0.0399,
2607
+ "step": 371
2608
+ },
2609
+ {
2610
+ "epoch": 0.3870967741935484,
2611
+ "grad_norm": 0.16369573771953583,
2612
+ "learning_rate": 0.00034944444444444443,
2613
+ "loss": 0.0416,
2614
+ "step": 372
2615
+ },
2616
+ {
2617
+ "epoch": 0.3881373569198751,
2618
+ "grad_norm": 0.13033686578273773,
2619
+ "learning_rate": 0.0003488888888888889,
2620
+ "loss": 0.0389,
2621
+ "step": 373
2622
+ },
2623
+ {
2624
+ "epoch": 0.3891779396462019,
2625
+ "grad_norm": 0.12253396213054657,
2626
+ "learning_rate": 0.00034833333333333336,
2627
+ "loss": 0.0329,
2628
+ "step": 374
2629
+ },
2630
+ {
2631
+ "epoch": 0.39021852237252863,
2632
+ "grad_norm": 0.17739014327526093,
2633
+ "learning_rate": 0.0003477777777777778,
2634
+ "loss": 0.0386,
2635
+ "step": 375
2636
+ },
2637
+ {
2638
+ "epoch": 0.39125910509885536,
2639
+ "grad_norm": 0.14024539291858673,
2640
+ "learning_rate": 0.00034722222222222224,
2641
+ "loss": 0.0283,
2642
+ "step": 376
2643
+ },
2644
+ {
2645
+ "epoch": 0.3922996878251821,
2646
+ "grad_norm": 0.08809250593185425,
2647
+ "learning_rate": 0.00034666666666666667,
2648
+ "loss": 0.0304,
2649
+ "step": 377
2650
+ },
2651
+ {
2652
+ "epoch": 0.39334027055150883,
2653
+ "grad_norm": 0.21931345760822296,
2654
+ "learning_rate": 0.0003461111111111111,
2655
+ "loss": 0.0563,
2656
+ "step": 378
2657
+ },
2658
+ {
2659
+ "epoch": 0.39438085327783556,
2660
+ "grad_norm": 0.16589802503585815,
2661
+ "learning_rate": 0.00034555555555555555,
2662
+ "loss": 0.0282,
2663
+ "step": 379
2664
+ },
2665
+ {
2666
+ "epoch": 0.39542143600416235,
2667
+ "grad_norm": 0.14240865409374237,
2668
+ "learning_rate": 0.000345,
2669
+ "loss": 0.0344,
2670
+ "step": 380
2671
+ },
2672
+ {
2673
+ "epoch": 0.3964620187304891,
2674
+ "grad_norm": 0.19559325277805328,
2675
+ "learning_rate": 0.0003444444444444445,
2676
+ "loss": 0.0467,
2677
+ "step": 381
2678
+ },
2679
+ {
2680
+ "epoch": 0.3975026014568158,
2681
+ "grad_norm": 0.2773292362689972,
2682
+ "learning_rate": 0.0003438888888888889,
2683
+ "loss": 0.0707,
2684
+ "step": 382
2685
+ },
2686
+ {
2687
+ "epoch": 0.39854318418314255,
2688
+ "grad_norm": 0.14945051074028015,
2689
+ "learning_rate": 0.00034333333333333335,
2690
+ "loss": 0.0405,
2691
+ "step": 383
2692
+ },
2693
+ {
2694
+ "epoch": 0.3995837669094693,
2695
+ "grad_norm": 0.12058687955141068,
2696
+ "learning_rate": 0.0003427777777777778,
2697
+ "loss": 0.0251,
2698
+ "step": 384
2699
+ },
2700
+ {
2701
+ "epoch": 0.4006243496357961,
2702
+ "grad_norm": 0.17662587761878967,
2703
+ "learning_rate": 0.0003422222222222222,
2704
+ "loss": 0.0312,
2705
+ "step": 385
2706
+ },
2707
+ {
2708
+ "epoch": 0.4016649323621228,
2709
+ "grad_norm": 0.1708107441663742,
2710
+ "learning_rate": 0.00034166666666666666,
2711
+ "loss": 0.0361,
2712
+ "step": 386
2713
+ },
2714
+ {
2715
+ "epoch": 0.40270551508844954,
2716
+ "grad_norm": 0.2108927220106125,
2717
+ "learning_rate": 0.0003411111111111111,
2718
+ "loss": 0.0542,
2719
+ "step": 387
2720
+ },
2721
+ {
2722
+ "epoch": 0.4037460978147763,
2723
+ "grad_norm": 0.14585725963115692,
2724
+ "learning_rate": 0.0003405555555555556,
2725
+ "loss": 0.0311,
2726
+ "step": 388
2727
+ },
2728
+ {
2729
+ "epoch": 0.404786680541103,
2730
+ "grad_norm": 0.13707710802555084,
2731
+ "learning_rate": 0.00034,
2732
+ "loss": 0.0422,
2733
+ "step": 389
2734
+ },
2735
+ {
2736
+ "epoch": 0.40582726326742974,
2737
+ "grad_norm": 0.18573620915412903,
2738
+ "learning_rate": 0.00033944444444444446,
2739
+ "loss": 0.0377,
2740
+ "step": 390
2741
+ },
2742
+ {
2743
+ "epoch": 0.4068678459937565,
2744
+ "grad_norm": 0.13296887278556824,
2745
+ "learning_rate": 0.0003388888888888889,
2746
+ "loss": 0.0316,
2747
+ "step": 391
2748
+ },
2749
+ {
2750
+ "epoch": 0.40790842872008326,
2751
+ "grad_norm": 0.1429716795682907,
2752
+ "learning_rate": 0.00033833333333333334,
2753
+ "loss": 0.0397,
2754
+ "step": 392
2755
+ },
2756
+ {
2757
+ "epoch": 0.40894901144641,
2758
+ "grad_norm": 0.1604965329170227,
2759
+ "learning_rate": 0.00033777777777777777,
2760
+ "loss": 0.0434,
2761
+ "step": 393
2762
+ },
2763
+ {
2764
+ "epoch": 0.4099895941727367,
2765
+ "grad_norm": 0.11536327749490738,
2766
+ "learning_rate": 0.0003372222222222222,
2767
+ "loss": 0.0318,
2768
+ "step": 394
2769
+ },
2770
+ {
2771
+ "epoch": 0.41103017689906346,
2772
+ "grad_norm": 0.19248682260513306,
2773
+ "learning_rate": 0.0003366666666666667,
2774
+ "loss": 0.0373,
2775
+ "step": 395
2776
+ },
2777
+ {
2778
+ "epoch": 0.4120707596253902,
2779
+ "grad_norm": 0.13444487750530243,
2780
+ "learning_rate": 0.00033611111111111114,
2781
+ "loss": 0.0409,
2782
+ "step": 396
2783
+ },
2784
+ {
2785
+ "epoch": 0.413111342351717,
2786
+ "grad_norm": 0.12350185215473175,
2787
+ "learning_rate": 0.0003355555555555556,
2788
+ "loss": 0.0328,
2789
+ "step": 397
2790
+ },
2791
+ {
2792
+ "epoch": 0.4141519250780437,
2793
+ "grad_norm": 0.12351303547620773,
2794
+ "learning_rate": 0.000335,
2795
+ "loss": 0.0357,
2796
+ "step": 398
2797
+ },
2798
+ {
2799
+ "epoch": 0.41519250780437045,
2800
+ "grad_norm": 0.16849550604820251,
2801
+ "learning_rate": 0.00033444444444444445,
2802
+ "loss": 0.0266,
2803
+ "step": 399
2804
+ },
2805
+ {
2806
+ "epoch": 0.4162330905306972,
2807
+ "grad_norm": 0.10034651309251785,
2808
+ "learning_rate": 0.0003338888888888889,
2809
+ "loss": 0.0293,
2810
+ "step": 400
2811
+ },
2812
+ {
2813
+ "epoch": 0.4172736732570239,
2814
+ "grad_norm": 0.14957422018051147,
2815
+ "learning_rate": 0.0003333333333333333,
2816
+ "loss": 0.0425,
2817
+ "step": 401
2818
+ },
2819
+ {
2820
+ "epoch": 0.4183142559833507,
2821
+ "grad_norm": 0.1114712730050087,
2822
+ "learning_rate": 0.0003327777777777778,
2823
+ "loss": 0.0352,
2824
+ "step": 402
2825
+ },
2826
+ {
2827
+ "epoch": 0.41935483870967744,
2828
+ "grad_norm": 0.12611107528209686,
2829
+ "learning_rate": 0.0003322222222222222,
2830
+ "loss": 0.0295,
2831
+ "step": 403
2832
+ },
2833
+ {
2834
+ "epoch": 0.42039542143600417,
2835
+ "grad_norm": 0.13259468972682953,
2836
+ "learning_rate": 0.0003316666666666667,
2837
+ "loss": 0.0286,
2838
+ "step": 404
2839
+ },
2840
+ {
2841
+ "epoch": 0.4214360041623309,
2842
+ "grad_norm": 0.11859951168298721,
2843
+ "learning_rate": 0.0003311111111111111,
2844
+ "loss": 0.0344,
2845
+ "step": 405
2846
+ },
2847
+ {
2848
+ "epoch": 0.42247658688865763,
2849
+ "grad_norm": 0.13458934426307678,
2850
+ "learning_rate": 0.00033055555555555556,
2851
+ "loss": 0.0388,
2852
+ "step": 406
2853
+ },
2854
+ {
2855
+ "epoch": 0.42351716961498437,
2856
+ "grad_norm": 0.13809777796268463,
2857
+ "learning_rate": 0.00033,
2858
+ "loss": 0.0364,
2859
+ "step": 407
2860
+ },
2861
+ {
2862
+ "epoch": 0.42455775234131116,
2863
+ "grad_norm": 0.09218713641166687,
2864
+ "learning_rate": 0.00032944444444444444,
2865
+ "loss": 0.0236,
2866
+ "step": 408
2867
+ },
2868
+ {
2869
+ "epoch": 0.4255983350676379,
2870
+ "grad_norm": 0.14193609356880188,
2871
+ "learning_rate": 0.0003288888888888889,
2872
+ "loss": 0.0298,
2873
+ "step": 409
2874
+ },
2875
+ {
2876
+ "epoch": 0.4266389177939646,
2877
+ "grad_norm": 0.12762799859046936,
2878
+ "learning_rate": 0.0003283333333333333,
2879
+ "loss": 0.0339,
2880
+ "step": 410
2881
+ },
2882
+ {
2883
+ "epoch": 0.42767950052029136,
2884
+ "grad_norm": 0.1513296365737915,
2885
+ "learning_rate": 0.0003277777777777778,
2886
+ "loss": 0.0441,
2887
+ "step": 411
2888
+ },
2889
+ {
2890
+ "epoch": 0.4287200832466181,
2891
+ "grad_norm": 0.11212543398141861,
2892
+ "learning_rate": 0.00032722222222222224,
2893
+ "loss": 0.0295,
2894
+ "step": 412
2895
+ },
2896
+ {
2897
+ "epoch": 0.4297606659729448,
2898
+ "grad_norm": 0.14514677226543427,
2899
+ "learning_rate": 0.0003266666666666667,
2900
+ "loss": 0.0355,
2901
+ "step": 413
2902
+ },
2903
+ {
2904
+ "epoch": 0.4308012486992716,
2905
+ "grad_norm": 0.1356545239686966,
2906
+ "learning_rate": 0.0003261111111111111,
2907
+ "loss": 0.0369,
2908
+ "step": 414
2909
+ },
2910
+ {
2911
+ "epoch": 0.43184183142559834,
2912
+ "grad_norm": 0.10390274971723557,
2913
+ "learning_rate": 0.00032555555555555555,
2914
+ "loss": 0.0235,
2915
+ "step": 415
2916
+ },
2917
+ {
2918
+ "epoch": 0.4328824141519251,
2919
+ "grad_norm": 0.13086703419685364,
2920
+ "learning_rate": 0.00032500000000000004,
2921
+ "loss": 0.0351,
2922
+ "step": 416
2923
+ },
2924
+ {
2925
+ "epoch": 0.4339229968782518,
2926
+ "grad_norm": 0.1003120169043541,
2927
+ "learning_rate": 0.0003244444444444444,
2928
+ "loss": 0.0339,
2929
+ "step": 417
2930
+ },
2931
+ {
2932
+ "epoch": 0.43496357960457854,
2933
+ "grad_norm": 0.11209513247013092,
2934
+ "learning_rate": 0.0003238888888888889,
2935
+ "loss": 0.0264,
2936
+ "step": 418
2937
+ },
2938
+ {
2939
+ "epoch": 0.43600416233090533,
2940
+ "grad_norm": 0.17661242187023163,
2941
+ "learning_rate": 0.0003233333333333333,
2942
+ "loss": 0.0446,
2943
+ "step": 419
2944
+ },
2945
+ {
2946
+ "epoch": 0.43704474505723206,
2947
+ "grad_norm": 0.23437397181987762,
2948
+ "learning_rate": 0.0003227777777777778,
2949
+ "loss": 0.0594,
2950
+ "step": 420
2951
+ },
2952
+ {
2953
+ "epoch": 0.4380853277835588,
2954
+ "grad_norm": 0.1441585272550583,
2955
+ "learning_rate": 0.0003222222222222222,
2956
+ "loss": 0.0325,
2957
+ "step": 421
2958
+ },
2959
+ {
2960
+ "epoch": 0.43912591050988553,
2961
+ "grad_norm": 0.17519664764404297,
2962
+ "learning_rate": 0.00032166666666666666,
2963
+ "loss": 0.0298,
2964
+ "step": 422
2965
+ },
2966
+ {
2967
+ "epoch": 0.44016649323621226,
2968
+ "grad_norm": 0.12393476814031601,
2969
+ "learning_rate": 0.00032111111111111115,
2970
+ "loss": 0.0359,
2971
+ "step": 423
2972
+ },
2973
+ {
2974
+ "epoch": 0.441207075962539,
2975
+ "grad_norm": 0.1459573358297348,
2976
+ "learning_rate": 0.00032055555555555554,
2977
+ "loss": 0.0386,
2978
+ "step": 424
2979
+ },
2980
+ {
2981
+ "epoch": 0.4422476586888658,
2982
+ "grad_norm": 0.09201126545667648,
2983
+ "learning_rate": 0.00032,
2984
+ "loss": 0.0308,
2985
+ "step": 425
2986
+ },
2987
+ {
2988
+ "epoch": 0.4432882414151925,
2989
+ "grad_norm": 0.10579176247119904,
2990
+ "learning_rate": 0.0003194444444444444,
2991
+ "loss": 0.0268,
2992
+ "step": 426
2993
+ },
2994
+ {
2995
+ "epoch": 0.44432882414151925,
2996
+ "grad_norm": 0.148898184299469,
2997
+ "learning_rate": 0.0003188888888888889,
2998
+ "loss": 0.0311,
2999
+ "step": 427
3000
+ },
3001
+ {
3002
+ "epoch": 0.445369406867846,
3003
+ "grad_norm": 0.12894581258296967,
3004
+ "learning_rate": 0.00031833333333333334,
3005
+ "loss": 0.0346,
3006
+ "step": 428
3007
+ },
3008
+ {
3009
+ "epoch": 0.4464099895941727,
3010
+ "grad_norm": 0.13777734339237213,
3011
+ "learning_rate": 0.0003177777777777778,
3012
+ "loss": 0.0381,
3013
+ "step": 429
3014
+ },
3015
+ {
3016
+ "epoch": 0.4474505723204995,
3017
+ "grad_norm": 0.08925038576126099,
3018
+ "learning_rate": 0.00031722222222222227,
3019
+ "loss": 0.028,
3020
+ "step": 430
3021
+ },
3022
+ {
3023
+ "epoch": 0.44849115504682624,
3024
+ "grad_norm": 0.13310398161411285,
3025
+ "learning_rate": 0.00031666666666666665,
3026
+ "loss": 0.0381,
3027
+ "step": 431
3028
+ },
3029
+ {
3030
+ "epoch": 0.449531737773153,
3031
+ "grad_norm": 0.11413469910621643,
3032
+ "learning_rate": 0.00031611111111111114,
3033
+ "loss": 0.03,
3034
+ "step": 432
3035
+ },
3036
+ {
3037
+ "epoch": 0.4505723204994797,
3038
+ "grad_norm": 0.12046143412590027,
3039
+ "learning_rate": 0.0003155555555555555,
3040
+ "loss": 0.0427,
3041
+ "step": 433
3042
+ },
3043
+ {
3044
+ "epoch": 0.45161290322580644,
3045
+ "grad_norm": 0.10713426768779755,
3046
+ "learning_rate": 0.000315,
3047
+ "loss": 0.0336,
3048
+ "step": 434
3049
+ },
3050
+ {
3051
+ "epoch": 0.45265348595213317,
3052
+ "grad_norm": 0.09529422223567963,
3053
+ "learning_rate": 0.0003144444444444445,
3054
+ "loss": 0.0241,
3055
+ "step": 435
3056
+ },
3057
+ {
3058
+ "epoch": 0.45369406867845996,
3059
+ "grad_norm": 0.11491887271404266,
3060
+ "learning_rate": 0.0003138888888888889,
3061
+ "loss": 0.0329,
3062
+ "step": 436
3063
+ },
3064
+ {
3065
+ "epoch": 0.4547346514047867,
3066
+ "grad_norm": 0.11572989821434021,
3067
+ "learning_rate": 0.0003133333333333334,
3068
+ "loss": 0.0345,
3069
+ "step": 437
3070
+ },
3071
+ {
3072
+ "epoch": 0.4557752341311134,
3073
+ "grad_norm": 0.12939798831939697,
3074
+ "learning_rate": 0.00031277777777777776,
3075
+ "loss": 0.0332,
3076
+ "step": 438
3077
+ },
3078
+ {
3079
+ "epoch": 0.45681581685744016,
3080
+ "grad_norm": 0.19764038920402527,
3081
+ "learning_rate": 0.00031222222222222225,
3082
+ "loss": 0.0346,
3083
+ "step": 439
3084
+ },
3085
+ {
3086
+ "epoch": 0.4578563995837669,
3087
+ "grad_norm": 0.14365462958812714,
3088
+ "learning_rate": 0.00031166666666666663,
3089
+ "loss": 0.0379,
3090
+ "step": 440
3091
+ },
3092
+ {
3093
+ "epoch": 0.4588969823100936,
3094
+ "grad_norm": 0.12927298247814178,
3095
+ "learning_rate": 0.0003111111111111111,
3096
+ "loss": 0.0287,
3097
+ "step": 441
3098
+ },
3099
+ {
3100
+ "epoch": 0.4599375650364204,
3101
+ "grad_norm": 0.12843161821365356,
3102
+ "learning_rate": 0.0003105555555555555,
3103
+ "loss": 0.0289,
3104
+ "step": 442
3105
+ },
3106
+ {
3107
+ "epoch": 0.46097814776274715,
3108
+ "grad_norm": 0.12266694754362106,
3109
+ "learning_rate": 0.00031,
3110
+ "loss": 0.0297,
3111
+ "step": 443
3112
+ },
3113
+ {
3114
+ "epoch": 0.4620187304890739,
3115
+ "grad_norm": 0.12433566153049469,
3116
+ "learning_rate": 0.0003094444444444445,
3117
+ "loss": 0.0249,
3118
+ "step": 444
3119
+ },
3120
+ {
3121
+ "epoch": 0.4630593132154006,
3122
+ "grad_norm": 0.1348317265510559,
3123
+ "learning_rate": 0.0003088888888888889,
3124
+ "loss": 0.0311,
3125
+ "step": 445
3126
+ },
3127
+ {
3128
+ "epoch": 0.46409989594172735,
3129
+ "grad_norm": 0.1345110535621643,
3130
+ "learning_rate": 0.00030833333333333337,
3131
+ "loss": 0.0354,
3132
+ "step": 446
3133
+ },
3134
+ {
3135
+ "epoch": 0.46514047866805414,
3136
+ "grad_norm": 0.09218961000442505,
3137
+ "learning_rate": 0.00030777777777777775,
3138
+ "loss": 0.0249,
3139
+ "step": 447
3140
+ },
3141
+ {
3142
+ "epoch": 0.46618106139438087,
3143
+ "grad_norm": 0.15081824362277985,
3144
+ "learning_rate": 0.00030722222222222224,
3145
+ "loss": 0.0428,
3146
+ "step": 448
3147
+ },
3148
+ {
3149
+ "epoch": 0.4672216441207076,
3150
+ "grad_norm": 0.11748257279396057,
3151
+ "learning_rate": 0.0003066666666666667,
3152
+ "loss": 0.037,
3153
+ "step": 449
3154
+ },
3155
+ {
3156
+ "epoch": 0.46826222684703434,
3157
+ "grad_norm": 0.1960999071598053,
3158
+ "learning_rate": 0.0003061111111111111,
3159
+ "loss": 0.051,
3160
+ "step": 450
3161
+ },
3162
+ {
3163
+ "epoch": 0.46930280957336107,
3164
+ "grad_norm": 0.12845076620578766,
3165
+ "learning_rate": 0.0003055555555555556,
3166
+ "loss": 0.0323,
3167
+ "step": 451
3168
+ },
3169
+ {
3170
+ "epoch": 0.4703433922996878,
3171
+ "grad_norm": 0.12757262587547302,
3172
+ "learning_rate": 0.000305,
3173
+ "loss": 0.0487,
3174
+ "step": 452
3175
+ },
3176
+ {
3177
+ "epoch": 0.4713839750260146,
3178
+ "grad_norm": 0.18625207245349884,
3179
+ "learning_rate": 0.0003044444444444445,
3180
+ "loss": 0.0301,
3181
+ "step": 453
3182
+ },
3183
+ {
3184
+ "epoch": 0.4724245577523413,
3185
+ "grad_norm": 0.18307316303253174,
3186
+ "learning_rate": 0.00030388888888888886,
3187
+ "loss": 0.0355,
3188
+ "step": 454
3189
+ },
3190
+ {
3191
+ "epoch": 0.47346514047866806,
3192
+ "grad_norm": 0.12024041265249252,
3193
+ "learning_rate": 0.00030333333333333335,
3194
+ "loss": 0.0384,
3195
+ "step": 455
3196
+ },
3197
+ {
3198
+ "epoch": 0.4745057232049948,
3199
+ "grad_norm": 0.1274184286594391,
3200
+ "learning_rate": 0.0003027777777777778,
3201
+ "loss": 0.036,
3202
+ "step": 456
3203
+ },
3204
+ {
3205
+ "epoch": 0.4755463059313215,
3206
+ "grad_norm": 0.11767745018005371,
3207
+ "learning_rate": 0.0003022222222222222,
3208
+ "loss": 0.0239,
3209
+ "step": 457
3210
+ },
3211
+ {
3212
+ "epoch": 0.47658688865764826,
3213
+ "grad_norm": 0.10346122086048126,
3214
+ "learning_rate": 0.0003016666666666667,
3215
+ "loss": 0.0357,
3216
+ "step": 458
3217
+ },
3218
+ {
3219
+ "epoch": 0.47762747138397504,
3220
+ "grad_norm": 0.15750320255756378,
3221
+ "learning_rate": 0.0003011111111111111,
3222
+ "loss": 0.0427,
3223
+ "step": 459
3224
+ },
3225
+ {
3226
+ "epoch": 0.4786680541103018,
3227
+ "grad_norm": 0.12909509241580963,
3228
+ "learning_rate": 0.0003005555555555556,
3229
+ "loss": 0.0192,
3230
+ "step": 460
3231
+ },
3232
+ {
3233
+ "epoch": 0.4797086368366285,
3234
+ "grad_norm": 0.14776866137981415,
3235
+ "learning_rate": 0.0003,
3236
+ "loss": 0.0343,
3237
+ "step": 461
3238
+ },
3239
+ {
3240
+ "epoch": 0.48074921956295524,
3241
+ "grad_norm": 0.13104130327701569,
3242
+ "learning_rate": 0.00029944444444444446,
3243
+ "loss": 0.0309,
3244
+ "step": 462
3245
+ },
3246
+ {
3247
+ "epoch": 0.481789802289282,
3248
+ "grad_norm": 0.1027032732963562,
3249
+ "learning_rate": 0.0002988888888888889,
3250
+ "loss": 0.0356,
3251
+ "step": 463
3252
+ },
3253
+ {
3254
+ "epoch": 0.48283038501560877,
3255
+ "grad_norm": 0.11130186170339584,
3256
+ "learning_rate": 0.00029833333333333334,
3257
+ "loss": 0.039,
3258
+ "step": 464
3259
+ },
3260
+ {
3261
+ "epoch": 0.4838709677419355,
3262
+ "grad_norm": 0.09622237086296082,
3263
+ "learning_rate": 0.0002977777777777778,
3264
+ "loss": 0.0254,
3265
+ "step": 465
3266
+ },
3267
+ {
3268
+ "epoch": 0.48491155046826223,
3269
+ "grad_norm": 0.11083600670099258,
3270
+ "learning_rate": 0.0002972222222222222,
3271
+ "loss": 0.0248,
3272
+ "step": 466
3273
+ },
3274
+ {
3275
+ "epoch": 0.48595213319458896,
3276
+ "grad_norm": 0.1895148605108261,
3277
+ "learning_rate": 0.0002966666666666667,
3278
+ "loss": 0.0388,
3279
+ "step": 467
3280
+ },
3281
+ {
3282
+ "epoch": 0.4869927159209157,
3283
+ "grad_norm": 0.14607883989810944,
3284
+ "learning_rate": 0.0002961111111111111,
3285
+ "loss": 0.0277,
3286
+ "step": 468
3287
+ },
3288
+ {
3289
+ "epoch": 0.48803329864724243,
3290
+ "grad_norm": 0.09221769124269485,
3291
+ "learning_rate": 0.0002955555555555556,
3292
+ "loss": 0.0195,
3293
+ "step": 469
3294
+ },
3295
+ {
3296
+ "epoch": 0.4890738813735692,
3297
+ "grad_norm": 0.12375712394714355,
3298
+ "learning_rate": 0.000295,
3299
+ "loss": 0.0235,
3300
+ "step": 470
3301
+ },
3302
+ {
3303
+ "epoch": 0.49011446409989595,
3304
+ "grad_norm": 0.14334923028945923,
3305
+ "learning_rate": 0.00029444444444444445,
3306
+ "loss": 0.0328,
3307
+ "step": 471
3308
+ },
3309
+ {
3310
+ "epoch": 0.4911550468262227,
3311
+ "grad_norm": 0.15130150318145752,
3312
+ "learning_rate": 0.0002938888888888889,
3313
+ "loss": 0.0401,
3314
+ "step": 472
3315
+ },
3316
+ {
3317
+ "epoch": 0.4921956295525494,
3318
+ "grad_norm": 0.13768820464611053,
3319
+ "learning_rate": 0.0002933333333333333,
3320
+ "loss": 0.0296,
3321
+ "step": 473
3322
+ },
3323
+ {
3324
+ "epoch": 0.49323621227887615,
3325
+ "grad_norm": 0.194923534989357,
3326
+ "learning_rate": 0.0002927777777777778,
3327
+ "loss": 0.0375,
3328
+ "step": 474
3329
+ },
3330
+ {
3331
+ "epoch": 0.49427679500520294,
3332
+ "grad_norm": 0.12720853090286255,
3333
+ "learning_rate": 0.0002922222222222222,
3334
+ "loss": 0.024,
3335
+ "step": 475
3336
+ },
3337
+ {
3338
+ "epoch": 0.4953173777315297,
3339
+ "grad_norm": 0.10007695853710175,
3340
+ "learning_rate": 0.0002916666666666667,
3341
+ "loss": 0.0314,
3342
+ "step": 476
3343
+ },
3344
+ {
3345
+ "epoch": 0.4963579604578564,
3346
+ "grad_norm": 0.10536729544401169,
3347
+ "learning_rate": 0.00029111111111111113,
3348
+ "loss": 0.0296,
3349
+ "step": 477
3350
+ },
3351
+ {
3352
+ "epoch": 0.49739854318418314,
3353
+ "grad_norm": 0.14973285794258118,
3354
+ "learning_rate": 0.00029055555555555556,
3355
+ "loss": 0.0305,
3356
+ "step": 478
3357
+ },
3358
+ {
3359
+ "epoch": 0.4984391259105099,
3360
+ "grad_norm": 0.1162821501493454,
3361
+ "learning_rate": 0.00029,
3362
+ "loss": 0.0405,
3363
+ "step": 479
3364
+ },
3365
+ {
3366
+ "epoch": 0.4994797086368366,
3367
+ "grad_norm": 0.11506082862615585,
3368
+ "learning_rate": 0.00028944444444444444,
3369
+ "loss": 0.0271,
3370
+ "step": 480
3371
+ },
3372
+ {
3373
+ "epoch": 0.5005202913631633,
3374
+ "grad_norm": 0.14310665428638458,
3375
+ "learning_rate": 0.0002888888888888889,
3376
+ "loss": 0.0358,
3377
+ "step": 481
3378
+ },
3379
+ {
3380
+ "epoch": 0.5015608740894901,
3381
+ "grad_norm": 0.1785290539264679,
3382
+ "learning_rate": 0.0002883333333333333,
3383
+ "loss": 0.0409,
3384
+ "step": 482
3385
+ },
3386
+ {
3387
+ "epoch": 0.5026014568158168,
3388
+ "grad_norm": 0.17906583845615387,
3389
+ "learning_rate": 0.0002877777777777778,
3390
+ "loss": 0.0353,
3391
+ "step": 483
3392
+ },
3393
+ {
3394
+ "epoch": 0.5036420395421436,
3395
+ "grad_norm": 0.13935832679271698,
3396
+ "learning_rate": 0.00028722222222222224,
3397
+ "loss": 0.022,
3398
+ "step": 484
3399
+ },
3400
+ {
3401
+ "epoch": 0.5046826222684704,
3402
+ "grad_norm": 0.10252871364355087,
3403
+ "learning_rate": 0.0002866666666666667,
3404
+ "loss": 0.0269,
3405
+ "step": 485
3406
+ },
3407
+ {
3408
+ "epoch": 0.5057232049947971,
3409
+ "grad_norm": 0.15208114683628082,
3410
+ "learning_rate": 0.0002861111111111111,
3411
+ "loss": 0.0386,
3412
+ "step": 486
3413
+ },
3414
+ {
3415
+ "epoch": 0.5067637877211238,
3416
+ "grad_norm": 0.10026312619447708,
3417
+ "learning_rate": 0.00028555555555555555,
3418
+ "loss": 0.0265,
3419
+ "step": 487
3420
+ },
3421
+ {
3422
+ "epoch": 0.5078043704474505,
3423
+ "grad_norm": 0.14320847392082214,
3424
+ "learning_rate": 0.000285,
3425
+ "loss": 0.0254,
3426
+ "step": 488
3427
+ },
3428
+ {
3429
+ "epoch": 0.5088449531737773,
3430
+ "grad_norm": 0.11394159495830536,
3431
+ "learning_rate": 0.0002844444444444444,
3432
+ "loss": 0.0295,
3433
+ "step": 489
3434
+ },
3435
+ {
3436
+ "epoch": 0.5098855359001041,
3437
+ "grad_norm": 0.13264909386634827,
3438
+ "learning_rate": 0.0002838888888888889,
3439
+ "loss": 0.0342,
3440
+ "step": 490
3441
+ },
3442
+ {
3443
+ "epoch": 0.5109261186264308,
3444
+ "grad_norm": 0.08985685557126999,
3445
+ "learning_rate": 0.00028333333333333335,
3446
+ "loss": 0.0252,
3447
+ "step": 491
3448
+ },
3449
+ {
3450
+ "epoch": 0.5119667013527576,
3451
+ "grad_norm": 0.07926324754953384,
3452
+ "learning_rate": 0.0002827777777777778,
3453
+ "loss": 0.0217,
3454
+ "step": 492
3455
+ },
3456
+ {
3457
+ "epoch": 0.5130072840790842,
3458
+ "grad_norm": 0.1059025451540947,
3459
+ "learning_rate": 0.00028222222222222223,
3460
+ "loss": 0.0218,
3461
+ "step": 493
3462
+ },
3463
+ {
3464
+ "epoch": 0.514047866805411,
3465
+ "grad_norm": 0.09140279144048691,
3466
+ "learning_rate": 0.00028166666666666666,
3467
+ "loss": 0.0242,
3468
+ "step": 494
3469
+ },
3470
+ {
3471
+ "epoch": 0.5150884495317378,
3472
+ "grad_norm": 0.0896432101726532,
3473
+ "learning_rate": 0.0002811111111111111,
3474
+ "loss": 0.0232,
3475
+ "step": 495
3476
+ },
3477
+ {
3478
+ "epoch": 0.5161290322580645,
3479
+ "grad_norm": 0.10562644153833389,
3480
+ "learning_rate": 0.00028055555555555554,
3481
+ "loss": 0.0295,
3482
+ "step": 496
3483
+ },
3484
+ {
3485
+ "epoch": 0.5171696149843913,
3486
+ "grad_norm": 0.09908954054117203,
3487
+ "learning_rate": 0.00028000000000000003,
3488
+ "loss": 0.0324,
3489
+ "step": 497
3490
+ },
3491
+ {
3492
+ "epoch": 0.518210197710718,
3493
+ "grad_norm": 0.1016746237874031,
3494
+ "learning_rate": 0.00027944444444444447,
3495
+ "loss": 0.0236,
3496
+ "step": 498
3497
+ },
3498
+ {
3499
+ "epoch": 0.5192507804370448,
3500
+ "grad_norm": 0.13807839155197144,
3501
+ "learning_rate": 0.0002788888888888889,
3502
+ "loss": 0.0377,
3503
+ "step": 499
3504
+ },
3505
+ {
3506
+ "epoch": 0.5202913631633714,
3507
+ "grad_norm": 0.14611020684242249,
3508
+ "learning_rate": 0.00027833333333333334,
3509
+ "loss": 0.0337,
3510
+ "step": 500
3511
+ }
3512
+ ],
3513
+ "logging_steps": 1,
3514
+ "max_steps": 1000,
3515
+ "num_input_tokens_seen": 0,
3516
+ "num_train_epochs": 2,
3517
+ "save_steps": 100,
3518
+ "stateful_callbacks": {
3519
+ "TrainerControl": {
3520
+ "args": {
3521
+ "should_epoch_stop": false,
3522
+ "should_evaluate": false,
3523
+ "should_log": false,
3524
+ "should_save": true,
3525
+ "should_training_stop": false
3526
+ },
3527
+ "attributes": {}
3528
+ }
3529
+ },
3530
+ "total_flos": 0.0,
3531
+ "train_batch_size": 256,
3532
+ "trial_name": null,
3533
+ "trial_params": null
3534
+ }
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/train_cls.log ADDED
The diff for this file is too large to render. See raw diff
 
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/wandb/debug-internal.log ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {"time":"2025-12-08T15:56:05.410578123Z","level":"INFO","msg":"stream: starting","core version":"0.22.2"}
2
+ {"time":"2025-12-08T15:56:05.59298929Z","level":"INFO","msg":"stream: created new stream","id":"ooq67cso"}
3
+ {"time":"2025-12-08T15:56:05.593102261Z","level":"INFO","msg":"handler: started","stream_id":"ooq67cso"}
4
+ {"time":"2025-12-08T15:56:05.593163436Z","level":"INFO","msg":"stream: started","id":"ooq67cso"}
5
+ {"time":"2025-12-08T15:56:05.593200284Z","level":"INFO","msg":"writer: started","stream_id":"ooq67cso"}
6
+ {"time":"2025-12-08T15:56:05.593218469Z","level":"INFO","msg":"sender: started","stream_id":"ooq67cso"}
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/wandb/debug.log ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_setup.py:_flush():81] Current SDK version is 0.22.2
2
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_setup.py:_flush():81] Configure stats pid to 575516
3
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_setup.py:_flush():81] Loading settings from /home/v-menggao/.config/wandb/settings
4
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_setup.py:_flush():81] Loading settings from /home/v-menggao/code/VLM2Vec/wandb/settings
5
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_setup.py:_flush():81] Loading settings from environment variables
6
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_init.py:setup_run_log_directory():705] Logging user logs to /home/v-menggao/code/VLM2Vec/experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/wandb/run-20251208_155605-ooq67cso/logs/debug.log
7
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_init.py:setup_run_log_directory():706] Logging internal logs to /home/v-menggao/code/VLM2Vec/experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/wandb/run-20251208_155605-ooq67cso/logs/debug-internal.log
8
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_init.py:init():832] calling init triggers
9
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_init.py:init():837] wandb.init called with sweep_config: {}
10
+ config: {'_wandb': {}}
11
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_init.py:init():880] starting backend
12
+ 2025-12-08 15:56:05,404 INFO MainThread:575516 [wandb_init.py:init():883] sending inform_init request
13
+ 2025-12-08 15:56:05,409 INFO MainThread:575516 [wandb_init.py:init():891] backend started and connected
14
+ 2025-12-08 15:56:05,410 INFO MainThread:575516 [wandb_init.py:init():961] updated telemetry
15
+ 2025-12-08 15:56:05,415 INFO MainThread:575516 [wandb_init.py:init():985] communicating run to backend with 90.0 second timeout
16
+ 2025-12-08 15:56:05,834 INFO MainThread:575516 [wandb_init.py:init():1036] starting run threads in backend
17
+ 2025-12-08 15:56:05,938 INFO MainThread:575516 [wandb_run.py:_console_start():2509] atexit reg
18
+ 2025-12-08 15:56:05,938 INFO MainThread:575516 [wandb_run.py:_redirect():2357] redirect: wrap_raw
19
+ 2025-12-08 15:56:05,938 INFO MainThread:575516 [wandb_run.py:_redirect():2426] Wrapping output streams.
20
+ 2025-12-08 15:56:05,938 INFO MainThread:575516 [wandb_run.py:_redirect():2449] Redirects installed.
21
+ 2025-12-08 15:56:05,941 INFO MainThread:575516 [wandb_init.py:init():1076] run started, returning control to user process
22
+ 2025-12-08 15:56:05,942 INFO MainThread:575516 [wandb_run.py:_config_callback():1392] config_cb None None {'output_dir': '/home/v-menggao/code/VLM2Vec/experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': False, 'do_predict': False, 'eval_strategy': 'no', 'prediction_loss_only': False, 'per_device_train_batch_size': 256, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 0.0005, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 1, 'max_steps': 1000, 'lr_scheduler_type': 'linear', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.0, 'warmup_steps': 100, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/home/v-menggao/code/VLM2Vec/experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/runs/Dec08_15-53-18_GCRAZGDL1688', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 1, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 100, 'save_total_limit': None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': True, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': True, 'eval_steps': None, 'dataloader_num_workers': 1, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': 'Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'ddp_find_unused_parameters': True, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': None, 'hub_always_push': False, 'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'eval_use_gather_object': False, 'average_tokens_across_devices': False, 'image_encoder_freeze': False, 'resume_from': 'none', 'project_name': None, 'grad_cache': False, 'gc_q_chunk_size': 2, 'gc_p_chunk_size': 2, 'interleave_stopping_strategy': 'all_exhausted', 'interleave_batch_size': 0}
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/wandb/run-20251208_155605-ooq67cso/logs/debug-internal.log ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {"time":"2025-12-08T15:56:05.410578123Z","level":"INFO","msg":"stream: starting","core version":"0.22.2"}
2
+ {"time":"2025-12-08T15:56:05.59298929Z","level":"INFO","msg":"stream: created new stream","id":"ooq67cso"}
3
+ {"time":"2025-12-08T15:56:05.593102261Z","level":"INFO","msg":"handler: started","stream_id":"ooq67cso"}
4
+ {"time":"2025-12-08T15:56:05.593163436Z","level":"INFO","msg":"stream: started","id":"ooq67cso"}
5
+ {"time":"2025-12-08T15:56:05.593200284Z","level":"INFO","msg":"writer: started","stream_id":"ooq67cso"}
6
+ {"time":"2025-12-08T15:56:05.593218469Z","level":"INFO","msg":"sender: started","stream_id":"ooq67cso"}
experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/wandb/run-20251208_155605-ooq67cso/logs/debug.log ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_setup.py:_flush():81] Current SDK version is 0.22.2
2
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_setup.py:_flush():81] Configure stats pid to 575516
3
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_setup.py:_flush():81] Loading settings from /home/v-menggao/.config/wandb/settings
4
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_setup.py:_flush():81] Loading settings from /home/v-menggao/code/VLM2Vec/wandb/settings
5
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_setup.py:_flush():81] Loading settings from environment variables
6
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_init.py:setup_run_log_directory():705] Logging user logs to /home/v-menggao/code/VLM2Vec/experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/wandb/run-20251208_155605-ooq67cso/logs/debug.log
7
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_init.py:setup_run_log_directory():706] Logging internal logs to /home/v-menggao/code/VLM2Vec/experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/wandb/run-20251208_155605-ooq67cso/logs/debug-internal.log
8
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_init.py:init():832] calling init triggers
9
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_init.py:init():837] wandb.init called with sweep_config: {}
10
+ config: {'_wandb': {}}
11
+ 2025-12-08 15:56:05,198 INFO MainThread:575516 [wandb_init.py:init():880] starting backend
12
+ 2025-12-08 15:56:05,404 INFO MainThread:575516 [wandb_init.py:init():883] sending inform_init request
13
+ 2025-12-08 15:56:05,409 INFO MainThread:575516 [wandb_init.py:init():891] backend started and connected
14
+ 2025-12-08 15:56:05,410 INFO MainThread:575516 [wandb_init.py:init():961] updated telemetry
15
+ 2025-12-08 15:56:05,415 INFO MainThread:575516 [wandb_init.py:init():985] communicating run to backend with 90.0 second timeout
16
+ 2025-12-08 15:56:05,834 INFO MainThread:575516 [wandb_init.py:init():1036] starting run threads in backend
17
+ 2025-12-08 15:56:05,938 INFO MainThread:575516 [wandb_run.py:_console_start():2509] atexit reg
18
+ 2025-12-08 15:56:05,938 INFO MainThread:575516 [wandb_run.py:_redirect():2357] redirect: wrap_raw
19
+ 2025-12-08 15:56:05,938 INFO MainThread:575516 [wandb_run.py:_redirect():2426] Wrapping output streams.
20
+ 2025-12-08 15:56:05,938 INFO MainThread:575516 [wandb_run.py:_redirect():2449] Redirects installed.
21
+ 2025-12-08 15:56:05,941 INFO MainThread:575516 [wandb_init.py:init():1076] run started, returning control to user process
22
+ 2025-12-08 15:56:05,942 INFO MainThread:575516 [wandb_run.py:_config_callback():1392] config_cb None None {'output_dir': '/home/v-menggao/code/VLM2Vec/experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': False, 'do_predict': False, 'eval_strategy': 'no', 'prediction_loss_only': False, 'per_device_train_batch_size': 256, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 0.0005, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 1, 'max_steps': 1000, 'lr_scheduler_type': 'linear', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.0, 'warmup_steps': 100, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/home/v-menggao/code/VLM2Vec/experiments/Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret/runs/Dec08_15-53-18_GCRAZGDL1688', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 1, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 100, 'save_total_limit': None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': True, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': True, 'eval_steps': None, 'dataloader_num_workers': 1, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': 'Qwen2_5vl_3B_add_distill_0.2_0.6_11_23_Classifier_Layer12_ImgText_V5_i_ret', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'ddp_find_unused_parameters': True, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': None, 'hub_always_push': False, 'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'eval_use_gather_object': False, 'average_tokens_across_devices': False, 'image_encoder_freeze': False, 'resume_from': 'none', 'project_name': None, 'grad_cache': False, 'gc_q_chunk_size': 2, 'gc_p_chunk_size': 2, 'interleave_stopping_strategy': 'all_exhausted', 'interleave_batch_size': 0}
experiments/public/all_scores/LamRA-Ret.json ADDED
@@ -0,0 +1,2198 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "metadata": {
3
+ "model_name": "LamRA-Ret",
4
+ "report_generated_date": "2025-06-28T08:54:18.459213"
5
+ },
6
+ "metrics": {
7
+ "image": {
8
+ "ImageNet-1K": {
9
+ "hit@1": 0.723,
10
+ "hit@5": 0.91,
11
+ "hit@10": 0.944,
12
+ "ndcg_linear@1": 0.723,
13
+ "ndcg_linear@5": 0.8268476572075378,
14
+ "ndcg_linear@10": 0.8378788241843189,
15
+ "ndcg_exponential@1": 0.723,
16
+ "ndcg_exponential@5": 0.8268476572075378,
17
+ "ndcg_exponential@10": 0.8378788241843189,
18
+ "precision@1": 0.723,
19
+ "precision@5": 0.18200000000000002,
20
+ "precision@10": 0.09440000000000001,
21
+ "recall@1": 0.723,
22
+ "recall@5": 0.91,
23
+ "recall@10": 0.944,
24
+ "f1@1": 0.723,
25
+ "f1@5": 0.30333333333333334,
26
+ "f1@10": 0.17163636363636361,
27
+ "map@1": 0.723,
28
+ "map@5": 0.7987666666666666,
29
+ "map@10": 0.8033428571428571,
30
+ "mrr@1": 0.723,
31
+ "mrr@5": 0.7987666666666666,
32
+ "mrr@10": 0.8033428571428571,
33
+ "num_pred": 1000,
34
+ "num_data": 1000
35
+ },
36
+ "N24News": {
37
+ "hit@1": 0.513,
38
+ "hit@5": 0.804,
39
+ "hit@10": 0.929,
40
+ "ndcg_linear@1": 0.513,
41
+ "ndcg_linear@5": 0.6693842522947794,
42
+ "ndcg_linear@10": 0.7099458858472819,
43
+ "ndcg_exponential@1": 0.513,
44
+ "ndcg_exponential@5": 0.6693842522947794,
45
+ "ndcg_exponential@10": 0.7099458858472819,
46
+ "precision@1": 0.513,
47
+ "precision@5": 0.1608,
48
+ "precision@10": 0.09290000000000001,
49
+ "recall@1": 0.513,
50
+ "recall@5": 0.804,
51
+ "recall@10": 0.929,
52
+ "f1@1": 0.513,
53
+ "f1@5": 0.268,
54
+ "f1@10": 0.1689090909090909,
55
+ "map@1": 0.513,
56
+ "map@5": 0.6244166666666666,
57
+ "map@10": 0.641238492063492,
58
+ "mrr@1": 0.513,
59
+ "mrr@5": 0.6244166666666666,
60
+ "mrr@10": 0.641238492063492,
61
+ "num_pred": 1000,
62
+ "num_data": 1000
63
+ },
64
+ "HatefulMemes": {
65
+ "hit@1": 0.49,
66
+ "hit@5": 1.0,
67
+ "hit@10": 1.0,
68
+ "ndcg_linear@1": 0.49,
69
+ "ndcg_linear@5": 0.8117741743214435,
70
+ "ndcg_linear@10": 0.8117741743214435,
71
+ "ndcg_exponential@1": 0.49,
72
+ "ndcg_exponential@5": 0.8117741743214435,
73
+ "ndcg_exponential@10": 0.8117741743214435,
74
+ "precision@1": 0.49,
75
+ "precision@5": 0.20000000000000004,
76
+ "precision@10": 0.10000000000000002,
77
+ "recall@1": 0.49,
78
+ "recall@5": 1.0,
79
+ "recall@10": 1.0,
80
+ "f1@1": 0.49,
81
+ "f1@5": 0.3333333333333333,
82
+ "f1@10": 0.18181818181818182,
83
+ "map@1": 0.49,
84
+ "map@5": 0.745,
85
+ "map@10": 0.745,
86
+ "mrr@1": 0.49,
87
+ "mrr@5": 0.745,
88
+ "mrr@10": 0.745,
89
+ "num_pred": 1000,
90
+ "num_data": 1000
91
+ },
92
+ "VOC2007": {
93
+ "hit@1": 0.801,
94
+ "hit@5": 0.976,
95
+ "hit@10": 0.992,
96
+ "ndcg_linear@1": 0.801,
97
+ "ndcg_linear@5": 0.9010597839851336,
98
+ "ndcg_linear@10": 0.9062744300991276,
99
+ "ndcg_exponential@1": 0.801,
100
+ "ndcg_exponential@5": 0.9010597839851336,
101
+ "ndcg_exponential@10": 0.9062744300991276,
102
+ "precision@1": 0.801,
103
+ "precision@5": 0.1952,
104
+ "precision@10": 0.09920000000000001,
105
+ "recall@1": 0.801,
106
+ "recall@5": 0.976,
107
+ "recall@10": 0.992,
108
+ "f1@1": 0.801,
109
+ "f1@5": 0.32533333333333336,
110
+ "f1@10": 0.18036363636363634,
111
+ "map@1": 0.801,
112
+ "map@5": 0.8754666666666667,
113
+ "map@10": 0.877640873015873,
114
+ "mrr@1": 0.801,
115
+ "mrr@5": 0.8754666666666667,
116
+ "mrr@10": 0.877640873015873,
117
+ "num_pred": 1000,
118
+ "num_data": 1000
119
+ },
120
+ "SUN397": {
121
+ "hit@1": 0.685,
122
+ "hit@5": 0.928,
123
+ "hit@10": 0.957,
124
+ "ndcg_linear@1": 0.685,
125
+ "ndcg_linear@5": 0.8224140927675592,
126
+ "ndcg_linear@10": 0.8318463032340889,
127
+ "ndcg_exponential@1": 0.685,
128
+ "ndcg_exponential@5": 0.8224140927675592,
129
+ "ndcg_exponential@10": 0.8318463032340889,
130
+ "precision@1": 0.685,
131
+ "precision@5": 0.18560000000000001,
132
+ "precision@10": 0.09570000000000002,
133
+ "recall@1": 0.685,
134
+ "recall@5": 0.928,
135
+ "recall@10": 0.957,
136
+ "f1@1": 0.685,
137
+ "f1@5": 0.30933333333333335,
138
+ "f1@10": 0.174,
139
+ "map@1": 0.685,
140
+ "map@5": 0.7865500000000001,
141
+ "map@10": 0.7904702380952381,
142
+ "mrr@1": 0.685,
143
+ "mrr@5": 0.7865500000000001,
144
+ "mrr@10": 0.7904702380952381,
145
+ "num_pred": 1000,
146
+ "num_data": 1000
147
+ },
148
+ "Place365": {
149
+ "hit@1": 0.406,
150
+ "hit@5": 0.684,
151
+ "hit@10": 0.787,
152
+ "ndcg_linear@1": 0.406,
153
+ "ndcg_linear@5": 0.5555467482483895,
154
+ "ndcg_linear@10": 0.5889145891921053,
155
+ "ndcg_exponential@1": 0.406,
156
+ "ndcg_exponential@5": 0.5555467482483895,
157
+ "ndcg_exponential@10": 0.5889145891921053,
158
+ "precision@1": 0.406,
159
+ "precision@5": 0.1368,
160
+ "precision@10": 0.0787,
161
+ "recall@1": 0.406,
162
+ "recall@5": 0.684,
163
+ "recall@10": 0.787,
164
+ "f1@1": 0.406,
165
+ "f1@5": 0.22800000000000006,
166
+ "f1@10": 0.1430909090909091,
167
+ "map@1": 0.406,
168
+ "map@5": 0.5126499999999999,
169
+ "map@10": 0.5264646825396826,
170
+ "mrr@1": 0.406,
171
+ "mrr@5": 0.5126499999999999,
172
+ "mrr@10": 0.5264646825396826,
173
+ "num_pred": 1000,
174
+ "num_data": 1000
175
+ },
176
+ "ImageNet-A": {
177
+ "hit@1": 0.47,
178
+ "hit@5": 0.683,
179
+ "hit@10": 0.776,
180
+ "ndcg_linear@1": 0.47,
181
+ "ndcg_linear@5": 0.5846080932069478,
182
+ "ndcg_linear@10": 0.6143872769865809,
183
+ "ndcg_exponential@1": 0.47,
184
+ "ndcg_exponential@5": 0.5846080932069478,
185
+ "ndcg_exponential@10": 0.6143872769865809,
186
+ "precision@1": 0.47,
187
+ "precision@5": 0.13659999999999997,
188
+ "precision@10": 0.07759999999999999,
189
+ "recall@1": 0.47,
190
+ "recall@5": 0.683,
191
+ "recall@10": 0.776,
192
+ "f1@1": 0.47,
193
+ "f1@5": 0.2276666666666667,
194
+ "f1@10": 0.1410909090909091,
195
+ "map@1": 0.47,
196
+ "map@5": 0.5517333333333333,
197
+ "map@10": 0.5638619047619047,
198
+ "mrr@1": 0.47,
199
+ "mrr@5": 0.5517333333333333,
200
+ "mrr@10": 0.5638619047619047,
201
+ "num_pred": 1000,
202
+ "num_data": 1000
203
+ },
204
+ "ImageNet-R": {
205
+ "hit@1": 0.885,
206
+ "hit@5": 0.968,
207
+ "hit@10": 0.981,
208
+ "ndcg_linear@1": 0.885,
209
+ "ndcg_linear@5": 0.9317946929268162,
210
+ "ndcg_linear@10": 0.9361395162551376,
211
+ "ndcg_exponential@1": 0.885,
212
+ "ndcg_exponential@5": 0.9317946929268162,
213
+ "ndcg_exponential@10": 0.9361395162551376,
214
+ "precision@1": 0.885,
215
+ "precision@5": 0.19360000000000002,
216
+ "precision@10": 0.09810000000000002,
217
+ "recall@1": 0.885,
218
+ "recall@5": 0.968,
219
+ "recall@10": 0.981,
220
+ "f1@1": 0.885,
221
+ "f1@5": 0.3226666666666666,
222
+ "f1@10": 0.17836363636363634,
223
+ "map@1": 0.885,
224
+ "map@5": 0.9195166666666666,
225
+ "map@10": 0.9213904761904762,
226
+ "mrr@1": 0.885,
227
+ "mrr@5": 0.9195166666666666,
228
+ "mrr@10": 0.9213904761904762,
229
+ "num_pred": 1000,
230
+ "num_data": 1000
231
+ },
232
+ "ObjectNet": {
233
+ "hit@1": 0.664,
234
+ "hit@5": 0.857,
235
+ "hit@10": 0.904,
236
+ "ndcg_linear@1": 0.664,
237
+ "ndcg_linear@5": 0.770759337476306,
238
+ "ndcg_linear@10": 0.7861961843019063,
239
+ "ndcg_exponential@1": 0.664,
240
+ "ndcg_exponential@5": 0.770759337476306,
241
+ "ndcg_exponential@10": 0.7861961843019063,
242
+ "precision@1": 0.664,
243
+ "precision@5": 0.17140000000000002,
244
+ "precision@10": 0.09040000000000001,
245
+ "recall@1": 0.664,
246
+ "recall@5": 0.857,
247
+ "recall@10": 0.904,
248
+ "f1@1": 0.664,
249
+ "f1@5": 0.28566666666666674,
250
+ "f1@10": 0.16436363636363635,
251
+ "map@1": 0.664,
252
+ "map@5": 0.7417666666666667,
253
+ "map@10": 0.7482793650793651,
254
+ "mrr@1": 0.664,
255
+ "mrr@5": 0.7417666666666667,
256
+ "mrr@10": 0.7482793650793651,
257
+ "num_pred": 1000,
258
+ "num_data": 1000
259
+ },
260
+ "Country211": {
261
+ "hit@1": 0.283,
262
+ "hit@5": 0.535,
263
+ "hit@10": 0.628,
264
+ "ndcg_linear@1": 0.283,
265
+ "ndcg_linear@5": 0.4166269842150015,
266
+ "ndcg_linear@10": 0.44677345697388055,
267
+ "ndcg_exponential@1": 0.283,
268
+ "ndcg_exponential@5": 0.4166269842150015,
269
+ "ndcg_exponential@10": 0.44677345697388055,
270
+ "precision@1": 0.283,
271
+ "precision@5": 0.107,
272
+ "precision@10": 0.0628,
273
+ "recall@1": 0.283,
274
+ "recall@5": 0.535,
275
+ "recall@10": 0.628,
276
+ "f1@1": 0.283,
277
+ "f1@5": 0.17833333333333337,
278
+ "f1@10": 0.11418181818181819,
279
+ "map@1": 0.283,
280
+ "map@5": 0.37723333333333336,
281
+ "map@10": 0.3897083333333334,
282
+ "mrr@1": 0.283,
283
+ "mrr@5": 0.37723333333333336,
284
+ "mrr@10": 0.3897083333333334,
285
+ "num_pred": 1000,
286
+ "num_data": 1000
287
+ },
288
+ "OK-VQA": {
289
+ "hit@1": 0.378,
290
+ "hit@5": 0.65,
291
+ "hit@10": 0.748,
292
+ "ndcg_linear@1": 0.378,
293
+ "ndcg_linear@5": 0.523495748191076,
294
+ "ndcg_linear@10": 0.5551119641095289,
295
+ "ndcg_exponential@1": 0.378,
296
+ "ndcg_exponential@5": 0.523495748191076,
297
+ "ndcg_exponential@10": 0.5551119641095289,
298
+ "precision@1": 0.378,
299
+ "precision@5": 0.13,
300
+ "precision@10": 0.07479999999999999,
301
+ "recall@1": 0.378,
302
+ "recall@5": 0.65,
303
+ "recall@10": 0.748,
304
+ "f1@1": 0.378,
305
+ "f1@5": 0.2166666666666667,
306
+ "f1@10": 0.136,
307
+ "map@1": 0.378,
308
+ "map@5": 0.4814,
309
+ "map@10": 0.49440396825396826,
310
+ "mrr@1": 0.378,
311
+ "mrr@5": 0.4814,
312
+ "mrr@10": 0.49440396825396826,
313
+ "num_pred": 1000,
314
+ "num_data": 1000
315
+ },
316
+ "A-OKVQA": {
317
+ "hit@1": 0.27,
318
+ "hit@5": 0.566,
319
+ "hit@10": 0.693,
320
+ "ndcg_linear@1": 0.27,
321
+ "ndcg_linear@5": 0.425833923116744,
322
+ "ndcg_linear@10": 0.46711405957319874,
323
+ "ndcg_exponential@1": 0.27,
324
+ "ndcg_exponential@5": 0.425833923116744,
325
+ "ndcg_exponential@10": 0.46711405957319874,
326
+ "precision@1": 0.27,
327
+ "precision@5": 0.1132,
328
+ "precision@10": 0.0693,
329
+ "recall@1": 0.27,
330
+ "recall@5": 0.566,
331
+ "recall@10": 0.693,
332
+ "f1@1": 0.27,
333
+ "f1@5": 0.1886666666666667,
334
+ "f1@10": 0.126,
335
+ "map@1": 0.27,
336
+ "map@5": 0.3793666666666667,
337
+ "map@10": 0.39652301587301586,
338
+ "mrr@1": 0.27,
339
+ "mrr@5": 0.3793666666666667,
340
+ "mrr@10": 0.39652301587301586,
341
+ "num_pred": 1000,
342
+ "num_data": 1000
343
+ },
344
+ "DocVQA": {
345
+ "hit@1": 0.223,
346
+ "hit@5": 0.382,
347
+ "hit@10": 0.448,
348
+ "ndcg_linear@1": 0.223,
349
+ "ndcg_linear@5": 0.3079314538526157,
350
+ "ndcg_linear@10": 0.32933154522617863,
351
+ "ndcg_exponential@1": 0.223,
352
+ "ndcg_exponential@5": 0.3079314538526157,
353
+ "ndcg_exponential@10": 0.32933154522617863,
354
+ "precision@1": 0.223,
355
+ "precision@5": 0.0764,
356
+ "precision@10": 0.0448,
357
+ "recall@1": 0.223,
358
+ "recall@5": 0.382,
359
+ "recall@10": 0.448,
360
+ "f1@1": 0.223,
361
+ "f1@5": 0.12733333333333338,
362
+ "f1@10": 0.08145454545454547,
363
+ "map@1": 0.223,
364
+ "map@5": 0.28323333333333334,
365
+ "map@10": 0.2921019841269841,
366
+ "mrr@1": 0.223,
367
+ "mrr@5": 0.28323333333333334,
368
+ "mrr@10": 0.2921019841269841,
369
+ "num_pred": 1000,
370
+ "num_data": 1000
371
+ },
372
+ "InfographicsVQA": {
373
+ "hit@1": 0.165,
374
+ "hit@5": 0.304,
375
+ "hit@10": 0.351,
376
+ "ndcg_linear@1": 0.165,
377
+ "ndcg_linear@5": 0.24083608989579428,
378
+ "ndcg_linear@10": 0.25582539133402193,
379
+ "ndcg_exponential@1": 0.165,
380
+ "ndcg_exponential@5": 0.24083608989579428,
381
+ "ndcg_exponential@10": 0.25582539133402193,
382
+ "precision@1": 0.165,
383
+ "precision@5": 0.0608,
384
+ "precision@10": 0.03509999999999999,
385
+ "recall@1": 0.165,
386
+ "recall@5": 0.304,
387
+ "recall@10": 0.351,
388
+ "f1@1": 0.165,
389
+ "f1@5": 0.10133333333333334,
390
+ "f1@10": 0.06381818181818183,
391
+ "map@1": 0.165,
392
+ "map@5": 0.21964999999999998,
393
+ "map@10": 0.22571349206349206,
394
+ "mrr@1": 0.165,
395
+ "mrr@5": 0.21964999999999998,
396
+ "mrr@10": 0.22571349206349206,
397
+ "num_pred": 1000,
398
+ "num_data": 1000
399
+ },
400
+ "ChartQA": {
401
+ "hit@1": 0.117,
402
+ "hit@5": 0.162,
403
+ "hit@10": 0.18,
404
+ "ndcg_linear@1": 0.117,
405
+ "ndcg_linear@5": 0.14132891302231343,
406
+ "ndcg_linear@10": 0.14726088628648307,
407
+ "ndcg_exponential@1": 0.117,
408
+ "ndcg_exponential@5": 0.14132891302231343,
409
+ "ndcg_exponential@10": 0.14726088628648307,
410
+ "precision@1": 0.117,
411
+ "precision@5": 0.032400000000000005,
412
+ "precision@10": 0.018,
413
+ "recall@1": 0.117,
414
+ "recall@5": 0.162,
415
+ "recall@10": 0.18,
416
+ "f1@1": 0.117,
417
+ "f1@5": 0.054,
418
+ "f1@10": 0.03272727272727273,
419
+ "map@1": 0.117,
420
+ "map@5": 0.13443333333333335,
421
+ "map@10": 0.13694960317460317,
422
+ "mrr@1": 0.117,
423
+ "mrr@5": 0.13443333333333335,
424
+ "mrr@10": 0.13694960317460317,
425
+ "num_pred": 1000,
426
+ "num_data": 1000
427
+ },
428
+ "Visual7W": {
429
+ "hit@1": 0.196,
430
+ "hit@5": 0.434,
431
+ "hit@10": 0.541,
432
+ "ndcg_linear@1": 0.196,
433
+ "ndcg_linear@5": 0.32114419847722886,
434
+ "ndcg_linear@10": 0.35574139683294936,
435
+ "ndcg_exponential@1": 0.196,
436
+ "ndcg_exponential@5": 0.32114419847722886,
437
+ "ndcg_exponential@10": 0.35574139683294936,
438
+ "precision@1": 0.196,
439
+ "precision@5": 0.0868,
440
+ "precision@10": 0.054099999999999995,
441
+ "recall@1": 0.196,
442
+ "recall@5": 0.434,
443
+ "recall@10": 0.541,
444
+ "f1@1": 0.196,
445
+ "f1@5": 0.1446666666666667,
446
+ "f1@10": 0.09836363636363639,
447
+ "map@1": 0.196,
448
+ "map@5": 0.28375,
449
+ "map@10": 0.29802619047619044,
450
+ "mrr@1": 0.196,
451
+ "mrr@5": 0.28375,
452
+ "mrr@10": 0.29802619047619044,
453
+ "num_pred": 1000,
454
+ "num_data": 1000
455
+ },
456
+ "ScienceQA": {
457
+ "hit@1": 0.263,
458
+ "hit@5": 0.57,
459
+ "hit@10": 0.683,
460
+ "ndcg_linear@1": 0.263,
461
+ "ndcg_linear@5": 0.4232608546664754,
462
+ "ndcg_linear@10": 0.46061584821555157,
463
+ "ndcg_exponential@1": 0.263,
464
+ "ndcg_exponential@5": 0.4232608546664754,
465
+ "ndcg_exponential@10": 0.46061584821555157,
466
+ "precision@1": 0.263,
467
+ "precision@5": 0.114,
468
+ "precision@10": 0.0683,
469
+ "recall@1": 0.263,
470
+ "recall@5": 0.57,
471
+ "recall@10": 0.683,
472
+ "f1@1": 0.263,
473
+ "f1@5": 0.19000000000000003,
474
+ "f1@10": 0.12418181818181821,
475
+ "map@1": 0.263,
476
+ "map@5": 0.37475,
477
+ "map@10": 0.39065079365079364,
478
+ "mrr@1": 0.263,
479
+ "mrr@5": 0.37475,
480
+ "mrr@10": 0.39065079365079364,
481
+ "num_pred": 1000,
482
+ "num_data": 1000
483
+ },
484
+ "VizWiz": {
485
+ "hit@1": 0.32,
486
+ "hit@5": 0.526,
487
+ "hit@10": 0.582,
488
+ "ndcg_linear@1": 0.32,
489
+ "ndcg_linear@5": 0.42951324327429996,
490
+ "ndcg_linear@10": 0.44772604037996566,
491
+ "ndcg_exponential@1": 0.32,
492
+ "ndcg_exponential@5": 0.42951324327429996,
493
+ "ndcg_exponential@10": 0.44772604037996566,
494
+ "precision@1": 0.32,
495
+ "precision@5": 0.10519999999999999,
496
+ "precision@10": 0.0582,
497
+ "recall@1": 0.32,
498
+ "recall@5": 0.526,
499
+ "recall@10": 0.582,
500
+ "f1@1": 0.32,
501
+ "f1@5": 0.17533333333333337,
502
+ "f1@10": 0.10581818181818184,
503
+ "map@1": 0.32,
504
+ "map@5": 0.39741666666666664,
505
+ "map@10": 0.4049861111111111,
506
+ "mrr@1": 0.32,
507
+ "mrr@5": 0.39741666666666664,
508
+ "mrr@10": 0.4049861111111111,
509
+ "num_pred": 1000,
510
+ "num_data": 1000
511
+ },
512
+ "GQA": {
513
+ "hit@1": 0.385,
514
+ "hit@5": 0.709,
515
+ "hit@10": 0.832,
516
+ "ndcg_linear@1": 0.385,
517
+ "ndcg_linear@5": 0.5587878569139205,
518
+ "ndcg_linear@10": 0.5988209254862948,
519
+ "ndcg_exponential@1": 0.385,
520
+ "ndcg_exponential@5": 0.5587878569139205,
521
+ "ndcg_exponential@10": 0.5988209254862948,
522
+ "precision@1": 0.385,
523
+ "precision@5": 0.14179999999999998,
524
+ "precision@10": 0.08320000000000002,
525
+ "recall@1": 0.385,
526
+ "recall@5": 0.709,
527
+ "recall@10": 0.832,
528
+ "f1@1": 0.385,
529
+ "f1@5": 0.23633333333333337,
530
+ "f1@10": 0.15127272727272728,
531
+ "map@1": 0.385,
532
+ "map@5": 0.5087166666666667,
533
+ "map@10": 0.5253928571428572,
534
+ "mrr@1": 0.385,
535
+ "mrr@5": 0.5087166666666667,
536
+ "mrr@10": 0.5253928571428572,
537
+ "num_pred": 1000,
538
+ "num_data": 1000
539
+ },
540
+ "TextVQA": {
541
+ "hit@1": 0.33,
542
+ "hit@5": 0.501,
543
+ "hit@10": 0.572,
544
+ "ndcg_linear@1": 0.33,
545
+ "ndcg_linear@5": 0.42213712812714405,
546
+ "ndcg_linear@10": 0.44510553711635736,
547
+ "ndcg_exponential@1": 0.33,
548
+ "ndcg_exponential@5": 0.42213712812714405,
549
+ "ndcg_exponential@10": 0.44510553711635736,
550
+ "precision@1": 0.33,
551
+ "precision@5": 0.10019999999999998,
552
+ "precision@10": 0.057199999999999994,
553
+ "recall@1": 0.33,
554
+ "recall@5": 0.501,
555
+ "recall@10": 0.572,
556
+ "f1@1": 0.33,
557
+ "f1@5": 0.16700000000000007,
558
+ "f1@10": 0.10400000000000001,
559
+ "map@1": 0.33,
560
+ "map@5": 0.39581666666666665,
561
+ "map@10": 0.40530873015873015,
562
+ "mrr@1": 0.33,
563
+ "mrr@5": 0.39581666666666665,
564
+ "mrr@10": 0.40530873015873015,
565
+ "num_pred": 1000,
566
+ "num_data": 1000
567
+ },
568
+ "VisDial": {
569
+ "hit@1": 0.613,
570
+ "hit@5": 0.861,
571
+ "hit@10": 0.923,
572
+ "ndcg_linear@1": 0.613,
573
+ "ndcg_linear@5": 0.7480330953397659,
574
+ "ndcg_linear@10": 0.7684474643796165,
575
+ "ndcg_exponential@1": 0.613,
576
+ "ndcg_exponential@5": 0.7480330953397659,
577
+ "ndcg_exponential@10": 0.7684474643796165,
578
+ "precision@1": 0.613,
579
+ "precision@5": 0.17220000000000002,
580
+ "precision@10": 0.09230000000000001,
581
+ "recall@1": 0.613,
582
+ "recall@5": 0.861,
583
+ "recall@10": 0.923,
584
+ "f1@1": 0.613,
585
+ "f1@5": 0.28700000000000003,
586
+ "f1@10": 0.1678181818181818,
587
+ "map@1": 0.613,
588
+ "map@5": 0.7101999999999999,
589
+ "map@10": 0.7188412698412698,
590
+ "mrr@1": 0.613,
591
+ "mrr@5": 0.7101999999999999,
592
+ "mrr@10": 0.7188412698412698,
593
+ "num_pred": 1000,
594
+ "num_data": 1000
595
+ },
596
+ "CIRR": {
597
+ "hit@1": 0.517,
598
+ "hit@5": 0.863,
599
+ "hit@10": 0.931,
600
+ "ndcg_linear@1": 0.517,
601
+ "ndcg_linear@5": 0.7053164568585676,
602
+ "ndcg_linear@10": 0.7275391721374201,
603
+ "ndcg_exponential@1": 0.517,
604
+ "ndcg_exponential@5": 0.7053164568585676,
605
+ "ndcg_exponential@10": 0.7275391721374201,
606
+ "precision@1": 0.517,
607
+ "precision@5": 0.17260000000000003,
608
+ "precision@10": 0.0931,
609
+ "recall@1": 0.517,
610
+ "recall@5": 0.863,
611
+ "recall@10": 0.931,
612
+ "f1@1": 0.517,
613
+ "f1@5": 0.28766666666666674,
614
+ "f1@10": 0.16927272727272724,
615
+ "map@1": 0.517,
616
+ "map@5": 0.6524333333333334,
617
+ "map@10": 0.6617317460317461,
618
+ "mrr@1": 0.517,
619
+ "mrr@5": 0.6524333333333334,
620
+ "mrr@10": 0.6617317460317461,
621
+ "num_pred": 1000,
622
+ "num_data": 1000
623
+ },
624
+ "VisualNews_t2i": {
625
+ "hit@1": 0.704,
626
+ "hit@5": 0.875,
627
+ "hit@10": 0.91,
628
+ "ndcg_linear@1": 0.704,
629
+ "ndcg_linear@5": 0.7989749726833766,
630
+ "ndcg_linear@10": 0.8104235859208543,
631
+ "ndcg_exponential@1": 0.704,
632
+ "ndcg_exponential@5": 0.7989749726833766,
633
+ "ndcg_exponential@10": 0.8104235859208543,
634
+ "precision@1": 0.704,
635
+ "precision@5": 0.17500000000000002,
636
+ "precision@10": 0.09100000000000001,
637
+ "recall@1": 0.704,
638
+ "recall@5": 0.875,
639
+ "recall@10": 0.91,
640
+ "f1@1": 0.704,
641
+ "f1@5": 0.29166666666666663,
642
+ "f1@10": 0.16545454545454544,
643
+ "map@1": 0.704,
644
+ "map@5": 0.7733166666666667,
645
+ "map@10": 0.7781194444444445,
646
+ "mrr@1": 0.704,
647
+ "mrr@5": 0.7733166666666667,
648
+ "mrr@10": 0.7781194444444445,
649
+ "num_pred": 1000,
650
+ "num_data": 1000
651
+ },
652
+ "VisualNews_i2t": {
653
+ "hit@1": 0.839,
654
+ "hit@5": 0.938,
655
+ "hit@10": 0.953,
656
+ "ndcg_linear@1": 0.839,
657
+ "ndcg_linear@5": 0.8947751558137038,
658
+ "ndcg_linear@10": 0.8997533519597807,
659
+ "ndcg_exponential@1": 0.839,
660
+ "ndcg_exponential@5": 0.8947751558137038,
661
+ "ndcg_exponential@10": 0.8997533519597807,
662
+ "precision@1": 0.839,
663
+ "precision@5": 0.18760000000000002,
664
+ "precision@10": 0.09530000000000001,
665
+ "recall@1": 0.839,
666
+ "recall@5": 0.938,
667
+ "recall@10": 0.953,
668
+ "f1@1": 0.839,
669
+ "f1@5": 0.3126666666666667,
670
+ "f1@10": 0.17327272727272724,
671
+ "map@1": 0.839,
672
+ "map@5": 0.8801333333333333,
673
+ "map@10": 0.8822630952380953,
674
+ "mrr@1": 0.839,
675
+ "mrr@5": 0.8801333333333333,
676
+ "mrr@10": 0.8822630952380953,
677
+ "num_pred": 1000,
678
+ "num_data": 1000
679
+ },
680
+ "MSCOCO_t2i": {
681
+ "hit@1": 0.722,
682
+ "hit@5": 0.935,
683
+ "hit@10": 0.965,
684
+ "ndcg_linear@1": 0.722,
685
+ "ndcg_linear@5": 0.8400063048969685,
686
+ "ndcg_linear@10": 0.8496978391851898,
687
+ "ndcg_exponential@1": 0.722,
688
+ "ndcg_exponential@5": 0.8400063048969685,
689
+ "ndcg_exponential@10": 0.8496978391851898,
690
+ "precision@1": 0.722,
691
+ "precision@5": 0.187,
692
+ "precision@10": 0.09650000000000002,
693
+ "recall@1": 0.722,
694
+ "recall@5": 0.935,
695
+ "recall@10": 0.965,
696
+ "f1@1": 0.722,
697
+ "f1@5": 0.31166666666666665,
698
+ "f1@10": 0.17545454545454545,
699
+ "map@1": 0.722,
700
+ "map@5": 0.8079333333333333,
701
+ "map@10": 0.8119218253968254,
702
+ "mrr@1": 0.722,
703
+ "mrr@5": 0.8079333333333333,
704
+ "mrr@10": 0.8119218253968254,
705
+ "num_pred": 1000,
706
+ "num_data": 1000
707
+ },
708
+ "MSCOCO_i2t": {
709
+ "hit@1": 0.737,
710
+ "hit@5": 0.957,
711
+ "hit@10": 0.982,
712
+ "ndcg_linear@1": 0.737,
713
+ "ndcg_linear@5": 0.8594668192272695,
714
+ "ndcg_linear@10": 0.8676497166665621,
715
+ "ndcg_exponential@1": 0.737,
716
+ "ndcg_exponential@5": 0.8594668192272695,
717
+ "ndcg_exponential@10": 0.8676497166665621,
718
+ "precision@1": 0.737,
719
+ "precision@5": 0.19140000000000004,
720
+ "precision@10": 0.09820000000000002,
721
+ "recall@1": 0.737,
722
+ "recall@5": 0.957,
723
+ "recall@10": 0.982,
724
+ "f1@1": 0.737,
725
+ "f1@5": 0.319,
726
+ "f1@10": 0.17854545454545453,
727
+ "map@1": 0.737,
728
+ "map@5": 0.8265833333333333,
729
+ "map@10": 0.8300186507936508,
730
+ "mrr@1": 0.737,
731
+ "mrr@5": 0.8265833333333333,
732
+ "mrr@10": 0.8300186507936508,
733
+ "num_pred": 1000,
734
+ "num_data": 1000
735
+ },
736
+ "NIGHTS": {
737
+ "hit@1": 0.656,
738
+ "hit@5": 0.974,
739
+ "hit@10": 0.993,
740
+ "ndcg_linear@1": 0.656,
741
+ "ndcg_linear@5": 0.8392219252539634,
742
+ "ndcg_linear@10": 0.8454923298699608,
743
+ "ndcg_exponential@1": 0.656,
744
+ "ndcg_exponential@5": 0.8392219252539634,
745
+ "ndcg_exponential@10": 0.8454923298699608,
746
+ "precision@1": 0.656,
747
+ "precision@5": 0.1948,
748
+ "precision@10": 0.09930000000000001,
749
+ "recall@1": 0.656,
750
+ "recall@5": 0.974,
751
+ "recall@10": 0.993,
752
+ "f1@1": 0.656,
753
+ "f1@5": 0.3246666666666666,
754
+ "f1@10": 0.1805454545454545,
755
+ "map@1": 0.656,
756
+ "map@5": 0.7931000000000001,
757
+ "map@10": 0.7957623015873017,
758
+ "mrr@1": 0.656,
759
+ "mrr@5": 0.7931000000000001,
760
+ "mrr@10": 0.7957623015873017,
761
+ "num_pred": 1000,
762
+ "num_data": 1000
763
+ },
764
+ "WebQA": {
765
+ "hit@1": 0.81,
766
+ "hit@5": 0.971,
767
+ "hit@10": 0.986,
768
+ "ndcg_linear@1": 0.81,
769
+ "ndcg_linear@5": 0.9037144327529909,
770
+ "ndcg_linear@10": 0.9087487966017537,
771
+ "ndcg_exponential@1": 0.81,
772
+ "ndcg_exponential@5": 0.9037144327529909,
773
+ "ndcg_exponential@10": 0.9087487966017537,
774
+ "precision@1": 0.81,
775
+ "precision@5": 0.1942,
776
+ "precision@10": 0.09860000000000002,
777
+ "recall@1": 0.81,
778
+ "recall@5": 0.971,
779
+ "recall@10": 0.986,
780
+ "f1@1": 0.81,
781
+ "f1@5": 0.3236666666666666,
782
+ "f1@10": 0.17927272727272725,
783
+ "map@1": 0.81,
784
+ "map@5": 0.8806333333333335,
785
+ "map@10": 0.8828166666666666,
786
+ "mrr@1": 0.81,
787
+ "mrr@5": 0.8806333333333335,
788
+ "mrr@10": 0.8828166666666666,
789
+ "num_pred": 1000,
790
+ "num_data": 1000
791
+ },
792
+ "FashionIQ": {
793
+ "hit@1": 0.42,
794
+ "hit@5": 0.689,
795
+ "hit@10": 0.794,
796
+ "ndcg_linear@1": 0.42,
797
+ "ndcg_linear@5": 0.5636864513304993,
798
+ "ndcg_linear@10": 0.598000278473528,
799
+ "ndcg_exponential@1": 0.42,
800
+ "ndcg_exponential@5": 0.5636864513304993,
801
+ "ndcg_exponential@10": 0.598000278473528,
802
+ "precision@1": 0.42,
803
+ "precision@5": 0.13779999999999998,
804
+ "precision@10": 0.07940000000000001,
805
+ "recall@1": 0.42,
806
+ "recall@5": 0.689,
807
+ "recall@10": 0.794,
808
+ "f1@1": 0.42,
809
+ "f1@5": 0.2296666666666667,
810
+ "f1@10": 0.14436363636363636,
811
+ "map@1": 0.42,
812
+ "map@5": 0.5219166666666666,
813
+ "map@10": 0.5362988095238095,
814
+ "mrr@1": 0.42,
815
+ "mrr@5": 0.5219166666666666,
816
+ "mrr@10": 0.5362988095238095,
817
+ "num_pred": 1000,
818
+ "num_data": 1000
819
+ },
820
+ "Wiki-SS-NQ": {
821
+ "hit@1": 0.697,
822
+ "hit@5": 0.884,
823
+ "hit@10": 0.921,
824
+ "ndcg_linear@1": 0.697,
825
+ "ndcg_linear@5": 0.801194685185507,
826
+ "ndcg_linear@10": 0.8131568214002816,
827
+ "ndcg_exponential@1": 0.697,
828
+ "ndcg_exponential@5": 0.801194685185507,
829
+ "ndcg_exponential@10": 0.8131568214002816,
830
+ "precision@1": 0.697,
831
+ "precision@5": 0.1768,
832
+ "precision@10": 0.09210000000000003,
833
+ "recall@1": 0.697,
834
+ "recall@5": 0.884,
835
+ "recall@10": 0.921,
836
+ "f1@1": 0.697,
837
+ "f1@5": 0.2946666666666667,
838
+ "f1@10": 0.16745454545454544,
839
+ "map@1": 0.697,
840
+ "map@5": 0.77325,
841
+ "map@10": 0.7781892857142857,
842
+ "mrr@1": 0.697,
843
+ "mrr@5": 0.77325,
844
+ "mrr@10": 0.7781892857142857,
845
+ "num_pred": 1000,
846
+ "num_data": 1000
847
+ },
848
+ "OVEN": {
849
+ "hit@1": 0.82,
850
+ "hit@5": 0.974,
851
+ "hit@10": 0.991,
852
+ "ndcg_linear@1": 0.82,
853
+ "ndcg_linear@5": 0.9071538558399693,
854
+ "ndcg_linear@10": 0.912778314510714,
855
+ "ndcg_exponential@1": 0.82,
856
+ "ndcg_exponential@5": 0.9071538558399693,
857
+ "ndcg_exponential@10": 0.912778314510714,
858
+ "precision@1": 0.82,
859
+ "precision@5": 0.19480000000000003,
860
+ "precision@10": 0.09910000000000001,
861
+ "recall@1": 0.82,
862
+ "recall@5": 0.974,
863
+ "recall@10": 0.991,
864
+ "f1@1": 0.82,
865
+ "f1@5": 0.3246666666666666,
866
+ "f1@10": 0.18018181818181817,
867
+ "map@1": 0.82,
868
+ "map@5": 0.88445,
869
+ "map@10": 0.8868444444444444,
870
+ "mrr@1": 0.82,
871
+ "mrr@5": 0.88445,
872
+ "mrr@10": 0.8868444444444444,
873
+ "num_pred": 1000,
874
+ "num_data": 1000
875
+ },
876
+ "EDIS": {
877
+ "hit@1": 0.859,
878
+ "hit@5": 0.987,
879
+ "hit@10": 0.997,
880
+ "ndcg_linear@1": 0.859,
881
+ "ndcg_linear@5": 0.9331780902287048,
882
+ "ndcg_linear@10": 0.9365900559178164,
883
+ "ndcg_exponential@1": 0.859,
884
+ "ndcg_exponential@5": 0.9331780902287048,
885
+ "ndcg_exponential@10": 0.9365900559178164,
886
+ "precision@1": 0.859,
887
+ "precision@5": 0.19740000000000005,
888
+ "precision@10": 0.09970000000000001,
889
+ "recall@1": 0.859,
890
+ "recall@5": 0.987,
891
+ "recall@10": 0.997,
892
+ "f1@1": 0.859,
893
+ "f1@5": 0.329,
894
+ "f1@10": 0.18127272727272725,
895
+ "map@1": 0.859,
896
+ "map@5": 0.91475,
897
+ "map@10": 0.9162619047619048,
898
+ "mrr@1": 0.859,
899
+ "mrr@5": 0.91475,
900
+ "mrr@10": 0.9162619047619048,
901
+ "num_pred": 1000,
902
+ "num_data": 1000
903
+ },
904
+ "MSCOCO": {
905
+ "hit@1": 0.448,
906
+ "hit@5": 0.625,
907
+ "hit@10": 0.685,
908
+ "ndcg_linear@1": 0.448,
909
+ "ndcg_linear@5": 0.5408899777268813,
910
+ "ndcg_linear@10": 0.5602258062625833,
911
+ "ndcg_exponential@1": 0.448,
912
+ "ndcg_exponential@5": 0.5408899777268813,
913
+ "ndcg_exponential@10": 0.5602258062625833,
914
+ "precision@1": 0.448,
915
+ "precision@5": 0.12499999999999999,
916
+ "precision@10": 0.0685,
917
+ "recall@1": 0.448,
918
+ "recall@5": 0.625,
919
+ "recall@10": 0.685,
920
+ "f1@1": 0.448,
921
+ "f1@5": 0.20833333333333337,
922
+ "f1@10": 0.12454545454545456,
923
+ "map@1": 0.448,
924
+ "map@5": 0.5130333333333333,
925
+ "map@10": 0.5209734126984127,
926
+ "mrr@1": 0.448,
927
+ "mrr@5": 0.5130333333333333,
928
+ "mrr@10": 0.5209734126984127,
929
+ "num_pred": 1000,
930
+ "num_data": 1000
931
+ },
932
+ "RefCOCO": {
933
+ "hit@1": 0.628,
934
+ "hit@5": 0.848,
935
+ "hit@10": 0.897,
936
+ "ndcg_linear@1": 0.628,
937
+ "ndcg_linear@5": 0.7457621998007221,
938
+ "ndcg_linear@10": 0.7619311912107107,
939
+ "ndcg_exponential@1": 0.628,
940
+ "ndcg_exponential@5": 0.7457621998007221,
941
+ "ndcg_exponential@10": 0.7619311912107107,
942
+ "precision@1": 0.628,
943
+ "precision@5": 0.16960000000000003,
944
+ "precision@10": 0.0897,
945
+ "recall@1": 0.628,
946
+ "recall@5": 0.848,
947
+ "recall@10": 0.897,
948
+ "f1@1": 0.628,
949
+ "f1@5": 0.28266666666666673,
950
+ "f1@10": 0.1630909090909091,
951
+ "map@1": 0.628,
952
+ "map@5": 0.7117333333333333,
953
+ "map@10": 0.7185992063492063,
954
+ "mrr@1": 0.628,
955
+ "mrr@5": 0.7117333333333333,
956
+ "mrr@10": 0.7185992063492063,
957
+ "num_pred": 1000,
958
+ "num_data": 1000
959
+ },
960
+ "RefCOCO-Matching": {
961
+ "hit@1": 0.757,
962
+ "hit@5": 0.999,
963
+ "hit@10": 0.999,
964
+ "ndcg_linear@1": 0.757,
965
+ "ndcg_linear@5": 0.9102862746500986,
966
+ "ndcg_linear@10": 0.9102862746500986,
967
+ "ndcg_exponential@1": 0.757,
968
+ "ndcg_exponential@5": 0.9102862746500986,
969
+ "ndcg_exponential@10": 0.9102862746500986,
970
+ "precision@1": 0.757,
971
+ "precision@5": 0.19980000000000003,
972
+ "precision@10": 0.09990000000000002,
973
+ "recall@1": 0.757,
974
+ "recall@5": 0.999,
975
+ "recall@10": 0.999,
976
+ "f1@1": 0.757,
977
+ "f1@5": 0.333,
978
+ "f1@10": 0.18163636363636362,
979
+ "map@1": 0.757,
980
+ "map@5": 0.8793666666666666,
981
+ "map@10": 0.8793666666666666,
982
+ "mrr@1": 0.757,
983
+ "mrr@5": 0.8763666666666666,
984
+ "mrr@10": 0.8763666666666666,
985
+ "num_pred": 1000,
986
+ "num_data": 1000
987
+ },
988
+ "Visual7W-Pointing": {
989
+ "hit@1": 0.673,
990
+ "hit@5": 0.863,
991
+ "hit@10": 0.919,
992
+ "ndcg_linear@1": 0.673,
993
+ "ndcg_linear@5": 0.7774031702105983,
994
+ "ndcg_linear@10": 0.7954662572023203,
995
+ "ndcg_exponential@1": 0.673,
996
+ "ndcg_exponential@5": 0.7774031702105983,
997
+ "ndcg_exponential@10": 0.7954662572023203,
998
+ "precision@1": 0.673,
999
+ "precision@5": 0.17260000000000003,
1000
+ "precision@10": 0.09190000000000001,
1001
+ "recall@1": 0.673,
1002
+ "recall@5": 0.863,
1003
+ "recall@10": 0.919,
1004
+ "f1@1": 0.673,
1005
+ "f1@5": 0.2876666666666667,
1006
+ "f1@10": 0.16709090909090907,
1007
+ "map@1": 0.673,
1008
+ "map@5": 0.7486166666666667,
1009
+ "map@10": 0.756040873015873,
1010
+ "mrr@1": 0.673,
1011
+ "mrr@5": 0.7486166666666667,
1012
+ "mrr@10": 0.756040873015873,
1013
+ "num_pred": 1000,
1014
+ "num_data": 1000
1015
+ }
1016
+ },
1017
+ "video": {
1018
+ "K700": {
1019
+ "hit@1": 0.423,
1020
+ "hit@5": 0.653,
1021
+ "hit@10": 0.731,
1022
+ "ndcg_linear@1": 0.423,
1023
+ "ndcg_linear@5": 0.546371218016443,
1024
+ "ndcg_linear@10": 0.5718997969605862,
1025
+ "ndcg_exponential@1": 0.423,
1026
+ "ndcg_exponential@5": 0.546371218016443,
1027
+ "ndcg_exponential@10": 0.5718997969605862,
1028
+ "precision@1": 0.423,
1029
+ "precision@5": 0.13059999999999997,
1030
+ "precision@10": 0.0731,
1031
+ "recall@1": 0.423,
1032
+ "recall@5": 0.653,
1033
+ "recall@10": 0.731,
1034
+ "f1@1": 0.423,
1035
+ "f1@5": 0.21766666666666673,
1036
+ "f1@10": 0.13290909090909092,
1037
+ "map@1": 0.423,
1038
+ "map@5": 0.5107999999999999,
1039
+ "map@10": 0.5215190476190475,
1040
+ "mrr@1": 0.423,
1041
+ "mrr@5": 0.5107999999999999,
1042
+ "mrr@10": 0.5215190476190475,
1043
+ "num_pred": 1000,
1044
+ "num_data": 1000
1045
+ },
1046
+ "SmthSmthV2": {
1047
+ "hit@1": 0.363,
1048
+ "hit@5": 0.602,
1049
+ "hit@10": 0.698,
1050
+ "ndcg_linear@1": 0.363,
1051
+ "ndcg_linear@5": 0.4890606806277336,
1052
+ "ndcg_linear@10": 0.5200630033328641,
1053
+ "ndcg_exponential@1": 0.363,
1054
+ "ndcg_exponential@5": 0.4890606806277336,
1055
+ "ndcg_exponential@10": 0.5200630033328641,
1056
+ "precision@1": 0.363,
1057
+ "precision@5": 0.1204,
1058
+ "precision@10": 0.06979999999999999,
1059
+ "recall@1": 0.363,
1060
+ "recall@5": 0.602,
1061
+ "recall@10": 0.698,
1062
+ "f1@1": 0.363,
1063
+ "f1@5": 0.20066666666666674,
1064
+ "f1@10": 0.12690909090909094,
1065
+ "map@1": 0.363,
1066
+ "map@5": 0.45156666666666667,
1067
+ "map@10": 0.4643380952380952,
1068
+ "mrr@1": 0.363,
1069
+ "mrr@5": 0.45156666666666667,
1070
+ "mrr@10": 0.4643380952380952,
1071
+ "num_pred": 1000,
1072
+ "num_data": 1000
1073
+ },
1074
+ "HMDB51": {
1075
+ "hit@1": 0.405,
1076
+ "hit@5": 0.658,
1077
+ "hit@10": 0.783,
1078
+ "ndcg_linear@1": 0.405,
1079
+ "ndcg_linear@5": 0.5405643217050999,
1080
+ "ndcg_linear@10": 0.5815107823708526,
1081
+ "ndcg_exponential@1": 0.405,
1082
+ "ndcg_exponential@5": 0.5405643217050999,
1083
+ "ndcg_exponential@10": 0.5815107823708526,
1084
+ "precision@1": 0.405,
1085
+ "precision@5": 0.1316,
1086
+ "precision@10": 0.0783,
1087
+ "recall@1": 0.405,
1088
+ "recall@5": 0.658,
1089
+ "recall@10": 0.783,
1090
+ "f1@1": 0.405,
1091
+ "f1@5": 0.21933333333333338,
1092
+ "f1@10": 0.1423636363636364,
1093
+ "map@1": 0.405,
1094
+ "map@5": 0.5013833333333333,
1095
+ "map@10": 0.5185896825396826,
1096
+ "mrr@1": 0.405,
1097
+ "mrr@5": 0.5013833333333333,
1098
+ "mrr@10": 0.5185896825396826,
1099
+ "num_pred": 1000,
1100
+ "num_data": 1000
1101
+ },
1102
+ "UCF101": {
1103
+ "hit@1": 0.604,
1104
+ "hit@5": 0.852,
1105
+ "hit@10": 0.89,
1106
+ "ndcg_linear@1": 0.604,
1107
+ "ndcg_linear@5": 0.7417818963613594,
1108
+ "ndcg_linear@10": 0.7541096692471368,
1109
+ "ndcg_exponential@1": 0.604,
1110
+ "ndcg_exponential@5": 0.7417818963613594,
1111
+ "ndcg_exponential@10": 0.7541096692471368,
1112
+ "precision@1": 0.604,
1113
+ "precision@5": 0.17040000000000002,
1114
+ "precision@10": 0.08900000000000001,
1115
+ "recall@1": 0.604,
1116
+ "recall@5": 0.852,
1117
+ "recall@10": 0.89,
1118
+ "f1@1": 0.604,
1119
+ "f1@5": 0.284,
1120
+ "f1@10": 0.1618181818181818,
1121
+ "map@1": 0.604,
1122
+ "map@5": 0.7046166666666666,
1123
+ "map@10": 0.7097305555555556,
1124
+ "mrr@1": 0.604,
1125
+ "mrr@5": 0.7046166666666666,
1126
+ "mrr@10": 0.7097305555555556,
1127
+ "num_pred": 1000,
1128
+ "num_data": 1000
1129
+ },
1130
+ "Breakfast": {
1131
+ "hit@1": 0.16859122401847576,
1132
+ "hit@5": 0.6235565819861432,
1133
+ "hit@10": 1.0,
1134
+ "ndcg_linear@1": 0.16859122401847576,
1135
+ "ndcg_linear@5": 0.400691767704696,
1136
+ "ndcg_linear@10": 0.5235817090775436,
1137
+ "ndcg_exponential@1": 0.16859122401847576,
1138
+ "ndcg_exponential@5": 0.400691767704696,
1139
+ "ndcg_exponential@10": 0.5235817090775436,
1140
+ "precision@1": 0.16859122401847576,
1141
+ "precision@5": 0.12471131639722864,
1142
+ "precision@10": 0.1,
1143
+ "recall@1": 0.16859122401847576,
1144
+ "recall@5": 0.6235565819861432,
1145
+ "recall@10": 1.0,
1146
+ "f1@1": 0.16859122401847576,
1147
+ "f1@5": 0.20785219399538113,
1148
+ "f1@10": 0.1818181818181818,
1149
+ "map@1": 0.16859122401847576,
1150
+ "map@5": 0.32763664357197847,
1151
+ "map@10": 0.37902140840939913,
1152
+ "mrr@1": 0.16859122401847576,
1153
+ "mrr@5": 0.32763664357197847,
1154
+ "mrr@10": 0.37902140840939913,
1155
+ "num_pred": 433,
1156
+ "num_data": 433
1157
+ },
1158
+ "MVBench": {
1159
+ "hit@1": 0.372,
1160
+ "hit@5": 1.0,
1161
+ "hit@10": 1.0,
1162
+ "ndcg_linear@1": 0.372,
1163
+ "ndcg_linear@5": 0.7114371453270959,
1164
+ "ndcg_linear@10": 0.7114371453270959,
1165
+ "ndcg_exponential@1": 0.372,
1166
+ "ndcg_exponential@5": 0.7114371453270959,
1167
+ "ndcg_exponential@10": 0.7114371453270959,
1168
+ "precision@1": 0.372,
1169
+ "precision@5": 0.20000000000000004,
1170
+ "precision@10": 0.10000000000000002,
1171
+ "recall@1": 0.372,
1172
+ "recall@5": 1.0,
1173
+ "recall@10": 1.0,
1174
+ "f1@1": 0.372,
1175
+ "f1@5": 0.3333333333333333,
1176
+ "f1@10": 0.18181818181818182,
1177
+ "map@1": 0.372,
1178
+ "map@5": 0.6143833333333334,
1179
+ "map@10": 0.6143833333333334,
1180
+ "mrr@1": 0.372,
1181
+ "mrr@5": 0.6143833333333334,
1182
+ "mrr@10": 0.6143833333333334,
1183
+ "num_pred": 4000,
1184
+ "num_data": 4000
1185
+ },
1186
+ "Video-MME": {
1187
+ "hit@1": 0.34074074074074073,
1188
+ "hit@5": 1.0,
1189
+ "hit@10": 1.0,
1190
+ "ndcg_linear@1": 0.34074074074074073,
1191
+ "ndcg_linear@5": 0.6905732385187221,
1192
+ "ndcg_linear@10": 0.6905732385187221,
1193
+ "ndcg_exponential@1": 0.34074074074074073,
1194
+ "ndcg_exponential@5": 0.6905732385187221,
1195
+ "ndcg_exponential@10": 0.6905732385187221,
1196
+ "precision@1": 0.34074074074074073,
1197
+ "precision@5": 0.19999999999999996,
1198
+ "precision@10": 0.09999999999999998,
1199
+ "recall@1": 0.34074074074074073,
1200
+ "recall@5": 1.0,
1201
+ "recall@10": 1.0,
1202
+ "f1@1": 0.34074074074074073,
1203
+ "f1@5": 0.3333333333333334,
1204
+ "f1@10": 0.18181818181818188,
1205
+ "map@1": 0.34074074074074073,
1206
+ "map@5": 0.5870987654320988,
1207
+ "map@10": 0.5870987654320988,
1208
+ "mrr@1": 0.34074074074074073,
1209
+ "mrr@5": 0.5870987654320988,
1210
+ "mrr@10": 0.5870987654320988,
1211
+ "num_pred": 2700,
1212
+ "num_data": 2700
1213
+ },
1214
+ "NExTQA": {
1215
+ "hit@1": 0.4371788883699206,
1216
+ "hit@5": 1.0,
1217
+ "hit@10": 1.0,
1218
+ "ndcg_linear@1": 0.4371788883699206,
1219
+ "ndcg_linear@5": 0.7269325524352686,
1220
+ "ndcg_linear@10": 0.7269325524352686,
1221
+ "ndcg_exponential@1": 0.4371788883699206,
1222
+ "ndcg_exponential@5": 0.7269325524352686,
1223
+ "ndcg_exponential@10": 0.7269325524352686,
1224
+ "precision@1": 0.4371788883699206,
1225
+ "precision@5": 0.20000000000000004,
1226
+ "precision@10": 0.10000000000000002,
1227
+ "recall@1": 0.4371788883699206,
1228
+ "recall@5": 1.0,
1229
+ "recall@10": 1.0,
1230
+ "f1@1": 0.4371788883699206,
1231
+ "f1@5": 0.3333333333333333,
1232
+ "f1@10": 0.1818181818181818,
1233
+ "map@1": 0.4371788883699206,
1234
+ "map@5": 0.6369803829985987,
1235
+ "map@10": 0.6369803829985987,
1236
+ "mrr@1": 0.4371788883699206,
1237
+ "mrr@5": 0.6367857698894598,
1238
+ "mrr@10": 0.6367857698894598,
1239
+ "num_pred": 8564,
1240
+ "num_data": 8564
1241
+ },
1242
+ "EgoSchema": {
1243
+ "hit@1": 0.448,
1244
+ "hit@5": 1.0,
1245
+ "hit@10": 1.0,
1246
+ "ndcg_linear@1": 0.448,
1247
+ "ndcg_linear@5": 0.7459721375093364,
1248
+ "ndcg_linear@10": 0.7459721375093364,
1249
+ "ndcg_exponential@1": 0.448,
1250
+ "ndcg_exponential@5": 0.7459721375093364,
1251
+ "ndcg_exponential@10": 0.7459721375093364,
1252
+ "precision@1": 0.448,
1253
+ "precision@5": 0.2,
1254
+ "precision@10": 0.1,
1255
+ "recall@1": 0.448,
1256
+ "recall@5": 1.0,
1257
+ "recall@10": 1.0,
1258
+ "f1@1": 0.448,
1259
+ "f1@5": 0.3333333333333333,
1260
+ "f1@10": 0.18181818181818182,
1261
+ "map@1": 0.448,
1262
+ "map@5": 0.6608999999999999,
1263
+ "map@10": 0.6608999999999999,
1264
+ "mrr@1": 0.448,
1265
+ "mrr@5": 0.6608999999999999,
1266
+ "mrr@10": 0.6608999999999999,
1267
+ "num_pred": 500,
1268
+ "num_data": 500
1269
+ },
1270
+ "ActivityNetQA": {
1271
+ "hit@1": 0.532,
1272
+ "hit@5": 1.0,
1273
+ "hit@10": 1.0,
1274
+ "ndcg_linear@1": 0.532,
1275
+ "ndcg_linear@5": 0.8272751246714422,
1276
+ "ndcg_linear@10": 0.8272751246714422,
1277
+ "ndcg_exponential@1": 0.532,
1278
+ "ndcg_exponential@5": 0.8272751246714422,
1279
+ "ndcg_exponential@10": 0.8272751246714422,
1280
+ "precision@1": 0.532,
1281
+ "precision@5": 0.20000000000000004,
1282
+ "precision@10": 0.10000000000000002,
1283
+ "recall@1": 0.532,
1284
+ "recall@5": 1.0,
1285
+ "recall@10": 1.0,
1286
+ "f1@1": 0.532,
1287
+ "f1@5": 0.3333333333333333,
1288
+ "f1@10": 0.18181818181818182,
1289
+ "map@1": 0.532,
1290
+ "map@5": 0.766,
1291
+ "map@10": 0.766,
1292
+ "mrr@1": 0.532,
1293
+ "mrr@5": 0.766,
1294
+ "mrr@10": 0.766,
1295
+ "num_pred": 1000,
1296
+ "num_data": 1000
1297
+ },
1298
+ "DiDeMo": {
1299
+ "hit@1": 0.24800796812749004,
1300
+ "hit@5": 0.4711155378486056,
1301
+ "hit@10": 0.5677290836653387,
1302
+ "ndcg_linear@1": 0.24800796812749004,
1303
+ "ndcg_linear@5": 0.36275185397452103,
1304
+ "ndcg_linear@10": 0.3937078477068639,
1305
+ "ndcg_exponential@1": 0.24800796812749004,
1306
+ "ndcg_exponential@5": 0.36275185397452103,
1307
+ "ndcg_exponential@10": 0.3937078477068639,
1308
+ "precision@1": 0.24800796812749004,
1309
+ "precision@5": 0.0942231075697211,
1310
+ "precision@10": 0.05677290836653386,
1311
+ "recall@1": 0.24800796812749004,
1312
+ "recall@5": 0.4711155378486056,
1313
+ "recall@10": 0.5677290836653387,
1314
+ "f1@1": 0.24800796812749004,
1315
+ "f1@5": 0.15703851261620191,
1316
+ "f1@10": 0.10322346975733432,
1317
+ "map@1": 0.24800796812749004,
1318
+ "map@5": 0.3271082337317397,
1319
+ "map@10": 0.33971653070258645,
1320
+ "mrr@1": 0.24800796812749004,
1321
+ "mrr@5": 0.3271082337317397,
1322
+ "mrr@10": 0.33971653070258645,
1323
+ "num_pred": 1004,
1324
+ "num_data": 1004
1325
+ },
1326
+ "MSR-VTT": {
1327
+ "hit@1": 0.221,
1328
+ "hit@5": 0.441,
1329
+ "hit@10": 0.558,
1330
+ "ndcg_linear@1": 0.221,
1331
+ "ndcg_linear@5": 0.3378462330246669,
1332
+ "ndcg_linear@10": 0.37615489678599645,
1333
+ "ndcg_exponential@1": 0.221,
1334
+ "ndcg_exponential@5": 0.3378462330246669,
1335
+ "ndcg_exponential@10": 0.37615489678599645,
1336
+ "precision@1": 0.221,
1337
+ "precision@5": 0.08819999999999999,
1338
+ "precision@10": 0.055799999999999995,
1339
+ "recall@1": 0.221,
1340
+ "recall@5": 0.441,
1341
+ "recall@10": 0.558,
1342
+ "f1@1": 0.221,
1343
+ "f1@5": 0.14700000000000002,
1344
+ "f1@10": 0.10145454545454546,
1345
+ "map@1": 0.221,
1346
+ "map@5": 0.30355,
1347
+ "map@10": 0.31964126984126984,
1348
+ "mrr@1": 0.221,
1349
+ "mrr@5": 0.30355,
1350
+ "mrr@10": 0.31964126984126984,
1351
+ "num_pred": 1000,
1352
+ "num_data": 1000
1353
+ },
1354
+ "MSVD": {
1355
+ "hit@1": 0.46119402985074626,
1356
+ "hit@5": 0.7,
1357
+ "hit@10": 0.7850746268656716,
1358
+ "ndcg_linear@1": 0.46119402985074626,
1359
+ "ndcg_linear@5": 0.5909143508859,
1360
+ "ndcg_linear@10": 0.6184940826509501,
1361
+ "ndcg_exponential@1": 0.46119402985074626,
1362
+ "ndcg_exponential@5": 0.5909143508859,
1363
+ "ndcg_exponential@10": 0.6184940826509501,
1364
+ "precision@1": 0.46119402985074626,
1365
+ "precision@5": 0.13999999999999999,
1366
+ "precision@10": 0.07850746268656715,
1367
+ "recall@1": 0.46119402985074626,
1368
+ "recall@5": 0.7,
1369
+ "recall@10": 0.7850746268656716,
1370
+ "f1@1": 0.46119402985074626,
1371
+ "f1@5": 0.2333333333333334,
1372
+ "f1@10": 0.14274084124830397,
1373
+ "map@1": 0.46119402985074626,
1374
+ "map@5": 0.5543781094527364,
1375
+ "map@10": 0.5658019426676143,
1376
+ "mrr@1": 0.46119402985074626,
1377
+ "mrr@5": 0.5543781094527364,
1378
+ "mrr@10": 0.5658019426676143,
1379
+ "num_pred": 670,
1380
+ "num_data": 670
1381
+ },
1382
+ "VATEX": {
1383
+ "hit@1": 0.19138008039303261,
1384
+ "hit@5": 0.41692719964269764,
1385
+ "hit@10": 0.5225547119249665,
1386
+ "ndcg_linear@1": 0.19138008039303261,
1387
+ "ndcg_linear@5": 0.31066559826092355,
1388
+ "ndcg_linear@10": 0.3449304405187584,
1389
+ "ndcg_exponential@1": 0.19138008039303261,
1390
+ "ndcg_exponential@5": 0.31066559826092355,
1391
+ "ndcg_exponential@10": 0.3449304405187584,
1392
+ "precision@1": 0.19138008039303261,
1393
+ "precision@5": 0.08338543992853951,
1394
+ "precision@10": 0.05225547119249665,
1395
+ "recall@1": 0.19138008039303261,
1396
+ "recall@5": 0.41692719964269764,
1397
+ "recall@10": 0.5225547119249665,
1398
+ "f1@1": 0.19138008039303261,
1399
+ "f1@5": 0.13897573321423257,
1400
+ "f1@10": 0.09500994762272119,
1401
+ "map@1": 0.19138008039303261,
1402
+ "map@5": 0.27535730236712824,
1403
+ "map@10": 0.28956069177708305,
1404
+ "mrr@1": 0.19138008039303261,
1405
+ "mrr@5": 0.27535730236712824,
1406
+ "mrr@10": 0.28956069177708305,
1407
+ "num_pred": 4478,
1408
+ "num_data": 4478
1409
+ },
1410
+ "YouCook2": {
1411
+ "hit@1": 0.09153821956590123,
1412
+ "hit@5": 0.21358917898710286,
1413
+ "hit@10": 0.29285938974520287,
1414
+ "ndcg_linear@1": 0.09153821956590123,
1415
+ "ndcg_linear@5": 0.15446626761982413,
1416
+ "ndcg_linear@10": 0.18024480954320224,
1417
+ "ndcg_exponential@1": 0.09153821956590123,
1418
+ "ndcg_exponential@5": 0.15446626761982413,
1419
+ "ndcg_exponential@10": 0.18024480954320224,
1420
+ "precision@1": 0.09153821956590123,
1421
+ "precision@5": 0.04271783579742058,
1422
+ "precision@10": 0.02928593897452029,
1423
+ "recall@1": 0.09153821956590123,
1424
+ "recall@5": 0.21358917898710286,
1425
+ "recall@10": 0.29285938974520287,
1426
+ "f1@1": 0.09153821956590123,
1427
+ "f1@5": 0.07119639299570096,
1428
+ "f1@10": 0.053247161771855074,
1429
+ "map@1": 0.09153821956590123,
1430
+ "map@5": 0.13498479605746042,
1431
+ "map@10": 0.14571006655781743,
1432
+ "mrr@1": 0.09153821956590123,
1433
+ "mrr@5": 0.13498479605746042,
1434
+ "mrr@10": 0.14571006655781743,
1435
+ "num_pred": 3179,
1436
+ "num_data": 3179
1437
+ },
1438
+ "QVHighlight": {
1439
+ "hit@1": 0.5383194829178208,
1440
+ "hit@5": 0.863342566943675,
1441
+ "hit@10": 1.0,
1442
+ "ndcg_linear@1": 0.5383194829178208,
1443
+ "ndcg_linear@5": 0.7079527214519653,
1444
+ "ndcg_linear@10": 0.7516086585604039,
1445
+ "ndcg_exponential@1": 0.5383194829178208,
1446
+ "ndcg_exponential@5": 0.7079527214519653,
1447
+ "ndcg_exponential@10": 0.7516086585604039,
1448
+ "precision@1": 0.5383194829178208,
1449
+ "precision@5": 0.17266851338873498,
1450
+ "precision@10": 0.09999999999999998,
1451
+ "recall@1": 0.5383194829178208,
1452
+ "recall@5": 0.863342566943675,
1453
+ "recall@10": 1.0,
1454
+ "f1@1": 0.5383194829178208,
1455
+ "f1@5": 0.28778085564789174,
1456
+ "f1@10": 0.18181818181818185,
1457
+ "map@1": 0.5383194829178208,
1458
+ "map@5": 0.6565712526931364,
1459
+ "map@10": 0.6742862272640666,
1460
+ "mrr@1": 0.5383194829178208,
1461
+ "mrr@5": 0.6565712526931364,
1462
+ "mrr@10": 0.6742862272640666,
1463
+ "num_pred": 1083,
1464
+ "num_data": 1083
1465
+ },
1466
+ "Charades-STA": {
1467
+ "hit@1": 0.10866574965612105,
1468
+ "hit@5": 0.4786795048143054,
1469
+ "hit@10": 1.0,
1470
+ "ndcg_linear@1": 0.10866574965612105,
1471
+ "ndcg_linear@5": 0.2926265568216908,
1472
+ "ndcg_linear@10": 0.4575713199023012,
1473
+ "ndcg_exponential@1": 0.10866574965612105,
1474
+ "ndcg_exponential@5": 0.2926265568216908,
1475
+ "ndcg_exponential@10": 0.4575713199023012,
1476
+ "precision@1": 0.10866574965612105,
1477
+ "precision@5": 0.09573590096286107,
1478
+ "precision@10": 0.09999999999999998,
1479
+ "recall@1": 0.10866574965612105,
1480
+ "recall@5": 0.4786795048143054,
1481
+ "recall@10": 1.0,
1482
+ "f1@1": 0.10866574965612105,
1483
+ "f1@5": 0.15955983493810183,
1484
+ "f1@10": 0.18181818181818185,
1485
+ "map@1": 0.10866574965612105,
1486
+ "map@5": 0.23207244383310408,
1487
+ "map@10": 0.2980508067509443,
1488
+ "mrr@1": 0.10866574965612105,
1489
+ "mrr@5": 0.23207244383310408,
1490
+ "mrr@10": 0.2980508067509443,
1491
+ "num_pred": 727,
1492
+ "num_data": 727
1493
+ },
1494
+ "MomentSeeker": {
1495
+ "hit@1": 0.3383333333333333,
1496
+ "hit@5": 0.8205555555555556,
1497
+ "hit@10": 1.0,
1498
+ "ndcg_linear@1": 0.3383333333333333,
1499
+ "ndcg_linear@5": 0.5821798365943692,
1500
+ "ndcg_linear@10": 0.6491829437988351,
1501
+ "ndcg_exponential@1": 0.3383333333333333,
1502
+ "ndcg_exponential@5": 0.5821798365943692,
1503
+ "ndcg_exponential@10": 0.6491829437988351,
1504
+ "precision@1": 0.3383333333333333,
1505
+ "precision@5": 0.17922222222222223,
1506
+ "precision@10": 0.11311111111111112,
1507
+ "recall@1": 0.31546296296296295,
1508
+ "recall@5": 0.8009259259259259,
1509
+ "recall@10": 0.9988888888888889,
1510
+ "f1@1": 0.3220299823633157,
1511
+ "f1@5": 0.28780555863889207,
1512
+ "f1@10": 0.20050498883832216,
1513
+ "map@1": 0.3383333333333333,
1514
+ "map@5": 0.5041177469135804,
1515
+ "map@10": 0.5349385196208113,
1516
+ "mrr@1": 0.3383333333333333,
1517
+ "mrr@5": 0.5154722222222222,
1518
+ "mrr@10": 0.540335758377425,
1519
+ "num_pred": 1800,
1520
+ "num_data": 1800
1521
+ }
1522
+ },
1523
+ "visdoc": {
1524
+ "ViDoRe_arxivqa": {
1525
+ "hit@1": 0.052,
1526
+ "hit@5": 0.172,
1527
+ "hit@10": 0.286,
1528
+ "ndcg_linear@1": 0.052,
1529
+ "ndcg_linear@5": 0.10801878370138777,
1530
+ "ndcg_linear@10": 0.14373908906362196,
1531
+ "ndcg_exponential@1": 0.052,
1532
+ "ndcg_exponential@5": 0.10801878370138777,
1533
+ "ndcg_exponential@10": 0.14373908906362196,
1534
+ "precision@1": 0.052,
1535
+ "precision@5": 0.03440000000000001,
1536
+ "precision@10": 0.0286,
1537
+ "recall@1": 0.052,
1538
+ "recall@5": 0.172,
1539
+ "recall@10": 0.286,
1540
+ "f1@1": 0.052,
1541
+ "f1@5": 0.05733333333333333,
1542
+ "f1@10": 0.052,
1543
+ "map@1": 0.052,
1544
+ "map@5": 0.08753333333333334,
1545
+ "map@10": 0.10160873015873015,
1546
+ "mrr@1": 0.052,
1547
+ "mrr@5": 0.08753333333333334,
1548
+ "mrr@10": 0.10160873015873015,
1549
+ "num_pred": 500,
1550
+ "num_data": 500
1551
+ },
1552
+ "ViDoRe_docvqa": {
1553
+ "hit@1": 0.13747228381374724,
1554
+ "hit@5": 0.2549889135254989,
1555
+ "hit@10": 0.3148558758314856,
1556
+ "ndcg_linear@1": 0.13747228381374724,
1557
+ "ndcg_linear@5": 0.19129511635223329,
1558
+ "ndcg_linear@10": 0.2105752120749416,
1559
+ "ndcg_exponential@1": 0.13747228381374724,
1560
+ "ndcg_exponential@5": 0.19129511635223329,
1561
+ "ndcg_exponential@10": 0.2105752120749416,
1562
+ "precision@1": 0.13747228381374724,
1563
+ "precision@5": 0.050997782705099776,
1564
+ "precision@10": 0.031929046563192905,
1565
+ "recall@1": 0.13458980044345897,
1566
+ "recall@5": 0.24811529933481155,
1567
+ "recall@10": 0.30842572062084256,
1568
+ "f1@1": 0.1352549889135255,
1569
+ "f1@5": 0.08408826945412314,
1570
+ "f1@10": 0.057562319424847144,
1571
+ "map@1": 0.13747228381374724,
1572
+ "map@5": 0.17147080561714712,
1573
+ "map@10": 0.17921637982613592,
1574
+ "mrr@1": 0.13747228381374724,
1575
+ "mrr@5": 0.17597930524759794,
1576
+ "mrr@10": 0.1834661950515609,
1577
+ "num_pred": 451,
1578
+ "num_data": 451
1579
+ },
1580
+ "ViDoRe_infovqa": {
1581
+ "hit@1": 0.3319838056680162,
1582
+ "hit@5": 0.5748987854251012,
1583
+ "hit@10": 0.6923076923076923,
1584
+ "ndcg_linear@1": 0.3319838056680162,
1585
+ "ndcg_linear@5": 0.46253535711806587,
1586
+ "ndcg_linear@10": 0.5004886054716596,
1587
+ "ndcg_exponential@1": 0.3319838056680162,
1588
+ "ndcg_exponential@5": 0.46253535711806587,
1589
+ "ndcg_exponential@10": 0.5004886054716596,
1590
+ "precision@1": 0.3319838056680162,
1591
+ "precision@5": 0.11497975708502024,
1592
+ "precision@10": 0.06923076923076922,
1593
+ "recall@1": 0.3319838056680162,
1594
+ "recall@5": 0.5748987854251012,
1595
+ "recall@10": 0.6912955465587044,
1596
+ "f1@1": 0.3319838056680162,
1597
+ "f1@5": 0.19163292847503377,
1598
+ "f1@10": 0.12584345479082323,
1599
+ "map@1": 0.3319838056680162,
1600
+ "map@5": 0.4250337381916329,
1601
+ "map@10": 0.4408127691022428,
1602
+ "mrr@1": 0.3319838056680162,
1603
+ "mrr@5": 0.4250337381916329,
1604
+ "mrr@10": 0.4409252297410192,
1605
+ "num_pred": 494,
1606
+ "num_data": 494
1607
+ },
1608
+ "ViDoRe_tabfquad": {
1609
+ "hit@1": 0.275,
1610
+ "hit@5": 0.5678571428571428,
1611
+ "hit@10": 0.6928571428571428,
1612
+ "ndcg_linear@1": 0.275,
1613
+ "ndcg_linear@5": 0.42836855281007846,
1614
+ "ndcg_linear@10": 0.4688038965463907,
1615
+ "ndcg_exponential@1": 0.275,
1616
+ "ndcg_exponential@5": 0.42836855281007846,
1617
+ "ndcg_exponential@10": 0.4688038965463907,
1618
+ "precision@1": 0.275,
1619
+ "precision@5": 0.11357142857142856,
1620
+ "precision@10": 0.06928571428571428,
1621
+ "recall@1": 0.275,
1622
+ "recall@5": 0.5678571428571428,
1623
+ "recall@10": 0.6928571428571428,
1624
+ "f1@1": 0.275,
1625
+ "f1@5": 0.1892857142857143,
1626
+ "f1@10": 0.125974025974026,
1627
+ "map@1": 0.275,
1628
+ "map@5": 0.3823214285714286,
1629
+ "map@10": 0.3990192743764172,
1630
+ "mrr@1": 0.275,
1631
+ "mrr@5": 0.3823214285714286,
1632
+ "mrr@10": 0.3990192743764172,
1633
+ "num_pred": 280,
1634
+ "num_data": 280
1635
+ },
1636
+ "ViDoRe_tatdqa": {
1637
+ "hit@1": 0.06804374240583232,
1638
+ "hit@5": 0.1591737545565006,
1639
+ "hit@10": 0.22053462940461727,
1640
+ "ndcg_linear@1": 0.06804374240583232,
1641
+ "ndcg_linear@5": 0.11430035232416713,
1642
+ "ndcg_linear@10": 0.13412008753307786,
1643
+ "ndcg_exponential@1": 0.06804374240583232,
1644
+ "ndcg_exponential@5": 0.11430035232416713,
1645
+ "ndcg_exponential@10": 0.13412008753307786,
1646
+ "precision@1": 0.06804374240583232,
1647
+ "precision@5": 0.03183475091130013,
1648
+ "precision@10": 0.022053462940461725,
1649
+ "recall@1": 0.06804374240583232,
1650
+ "recall@5": 0.1586269744835966,
1651
+ "recall@10": 0.21998784933171325,
1652
+ "f1@1": 0.06804374240583232,
1653
+ "f1@5": 0.052936411502632646,
1654
+ "f1@10": 0.04004749806693913,
1655
+ "map@1": 0.06804374240583232,
1656
+ "map@5": 0.09965978128797083,
1657
+ "map@10": 0.1078442689347914,
1658
+ "mrr@1": 0.06804374240583232,
1659
+ "mrr@5": 0.09975698663426488,
1660
+ "mrr@10": 0.10795362494937222,
1661
+ "num_pred": 1646,
1662
+ "num_data": 1646
1663
+ },
1664
+ "ViDoRe_shiftproject": {
1665
+ "hit@1": 0.07,
1666
+ "hit@5": 0.17,
1667
+ "hit@10": 0.27,
1668
+ "ndcg_linear@1": 0.07,
1669
+ "ndcg_linear@5": 0.12035565121611999,
1670
+ "ndcg_linear@10": 0.1523429715395014,
1671
+ "ndcg_exponential@1": 0.07,
1672
+ "ndcg_exponential@5": 0.12035565121611999,
1673
+ "ndcg_exponential@10": 0.1523429715395014,
1674
+ "precision@1": 0.07,
1675
+ "precision@5": 0.034,
1676
+ "precision@10": 0.027000000000000003,
1677
+ "recall@1": 0.07,
1678
+ "recall@5": 0.17,
1679
+ "recall@10": 0.27,
1680
+ "f1@1": 0.07,
1681
+ "f1@5": 0.05666666666666667,
1682
+ "f1@10": 0.049090909090909095,
1683
+ "map@1": 0.07,
1684
+ "map@5": 0.10400000000000001,
1685
+ "map@10": 0.116984126984127,
1686
+ "mrr@1": 0.07,
1687
+ "mrr@5": 0.10400000000000001,
1688
+ "mrr@10": 0.116984126984127,
1689
+ "num_pred": 100,
1690
+ "num_data": 100
1691
+ },
1692
+ "ViDoRe_syntheticDocQA_artificial_intelligence": {
1693
+ "hit@1": 0.05,
1694
+ "hit@5": 0.15,
1695
+ "hit@10": 0.22,
1696
+ "ndcg_linear@1": 0.05,
1697
+ "ndcg_linear@5": 0.1031574868850601,
1698
+ "ndcg_linear@10": 0.12568086090486966,
1699
+ "ndcg_exponential@1": 0.05,
1700
+ "ndcg_exponential@5": 0.1031574868850601,
1701
+ "ndcg_exponential@10": 0.12568086090486966,
1702
+ "precision@1": 0.05,
1703
+ "precision@5": 0.030000000000000006,
1704
+ "precision@10": 0.022,
1705
+ "recall@1": 0.05,
1706
+ "recall@5": 0.15,
1707
+ "recall@10": 0.22,
1708
+ "f1@1": 0.05,
1709
+ "f1@5": 0.05,
1710
+ "f1@10": 0.04,
1711
+ "map@1": 0.05,
1712
+ "map@5": 0.0875,
1713
+ "map@10": 0.09673412698412699,
1714
+ "mrr@1": 0.05,
1715
+ "mrr@5": 0.0875,
1716
+ "mrr@10": 0.09673412698412699,
1717
+ "num_pred": 100,
1718
+ "num_data": 100
1719
+ },
1720
+ "ViDoRe_syntheticDocQA_energy": {
1721
+ "hit@1": 0.18,
1722
+ "hit@5": 0.31,
1723
+ "hit@10": 0.41,
1724
+ "ndcg_linear@1": 0.18,
1725
+ "ndcg_linear@5": 0.24771924937667159,
1726
+ "ndcg_linear@10": 0.2802583416144934,
1727
+ "ndcg_exponential@1": 0.18,
1728
+ "ndcg_exponential@5": 0.24771924937667159,
1729
+ "ndcg_exponential@10": 0.2802583416144934,
1730
+ "precision@1": 0.18,
1731
+ "precision@5": 0.062,
1732
+ "precision@10": 0.040999999999999995,
1733
+ "recall@1": 0.18,
1734
+ "recall@5": 0.31,
1735
+ "recall@10": 0.41,
1736
+ "f1@1": 0.18,
1737
+ "f1@5": 0.10333333333333336,
1738
+ "f1@10": 0.07454545454545455,
1739
+ "map@1": 0.18,
1740
+ "map@5": 0.22699999999999998,
1741
+ "map@10": 0.24053968253968258,
1742
+ "mrr@1": 0.18,
1743
+ "mrr@5": 0.22699999999999998,
1744
+ "mrr@10": 0.24053968253968258,
1745
+ "num_pred": 100,
1746
+ "num_data": 100
1747
+ },
1748
+ "ViDoRe_syntheticDocQA_government_reports": {
1749
+ "hit@1": 0.09,
1750
+ "hit@5": 0.23,
1751
+ "hit@10": 0.27,
1752
+ "ndcg_linear@1": 0.09,
1753
+ "ndcg_linear@5": 0.16359030940399763,
1754
+ "ndcg_linear@10": 0.17675975017719422,
1755
+ "ndcg_exponential@1": 0.09,
1756
+ "ndcg_exponential@5": 0.16359030940399763,
1757
+ "ndcg_exponential@10": 0.17675975017719422,
1758
+ "precision@1": 0.09,
1759
+ "precision@5": 0.046000000000000006,
1760
+ "precision@10": 0.027000000000000007,
1761
+ "recall@1": 0.09,
1762
+ "recall@5": 0.23,
1763
+ "recall@10": 0.27,
1764
+ "f1@1": 0.09,
1765
+ "f1@5": 0.07666666666666667,
1766
+ "f1@10": 0.04909090909090908,
1767
+ "map@1": 0.09,
1768
+ "map@5": 0.14150000000000001,
1769
+ "map@10": 0.14708333333333334,
1770
+ "mrr@1": 0.09,
1771
+ "mrr@5": 0.14150000000000001,
1772
+ "mrr@10": 0.14708333333333334,
1773
+ "num_pred": 100,
1774
+ "num_data": 100
1775
+ },
1776
+ "ViDoRe_syntheticDocQA_healthcare_industry": {
1777
+ "hit@1": 0.14,
1778
+ "hit@5": 0.36,
1779
+ "hit@10": 0.4,
1780
+ "ndcg_linear@1": 0.14,
1781
+ "ndcg_linear@5": 0.2593663913604869,
1782
+ "ndcg_linear@10": 0.2717200597145647,
1783
+ "ndcg_exponential@1": 0.14,
1784
+ "ndcg_exponential@5": 0.2593663913604869,
1785
+ "ndcg_exponential@10": 0.2717200597145647,
1786
+ "precision@1": 0.14,
1787
+ "precision@5": 0.07200000000000001,
1788
+ "precision@10": 0.04,
1789
+ "recall@1": 0.14,
1790
+ "recall@5": 0.36,
1791
+ "recall@10": 0.4,
1792
+ "f1@1": 0.14,
1793
+ "f1@5": 0.12000000000000002,
1794
+ "f1@10": 0.07272727272727274,
1795
+ "map@1": 0.14,
1796
+ "map@5": 0.22566666666666665,
1797
+ "map@10": 0.2304444444444444,
1798
+ "mrr@1": 0.14,
1799
+ "mrr@5": 0.22566666666666665,
1800
+ "mrr@10": 0.2304444444444444,
1801
+ "num_pred": 100,
1802
+ "num_data": 100
1803
+ },
1804
+ "ViDoRe_esg_reports_human_labeled_v2": {
1805
+ "hit@1": 0.038461538461538464,
1806
+ "hit@5": 0.17307692307692307,
1807
+ "hit@10": 0.23076923076923078,
1808
+ "ndcg_linear@1": 0.038461538461538464,
1809
+ "ndcg_linear@5": 0.07581945100217463,
1810
+ "ndcg_linear@10": 0.08884346676199335,
1811
+ "ndcg_exponential@1": 0.038461538461538464,
1812
+ "ndcg_exponential@5": 0.07527592503218486,
1813
+ "ndcg_exponential@10": 0.0882008820280547,
1814
+ "precision@1": 0.038461538461538464,
1815
+ "precision@5": 0.05000000000000001,
1816
+ "precision@10": 0.038461538461538464,
1817
+ "recall@1": 0.020833333333333332,
1818
+ "recall@5": 0.10961538461538461,
1819
+ "recall@10": 0.14761904761904762,
1820
+ "f1@1": 0.022189349112426034,
1821
+ "f1@5": 0.057642031171442946,
1822
+ "f1@10": 0.054193845370315956,
1823
+ "map@1": 0.038461538461538464,
1824
+ "map@5": 0.05387820512820513,
1825
+ "map@10": 0.05896291208791209,
1826
+ "mrr@1": 0.038461538461538464,
1827
+ "mrr@5": 0.07724358974358975,
1828
+ "mrr@10": 0.08392094017094018,
1829
+ "num_pred": 52,
1830
+ "num_data": 52
1831
+ },
1832
+ "ViDoRe_biomedical_lectures_v2_multilingual": {
1833
+ "hit@1": 0.096875,
1834
+ "hit@5": 0.296875,
1835
+ "hit@10": 0.3796875,
1836
+ "ndcg_linear@1": 0.096875,
1837
+ "ndcg_linear@5": 0.1327817509891042,
1838
+ "ndcg_linear@10": 0.15578005969658662,
1839
+ "ndcg_exponential@1": 0.096875,
1840
+ "ndcg_exponential@5": 0.1327817509891042,
1841
+ "ndcg_exponential@10": 0.15578005969658662,
1842
+ "precision@1": 0.096875,
1843
+ "precision@5": 0.06625,
1844
+ "precision@10": 0.05015625,
1845
+ "recall@1": 0.05542025862068965,
1846
+ "recall@5": 0.1645906222010748,
1847
+ "recall@10": 0.23159770265864968,
1848
+ "f1@1": 0.06360192325036075,
1849
+ "f1@5": 0.08230852582874641,
1850
+ "f1@10": 0.07338045655325068,
1851
+ "map@1": 0.096875,
1852
+ "map@5": 0.09772092013888889,
1853
+ "map@10": 0.10609532519605062,
1854
+ "mrr@1": 0.096875,
1855
+ "mrr@5": 0.16531250000000003,
1856
+ "mrr@10": 0.1761204117063492,
1857
+ "num_pred": 640,
1858
+ "num_data": 640
1859
+ },
1860
+ "ViDoRe_economics_reports_v2_multilingual": {
1861
+ "hit@1": 0.1939655172413793,
1862
+ "hit@5": 0.46551724137931033,
1863
+ "hit@10": 0.5948275862068966,
1864
+ "ndcg_linear@1": 0.1939655172413793,
1865
+ "ndcg_linear@5": 0.19075341400656756,
1866
+ "ndcg_linear@10": 0.19262260915535673,
1867
+ "ndcg_exponential@1": 0.1939655172413793,
1868
+ "ndcg_exponential@5": 0.19075341400656748,
1869
+ "ndcg_exponential@10": 0.19262260915535673,
1870
+ "precision@1": 0.1939655172413793,
1871
+ "precision@5": 0.18448275862068964,
1872
+ "precision@10": 0.16724137931034483,
1873
+ "recall@1": 0.016014854892863833,
1874
+ "recall@5": 0.07300449328968175,
1875
+ "recall@10": 0.14033065985008555,
1876
+ "f1@1": 0.029036373118143485,
1877
+ "f1@5": 0.0903316153795555,
1878
+ "f1@10": 0.12402634113864117,
1879
+ "map@1": 0.1939655172413793,
1880
+ "map@5": 0.12855603448275862,
1881
+ "map@10": 0.1083281829653956,
1882
+ "mrr@1": 0.1939655172413793,
1883
+ "mrr@5": 0.2959051724137931,
1884
+ "mrr@10": 0.3119937055281883,
1885
+ "num_pred": 232,
1886
+ "num_data": 232
1887
+ },
1888
+ "ViDoRe_esg_reports_v2_multilingual": {
1889
+ "hit@1": 0.043859649122807015,
1890
+ "hit@5": 0.16228070175438597,
1891
+ "hit@10": 0.25877192982456143,
1892
+ "ndcg_linear@1": 0.043859649122807015,
1893
+ "ndcg_linear@5": 0.05924300567334283,
1894
+ "ndcg_linear@10": 0.09666072127808396,
1895
+ "ndcg_exponential@1": 0.043859649122807015,
1896
+ "ndcg_exponential@5": 0.05924300567334283,
1897
+ "ndcg_exponential@10": 0.09666072127808396,
1898
+ "precision@1": 0.043859649122807015,
1899
+ "precision@5": 0.04912280701754387,
1900
+ "precision@10": 0.054385964912280704,
1901
+ "recall@1": 0.008406432748538011,
1902
+ "recall@5": 0.07328216374269006,
1903
+ "recall@10": 0.17160087719298245,
1904
+ "f1@1": 0.013420302893987103,
1905
+ "f1@5": 0.05224007874936668,
1906
+ "f1@10": 0.07439770268717638,
1907
+ "map@1": 0.043859649122807015,
1908
+ "map@5": 0.03577850877192982,
1909
+ "map@10": 0.0544104619186856,
1910
+ "mrr@1": 0.043859649122807015,
1911
+ "mrr@5": 0.07339181286549706,
1912
+ "mrr@10": 0.08703181565023671,
1913
+ "num_pred": 228,
1914
+ "num_data": 228
1915
+ },
1916
+ "VisRAG_ArxivQA": {
1917
+ "hit@1": 0.012254901960784314,
1918
+ "hit@5": 0.02696078431372549,
1919
+ "hit@10": 0.03553921568627451,
1920
+ "ndcg_linear@1": 0.012254901960784314,
1921
+ "ndcg_linear@5": 0.020155243188820424,
1922
+ "ndcg_linear@10": 0.022825943867728897,
1923
+ "ndcg_exponential@1": 0.012254901960784314,
1924
+ "ndcg_exponential@5": 0.020155243188820424,
1925
+ "ndcg_exponential@10": 0.022825943867728897,
1926
+ "precision@1": 0.012254901960784314,
1927
+ "precision@5": 0.005392156862745099,
1928
+ "precision@10": 0.0035539215686274514,
1929
+ "recall@1": 0.012254901960784314,
1930
+ "recall@5": 0.02696078431372549,
1931
+ "recall@10": 0.03553921568627451,
1932
+ "f1@1": 0.012254901960784314,
1933
+ "f1@5": 0.008986928104575164,
1934
+ "f1@10": 0.006461675579322638,
1935
+ "map@1": 0.012254901960784314,
1936
+ "map@5": 0.01787173202614379,
1937
+ "map@10": 0.018913398692810456,
1938
+ "mrr@1": 0.012254901960784314,
1939
+ "mrr@5": 0.01787173202614379,
1940
+ "mrr@10": 0.018913398692810456,
1941
+ "num_pred": 816,
1942
+ "num_data": 816
1943
+ },
1944
+ "VisRAG_ChartQA": {
1945
+ "hit@1": 0.31746031746031744,
1946
+ "hit@5": 0.49206349206349204,
1947
+ "hit@10": 0.5396825396825397,
1948
+ "ndcg_linear@1": 0.31746031746031744,
1949
+ "ndcg_linear@5": 0.41335716785860044,
1950
+ "ndcg_linear@10": 0.42995633781970166,
1951
+ "ndcg_exponential@1": 0.31746031746031744,
1952
+ "ndcg_exponential@5": 0.41335716785860044,
1953
+ "ndcg_exponential@10": 0.42995633781970166,
1954
+ "precision@1": 0.31746031746031744,
1955
+ "precision@5": 0.09841269841269841,
1956
+ "precision@10": 0.05396825396825397,
1957
+ "recall@1": 0.31746031746031744,
1958
+ "recall@5": 0.49206349206349204,
1959
+ "recall@10": 0.5396825396825397,
1960
+ "f1@1": 0.31746031746031744,
1961
+ "f1@5": 0.1640211640211641,
1962
+ "f1@10": 0.09812409812409813,
1963
+ "map@1": 0.31746031746031744,
1964
+ "map@5": 0.3867724867724867,
1965
+ "map@10": 0.39433106575963717,
1966
+ "mrr@1": 0.31746031746031744,
1967
+ "mrr@5": 0.3867724867724867,
1968
+ "mrr@10": 0.39433106575963717,
1969
+ "num_pred": 63,
1970
+ "num_data": 63
1971
+ },
1972
+ "VisRAG_MP-DocVQA": {
1973
+ "hit@1": 0.2436548223350254,
1974
+ "hit@5": 0.41624365482233505,
1975
+ "hit@10": 0.48223350253807107,
1976
+ "ndcg_linear@1": 0.2436548223350254,
1977
+ "ndcg_linear@5": 0.33378850914695807,
1978
+ "ndcg_linear@10": 0.3551570419412752,
1979
+ "ndcg_exponential@1": 0.2436548223350254,
1980
+ "ndcg_exponential@5": 0.33378850914695807,
1981
+ "ndcg_exponential@10": 0.3551570419412752,
1982
+ "precision@1": 0.2436548223350254,
1983
+ "precision@5": 0.08324873096446701,
1984
+ "precision@10": 0.048223350253807105,
1985
+ "recall@1": 0.2436548223350254,
1986
+ "recall@5": 0.41624365482233505,
1987
+ "recall@10": 0.48223350253807107,
1988
+ "f1@1": 0.2436548223350254,
1989
+ "f1@5": 0.13874788494077836,
1990
+ "f1@10": 0.08767881864328564,
1991
+ "map@1": 0.2436548223350254,
1992
+ "map@5": 0.30654258319232935,
1993
+ "map@10": 0.31538353073886066,
1994
+ "mrr@1": 0.2436548223350254,
1995
+ "mrr@5": 0.30654258319232935,
1996
+ "mrr@10": 0.31538353073886066,
1997
+ "num_pred": 591,
1998
+ "num_data": 591
1999
+ },
2000
+ "VisRAG_SlideVQA": {
2001
+ "hit@1": 0.44964028776978415,
2002
+ "hit@5": 0.7086330935251799,
2003
+ "hit@10": 0.7859712230215827,
2004
+ "ndcg_linear@1": 0.44964028776978415,
2005
+ "ndcg_linear@5": 0.5648847466987875,
2006
+ "ndcg_linear@10": 0.5955590007686733,
2007
+ "ndcg_exponential@1": 0.44964028776978415,
2008
+ "ndcg_exponential@5": 0.5648847466987875,
2009
+ "ndcg_exponential@10": 0.5955590007686733,
2010
+ "precision@1": 0.44964028776978415,
2011
+ "precision@5": 0.1723021582733813,
2012
+ "precision@10": 0.09766187050359712,
2013
+ "recall@1": 0.36960431654676257,
2014
+ "recall@5": 0.6735611510791367,
2015
+ "recall@10": 0.7616906474820144,
2016
+ "f1@1": 0.3962829736211031,
2017
+ "f1@5": 0.2692702980472765,
2018
+ "f1@10": 0.17105406583823854,
2019
+ "map@1": 0.44964028776978415,
2020
+ "map@5": 0.5169964028776978,
2021
+ "map@10": 0.5313963115222108,
2022
+ "mrr@1": 0.44964028776978415,
2023
+ "mrr@5": 0.5481115107913669,
2024
+ "mrr@10": 0.5588072399223478,
2025
+ "num_pred": 556,
2026
+ "num_data": 556
2027
+ },
2028
+ "VisRAG_InfoVQA": {
2029
+ "hit@1": 0.4415041782729805,
2030
+ "hit@5": 0.6713091922005571,
2031
+ "hit@10": 0.754874651810585,
2032
+ "ndcg_linear@1": 0.4415041782729805,
2033
+ "ndcg_linear@5": 0.5633673128694291,
2034
+ "ndcg_linear@10": 0.5903761050947809,
2035
+ "ndcg_exponential@1": 0.4415041782729805,
2036
+ "ndcg_exponential@5": 0.5633673128694291,
2037
+ "ndcg_exponential@10": 0.5903761050947809,
2038
+ "precision@1": 0.4415041782729805,
2039
+ "precision@5": 0.13426183844011141,
2040
+ "precision@10": 0.07548746518105848,
2041
+ "recall@1": 0.4415041782729805,
2042
+ "recall@5": 0.6713091922005571,
2043
+ "recall@10": 0.754874651810585,
2044
+ "f1@1": 0.4415041782729805,
2045
+ "f1@5": 0.2237697307335191,
2046
+ "f1@10": 0.13724993669283364,
2047
+ "map@1": 0.4415041782729805,
2048
+ "map@5": 0.5274373259052925,
2049
+ "map@10": 0.5385661228279612,
2050
+ "mrr@1": 0.4415041782729805,
2051
+ "mrr@5": 0.5274373259052925,
2052
+ "mrr@10": 0.5385661228279612,
2053
+ "num_pred": 718,
2054
+ "num_data": 718
2055
+ },
2056
+ "VisRAG_PlotQA": {
2057
+ "hit@1": 0.2410196987253766,
2058
+ "hit@5": 0.4380069524913094,
2059
+ "hit@10": 0.5365005793742758,
2060
+ "ndcg_linear@1": 0.2410196987253766,
2061
+ "ndcg_linear@5": 0.3455373205552205,
2062
+ "ndcg_linear@10": 0.3774838122200841,
2063
+ "ndcg_exponential@1": 0.2410196987253766,
2064
+ "ndcg_exponential@5": 0.3455373205552205,
2065
+ "ndcg_exponential@10": 0.3774838122200841,
2066
+ "precision@1": 0.2410196987253766,
2067
+ "precision@5": 0.08760139049826188,
2068
+ "precision@10": 0.053650057937427574,
2069
+ "recall@1": 0.2410196987253766,
2070
+ "recall@5": 0.4380069524913094,
2071
+ "recall@10": 0.5365005793742758,
2072
+ "f1@1": 0.2410196987253766,
2073
+ "f1@5": 0.14600231749710316,
2074
+ "f1@10": 0.09754555988623198,
2075
+ "map@1": 0.2410196987253766,
2076
+ "map@5": 0.3148319814600232,
2077
+ "map@10": 0.32806792473652263,
2078
+ "mrr@1": 0.2410196987253766,
2079
+ "mrr@5": 0.3148319814600232,
2080
+ "mrr@10": 0.32806792473652263,
2081
+ "num_pred": 863,
2082
+ "num_data": 863
2083
+ },
2084
+ "ViDoSeek-page": {
2085
+ "hit@1": 0.040280210157618214,
2086
+ "hit@5": 0.18563922942206654,
2087
+ "hit@10": 0.287215411558669,
2088
+ "ndcg_linear@1": 0.040280210157618214,
2089
+ "ndcg_linear@5": 0.11294100510293231,
2090
+ "ndcg_linear@10": 0.14594536433240723,
2091
+ "ndcg_exponential@1": 0.040280210157618214,
2092
+ "ndcg_exponential@5": 0.11294100510293234,
2093
+ "ndcg_exponential@10": 0.14594536433240726,
2094
+ "precision@1": 0.040280210157618214,
2095
+ "precision@5": 0.03712784588441331,
2096
+ "precision@10": 0.028721541155866902,
2097
+ "recall@1": 0.040280210157618214,
2098
+ "recall@5": 0.18563922942206654,
2099
+ "recall@10": 0.287215411558669,
2100
+ "f1@1": 0.040280210157618214,
2101
+ "f1@5": 0.06187974314068886,
2102
+ "f1@10": 0.052220983919758,
2103
+ "map@1": 0.040280210157618214,
2104
+ "map@5": 0.08917104495037945,
2105
+ "map@10": 0.10288862480193478,
2106
+ "mrr@1": 0.040280210157618214,
2107
+ "mrr@5": 0.08917104495037945,
2108
+ "mrr@10": 0.10288862480193478,
2109
+ "num_pred": 1142,
2110
+ "num_data": 1142
2111
+ },
2112
+ "ViDoSeek-doc": {
2113
+ "hit@1": 0.4982486865148862,
2114
+ "hit@5": 0.6567425569176882,
2115
+ "hit@10": 0.7338003502626971,
2116
+ "ndcg_linear@1": 0.3429655575014594,
2117
+ "ndcg_linear@5": 0.3714170601904285,
2118
+ "ndcg_linear@10": 0.35019901577656104,
2119
+ "ndcg_exponential@1": 0.23204903677758318,
2120
+ "ndcg_exponential@5": 0.3146728814563305,
2121
+ "ndcg_exponential@10": 0.3162182310328309,
2122
+ "precision@1": 0.4982486865148862,
2123
+ "precision@5": 0.4001751313485114,
2124
+ "precision@10": 0.3430823117338004,
2125
+ "recall@1": 0.02844268284063671,
2126
+ "recall@5": 0.11354378337205699,
2127
+ "recall@10": 0.19116020046136178,
2128
+ "f1@1": 0.05349597259677307,
2129
+ "f1@5": 0.1736704243149188,
2130
+ "f1@10": 0.24068949848035567,
2131
+ "map@1": 0.4982486865148862,
2132
+ "map@5": 0.3603765323992995,
2133
+ "map@10": 0.2910387701490404,
2134
+ "mrr@1": 0.4982486865148862,
2135
+ "mrr@5": 0.5563776999416229,
2136
+ "mrr@10": 0.5669967753592973,
2137
+ "num_pred": 1142,
2138
+ "num_data": 1142
2139
+ },
2140
+ "MMLongBench-page": {
2141
+ "hit@1": 0.059665871121718374,
2142
+ "hit@5": 0.14797136038186157,
2143
+ "hit@10": 0.2159904534606205,
2144
+ "ndcg_linear@1": 0.059665871121718374,
2145
+ "ndcg_linear@5": 0.07951086728623444,
2146
+ "ndcg_linear@10": 0.09880430458699743,
2147
+ "ndcg_exponential@1": 0.059665871121718374,
2148
+ "ndcg_exponential@5": 0.07951086728623444,
2149
+ "ndcg_exponential@10": 0.09880430458699746,
2150
+ "precision@1": 0.059665871121718374,
2151
+ "precision@5": 0.03293556085918855,
2152
+ "precision@10": 0.0256563245823389,
2153
+ "recall@1": 0.038929139674963066,
2154
+ "recall@5": 0.10381908929044967,
2155
+ "recall@10": 0.15813207940296245,
2156
+ "f1@1": 0.04444323907331067,
2157
+ "f1@5": 0.04737172798031987,
2158
+ "f1@10": 0.042217267935243885,
2159
+ "map@1": 0.059665871121718374,
2160
+ "map@5": 0.06207769822328295,
2161
+ "map@10": 0.06994553516182395,
2162
+ "mrr@1": 0.059665871121718374,
2163
+ "mrr@5": 0.08904136833731105,
2164
+ "mrr@10": 0.09803860287153843,
2165
+ "num_pred": 838,
2166
+ "num_data": 838
2167
+ },
2168
+ "MMLongBench-doc": {
2169
+ "hit@1": 0.34725536992840095,
2170
+ "hit@5": 0.5238663484486874,
2171
+ "hit@10": 0.5883054892601431,
2172
+ "ndcg_linear@1": 0.24701670644391405,
2173
+ "ndcg_linear@5": 0.2758146276737757,
2174
+ "ndcg_linear@10": 0.2683418556525889,
2175
+ "ndcg_exponential@1": 0.17541766109785203,
2176
+ "ndcg_exponential@5": 0.2302031604572782,
2177
+ "ndcg_exponential@10": 0.23834477001816015,
2178
+ "precision@1": 0.34725536992840095,
2179
+ "precision@5": 0.31169451073985677,
2180
+ "precision@10": 0.27792362768496426,
2181
+ "recall@1": 0.011458219705852956,
2182
+ "recall@5": 0.0473748134486053,
2183
+ "recall@10": 0.08146579365576306,
2184
+ "f1@1": 0.021977357536621576,
2185
+ "f1@5": 0.0790594246656723,
2186
+ "f1@10": 0.11819035378881726,
2187
+ "map@1": 0.34725536992840095,
2188
+ "map@5": 0.2678878281622912,
2189
+ "map@10": 0.22411547713755348,
2190
+ "mrr@1": 0.34725536992840095,
2191
+ "mrr@5": 0.41585123309466987,
2192
+ "mrr@10": 0.4247144561882032,
2193
+ "num_pred": 838,
2194
+ "num_data": 838
2195
+ }
2196
+ }
2197
+ }
2198
+ }
experiments/public/all_scores/VLM2Vec-V2.0-Qwen2VL-2B.json ADDED
@@ -0,0 +1,2198 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "metadata": {
3
+ "model_name": "VLM2Vec-V2.0-Qwen2VL-2B",
4
+ "report_generated_date": "2025-06-28T08:54:17.882723"
5
+ },
6
+ "metrics": {
7
+ "image": {
8
+ "ImageNet-1K": {
9
+ "hit@1": 0.808,
10
+ "hit@5": 0.956,
11
+ "hit@10": 0.981,
12
+ "ndcg_linear@1": 0.808,
13
+ "ndcg_linear@5": 0.8917355668881671,
14
+ "ndcg_linear@10": 0.8996344961395271,
15
+ "ndcg_exponential@1": 0.808,
16
+ "ndcg_exponential@5": 0.8917355668881671,
17
+ "ndcg_exponential@10": 0.8996344961395271,
18
+ "precision@1": 0.808,
19
+ "precision@5": 0.19120000000000004,
20
+ "precision@10": 0.09810000000000002,
21
+ "recall@1": 0.808,
22
+ "recall@5": 0.956,
23
+ "recall@10": 0.981,
24
+ "f1@1": 0.808,
25
+ "f1@5": 0.3186666666666667,
26
+ "f1@10": 0.17836363636363634,
27
+ "map@1": 0.808,
28
+ "map@5": 0.8699166666666668,
29
+ "map@10": 0.8730702380952381,
30
+ "mrr@1": 0.808,
31
+ "mrr@5": 0.8699166666666668,
32
+ "mrr@10": 0.8730702380952381,
33
+ "num_pred": 1000,
34
+ "num_data": 1000
35
+ },
36
+ "N24News": {
37
+ "hit@1": 0.729,
38
+ "hit@5": 0.954,
39
+ "hit@10": 0.985,
40
+ "ndcg_linear@1": 0.729,
41
+ "ndcg_linear@5": 0.8542486272909989,
42
+ "ndcg_linear@10": 0.8643817096780151,
43
+ "ndcg_exponential@1": 0.729,
44
+ "ndcg_exponential@5": 0.8542486272909989,
45
+ "ndcg_exponential@10": 0.8643817096780151,
46
+ "precision@1": 0.729,
47
+ "precision@5": 0.19080000000000003,
48
+ "precision@10": 0.09850000000000003,
49
+ "recall@1": 0.729,
50
+ "recall@5": 0.954,
51
+ "recall@10": 0.985,
52
+ "f1@1": 0.729,
53
+ "f1@5": 0.318,
54
+ "f1@10": 0.17909090909090908,
55
+ "map@1": 0.729,
56
+ "map@5": 0.82055,
57
+ "map@10": 0.8247988095238095,
58
+ "mrr@1": 0.729,
59
+ "mrr@5": 0.82055,
60
+ "mrr@10": 0.8247988095238095,
61
+ "num_pred": 1000,
62
+ "num_data": 1000
63
+ },
64
+ "HatefulMemes": {
65
+ "hit@1": 0.563,
66
+ "hit@5": 1.0,
67
+ "hit@10": 1.0,
68
+ "ndcg_linear@1": 0.563,
69
+ "ndcg_linear@5": 0.8387163023107271,
70
+ "ndcg_linear@10": 0.8387163023107271,
71
+ "ndcg_exponential@1": 0.563,
72
+ "ndcg_exponential@5": 0.8387163023107271,
73
+ "ndcg_exponential@10": 0.8387163023107271,
74
+ "precision@1": 0.563,
75
+ "precision@5": 0.20000000000000004,
76
+ "precision@10": 0.10000000000000002,
77
+ "recall@1": 0.563,
78
+ "recall@5": 1.0,
79
+ "recall@10": 1.0,
80
+ "f1@1": 0.563,
81
+ "f1@5": 0.3333333333333333,
82
+ "f1@10": 0.18181818181818182,
83
+ "map@1": 0.563,
84
+ "map@5": 0.7815,
85
+ "map@10": 0.7815,
86
+ "mrr@1": 0.563,
87
+ "mrr@5": 0.7815,
88
+ "mrr@10": 0.7815,
89
+ "num_pred": 1000,
90
+ "num_data": 1000
91
+ },
92
+ "VOC2007": {
93
+ "hit@1": 0.85,
94
+ "hit@5": 0.975,
95
+ "hit@10": 0.988,
96
+ "ndcg_linear@1": 0.85,
97
+ "ndcg_linear@5": 0.920705885295906,
98
+ "ndcg_linear@10": 0.9248925595376308,
99
+ "ndcg_exponential@1": 0.85,
100
+ "ndcg_exponential@5": 0.920705885295906,
101
+ "ndcg_exponential@10": 0.9248925595376308,
102
+ "precision@1": 0.85,
103
+ "precision@5": 0.19500000000000006,
104
+ "precision@10": 0.09880000000000001,
105
+ "recall@1": 0.85,
106
+ "recall@5": 0.975,
107
+ "recall@10": 0.988,
108
+ "f1@1": 0.85,
109
+ "f1@5": 0.325,
110
+ "f1@10": 0.17963636363636362,
111
+ "map@1": 0.85,
112
+ "map@5": 0.9022666666666667,
113
+ "map@10": 0.9039853174603174,
114
+ "mrr@1": 0.85,
115
+ "mrr@5": 0.9022666666666667,
116
+ "mrr@10": 0.9039853174603174,
117
+ "num_pred": 1000,
118
+ "num_data": 1000
119
+ },
120
+ "SUN397": {
121
+ "hit@1": 0.71,
122
+ "hit@5": 0.93,
123
+ "hit@10": 0.957,
124
+ "ndcg_linear@1": 0.71,
125
+ "ndcg_linear@5": 0.8327114376725517,
126
+ "ndcg_linear@10": 0.841469031189054,
127
+ "ndcg_exponential@1": 0.71,
128
+ "ndcg_exponential@5": 0.8327114376725517,
129
+ "ndcg_exponential@10": 0.841469031189054,
130
+ "precision@1": 0.71,
131
+ "precision@5": 0.186,
132
+ "precision@10": 0.09570000000000002,
133
+ "recall@1": 0.71,
134
+ "recall@5": 0.93,
135
+ "recall@10": 0.957,
136
+ "f1@1": 0.71,
137
+ "f1@5": 0.31,
138
+ "f1@10": 0.174,
139
+ "map@1": 0.71,
140
+ "map@5": 0.7998666666666666,
141
+ "map@10": 0.803498015873016,
142
+ "mrr@1": 0.71,
143
+ "mrr@5": 0.7998666666666666,
144
+ "mrr@10": 0.803498015873016,
145
+ "num_pred": 1000,
146
+ "num_data": 1000
147
+ },
148
+ "Place365": {
149
+ "hit@1": 0.359,
150
+ "hit@5": 0.636,
151
+ "hit@10": 0.728,
152
+ "ndcg_linear@1": 0.359,
153
+ "ndcg_linear@5": 0.5085200093794449,
154
+ "ndcg_linear@10": 0.5380972787675244,
155
+ "ndcg_exponential@1": 0.359,
156
+ "ndcg_exponential@5": 0.5085200093794449,
157
+ "ndcg_exponential@10": 0.5380972787675244,
158
+ "precision@1": 0.359,
159
+ "precision@5": 0.12719999999999998,
160
+ "precision@10": 0.0728,
161
+ "recall@1": 0.359,
162
+ "recall@5": 0.636,
163
+ "recall@10": 0.728,
164
+ "f1@1": 0.359,
165
+ "f1@5": 0.21200000000000005,
166
+ "f1@10": 0.13236363636363638,
167
+ "map@1": 0.359,
168
+ "map@5": 0.4659,
169
+ "map@10": 0.478006746031746,
170
+ "mrr@1": 0.359,
171
+ "mrr@5": 0.4659,
172
+ "mrr@10": 0.478006746031746,
173
+ "num_pred": 1000,
174
+ "num_data": 1000
175
+ },
176
+ "ImageNet-A": {
177
+ "hit@1": 0.474,
178
+ "hit@5": 0.706,
179
+ "hit@10": 0.787,
180
+ "ndcg_linear@1": 0.474,
181
+ "ndcg_linear@5": 0.5955931729705578,
182
+ "ndcg_linear@10": 0.6222176191859202,
183
+ "ndcg_exponential@1": 0.474,
184
+ "ndcg_exponential@5": 0.5955931729705578,
185
+ "ndcg_exponential@10": 0.6222176191859202,
186
+ "precision@1": 0.474,
187
+ "precision@5": 0.1412,
188
+ "precision@10": 0.07869999999999999,
189
+ "recall@1": 0.474,
190
+ "recall@5": 0.706,
191
+ "recall@10": 0.787,
192
+ "f1@1": 0.474,
193
+ "f1@5": 0.23533333333333337,
194
+ "f1@10": 0.1430909090909091,
195
+ "map@1": 0.474,
196
+ "map@5": 0.559,
197
+ "map@10": 0.5702273809523809,
198
+ "mrr@1": 0.474,
199
+ "mrr@5": 0.559,
200
+ "mrr@10": 0.5702273809523809,
201
+ "num_pred": 1000,
202
+ "num_data": 1000
203
+ },
204
+ "ImageNet-R": {
205
+ "hit@1": 0.893,
206
+ "hit@5": 0.968,
207
+ "hit@10": 0.98,
208
+ "ndcg_linear@1": 0.893,
209
+ "ndcg_linear@5": 0.9354717686069736,
210
+ "ndcg_linear@10": 0.939360041159753,
211
+ "ndcg_exponential@1": 0.893,
212
+ "ndcg_exponential@5": 0.9354717686069736,
213
+ "ndcg_exponential@10": 0.939360041159753,
214
+ "precision@1": 0.893,
215
+ "precision@5": 0.19360000000000002,
216
+ "precision@10": 0.098,
217
+ "recall@1": 0.893,
218
+ "recall@5": 0.968,
219
+ "recall@10": 0.98,
220
+ "f1@1": 0.893,
221
+ "f1@5": 0.3226666666666666,
222
+ "f1@10": 0.17818181818181816,
223
+ "map@1": 0.893,
224
+ "map@5": 0.9244166666666668,
225
+ "map@10": 0.9260246031746031,
226
+ "mrr@1": 0.893,
227
+ "mrr@5": 0.9244166666666668,
228
+ "mrr@10": 0.9260246031746031,
229
+ "num_pred": 1000,
230
+ "num_data": 1000
231
+ },
232
+ "ObjectNet": {
233
+ "hit@1": 0.652,
234
+ "hit@5": 0.861,
235
+ "hit@10": 0.9,
236
+ "ndcg_linear@1": 0.652,
237
+ "ndcg_linear@5": 0.7682237991543275,
238
+ "ndcg_linear@10": 0.7806771789358414,
239
+ "ndcg_exponential@1": 0.652,
240
+ "ndcg_exponential@5": 0.7682237991543275,
241
+ "ndcg_exponential@10": 0.7806771789358414,
242
+ "precision@1": 0.652,
243
+ "precision@5": 0.1722,
244
+ "precision@10": 0.09000000000000001,
245
+ "recall@1": 0.652,
246
+ "recall@5": 0.861,
247
+ "recall@10": 0.9,
248
+ "f1@1": 0.652,
249
+ "f1@5": 0.287,
250
+ "f1@10": 0.16363636363636364,
251
+ "map@1": 0.652,
252
+ "map@5": 0.7369,
253
+ "map@10": 0.7419404761904761,
254
+ "mrr@1": 0.652,
255
+ "mrr@5": 0.7369,
256
+ "mrr@10": 0.7419404761904761,
257
+ "num_pred": 1000,
258
+ "num_data": 1000
259
+ },
260
+ "Country211": {
261
+ "hit@1": 0.252,
262
+ "hit@5": 0.442,
263
+ "hit@10": 0.531,
264
+ "ndcg_linear@1": 0.252,
265
+ "ndcg_linear@5": 0.35154694867048564,
266
+ "ndcg_linear@10": 0.3803077107107121,
267
+ "ndcg_exponential@1": 0.252,
268
+ "ndcg_exponential@5": 0.35154694867048564,
269
+ "ndcg_exponential@10": 0.3803077107107121,
270
+ "precision@1": 0.252,
271
+ "precision@5": 0.0884,
272
+ "precision@10": 0.053099999999999994,
273
+ "recall@1": 0.252,
274
+ "recall@5": 0.442,
275
+ "recall@10": 0.531,
276
+ "f1@1": 0.252,
277
+ "f1@5": 0.14733333333333337,
278
+ "f1@10": 0.09654545454545456,
279
+ "map@1": 0.252,
280
+ "map@5": 0.32154999999999995,
281
+ "map@10": 0.33340992063492064,
282
+ "mrr@1": 0.252,
283
+ "mrr@5": 0.32154999999999995,
284
+ "mrr@10": 0.33340992063492064,
285
+ "num_pred": 1000,
286
+ "num_data": 1000
287
+ },
288
+ "OK-VQA": {
289
+ "hit@1": 0.515,
290
+ "hit@5": 0.777,
291
+ "hit@10": 0.844,
292
+ "ndcg_linear@1": 0.515,
293
+ "ndcg_linear@5": 0.6561916901050675,
294
+ "ndcg_linear@10": 0.6779083028403337,
295
+ "ndcg_exponential@1": 0.515,
296
+ "ndcg_exponential@5": 0.6561916901050675,
297
+ "ndcg_exponential@10": 0.6779083028403337,
298
+ "precision@1": 0.515,
299
+ "precision@5": 0.15539999999999998,
300
+ "precision@10": 0.0844,
301
+ "recall@1": 0.515,
302
+ "recall@5": 0.777,
303
+ "recall@10": 0.844,
304
+ "f1@1": 0.515,
305
+ "f1@5": 0.259,
306
+ "f1@10": 0.15345454545454545,
307
+ "map@1": 0.515,
308
+ "map@5": 0.6158166666666667,
309
+ "map@10": 0.6248087301587302,
310
+ "mrr@1": 0.515,
311
+ "mrr@5": 0.6158166666666667,
312
+ "mrr@10": 0.6248087301587302,
313
+ "num_pred": 1000,
314
+ "num_data": 1000
315
+ },
316
+ "A-OKVQA": {
317
+ "hit@1": 0.436,
318
+ "hit@5": 0.727,
319
+ "hit@10": 0.799,
320
+ "ndcg_linear@1": 0.436,
321
+ "ndcg_linear@5": 0.5940223844793209,
322
+ "ndcg_linear@10": 0.6174487179188798,
323
+ "ndcg_exponential@1": 0.436,
324
+ "ndcg_exponential@5": 0.5940223844793209,
325
+ "ndcg_exponential@10": 0.6174487179188798,
326
+ "precision@1": 0.436,
327
+ "precision@5": 0.14539999999999997,
328
+ "precision@10": 0.0799,
329
+ "recall@1": 0.436,
330
+ "recall@5": 0.727,
331
+ "recall@10": 0.799,
332
+ "f1@1": 0.436,
333
+ "f1@5": 0.24233333333333337,
334
+ "f1@10": 0.14527272727272728,
335
+ "map@1": 0.436,
336
+ "map@5": 0.5494666666666667,
337
+ "map@10": 0.559218253968254,
338
+ "mrr@1": 0.436,
339
+ "mrr@5": 0.5494666666666667,
340
+ "mrr@10": 0.559218253968254,
341
+ "num_pred": 1000,
342
+ "num_data": 1000
343
+ },
344
+ "DocVQA": {
345
+ "hit@1": 0.901,
346
+ "hit@5": 0.97,
347
+ "hit@10": 0.98,
348
+ "ndcg_linear@1": 0.901,
349
+ "ndcg_linear@5": 0.9408983161880025,
350
+ "ndcg_linear@10": 0.9442465730917498,
351
+ "ndcg_exponential@1": 0.901,
352
+ "ndcg_exponential@5": 0.9408983161880025,
353
+ "ndcg_exponential@10": 0.9442465730917498,
354
+ "precision@1": 0.901,
355
+ "precision@5": 0.19400000000000003,
356
+ "precision@10": 0.09800000000000002,
357
+ "recall@1": 0.901,
358
+ "recall@5": 0.97,
359
+ "recall@10": 0.98,
360
+ "f1@1": 0.901,
361
+ "f1@5": 0.32333333333333336,
362
+ "f1@10": 0.17818181818181816,
363
+ "map@1": 0.901,
364
+ "map@5": 0.9309333333333333,
365
+ "map@10": 0.9323825396825398,
366
+ "mrr@1": 0.901,
367
+ "mrr@5": 0.9309333333333333,
368
+ "mrr@10": 0.9323825396825398,
369
+ "num_pred": 1000,
370
+ "num_data": 1000
371
+ },
372
+ "InfographicsVQA": {
373
+ "hit@1": 0.588,
374
+ "hit@5": 0.811,
375
+ "hit@10": 0.869,
376
+ "ndcg_linear@1": 0.588,
377
+ "ndcg_linear@5": 0.7072011349880222,
378
+ "ndcg_linear@10": 0.7260241531938669,
379
+ "ndcg_exponential@1": 0.588,
380
+ "ndcg_exponential@5": 0.7072011349880222,
381
+ "ndcg_exponential@10": 0.7260241531938669,
382
+ "precision@1": 0.588,
383
+ "precision@5": 0.16219999999999998,
384
+ "precision@10": 0.0869,
385
+ "recall@1": 0.588,
386
+ "recall@5": 0.811,
387
+ "recall@10": 0.869,
388
+ "f1@1": 0.588,
389
+ "f1@5": 0.27033333333333337,
390
+ "f1@10": 0.158,
391
+ "map@1": 0.588,
392
+ "map@5": 0.6726333333333334,
393
+ "map@10": 0.680443253968254,
394
+ "mrr@1": 0.588,
395
+ "mrr@5": 0.6726333333333334,
396
+ "mrr@10": 0.680443253968254,
397
+ "num_pred": 1000,
398
+ "num_data": 1000
399
+ },
400
+ "ChartQA": {
401
+ "hit@1": 0.474,
402
+ "hit@5": 0.676,
403
+ "hit@10": 0.753,
404
+ "ndcg_linear@1": 0.474,
405
+ "ndcg_linear@5": 0.5825057091236183,
406
+ "ndcg_linear@10": 0.607378542448543,
407
+ "ndcg_exponential@1": 0.474,
408
+ "ndcg_exponential@5": 0.5825057091236183,
409
+ "ndcg_exponential@10": 0.607378542448543,
410
+ "precision@1": 0.474,
411
+ "precision@5": 0.1352,
412
+ "precision@10": 0.0753,
413
+ "recall@1": 0.474,
414
+ "recall@5": 0.676,
415
+ "recall@10": 0.753,
416
+ "f1@1": 0.474,
417
+ "f1@5": 0.22533333333333336,
418
+ "f1@10": 0.1369090909090909,
419
+ "map@1": 0.474,
420
+ "map@5": 0.5513666666666666,
421
+ "map@10": 0.5616107142857143,
422
+ "mrr@1": 0.474,
423
+ "mrr@5": 0.5513666666666666,
424
+ "mrr@10": 0.5616107142857143,
425
+ "num_pred": 1000,
426
+ "num_data": 1000
427
+ },
428
+ "Visual7W": {
429
+ "hit@1": 0.529,
430
+ "hit@5": 0.877,
431
+ "hit@10": 0.953,
432
+ "ndcg_linear@1": 0.529,
433
+ "ndcg_linear@5": 0.7205350870379457,
434
+ "ndcg_linear@10": 0.7455710489687404,
435
+ "ndcg_exponential@1": 0.529,
436
+ "ndcg_exponential@5": 0.7205350870379457,
437
+ "ndcg_exponential@10": 0.7455710489687404,
438
+ "precision@1": 0.529,
439
+ "precision@5": 0.1754,
440
+ "precision@10": 0.09530000000000001,
441
+ "recall@1": 0.529,
442
+ "recall@5": 0.877,
443
+ "recall@10": 0.953,
444
+ "f1@1": 0.529,
445
+ "f1@5": 0.2923333333333334,
446
+ "f1@10": 0.17327272727272724,
447
+ "map@1": 0.529,
448
+ "map@5": 0.6679166666666665,
449
+ "map@10": 0.6785115079365078,
450
+ "mrr@1": 0.529,
451
+ "mrr@5": 0.6679166666666665,
452
+ "mrr@10": 0.6785115079365078,
453
+ "num_pred": 1000,
454
+ "num_data": 1000
455
+ },
456
+ "ScienceQA": {
457
+ "hit@1": 0.382,
458
+ "hit@5": 0.662,
459
+ "hit@10": 0.771,
460
+ "ndcg_linear@1": 0.382,
461
+ "ndcg_linear@5": 0.5275673656588401,
462
+ "ndcg_linear@10": 0.5626365394128282,
463
+ "ndcg_exponential@1": 0.382,
464
+ "ndcg_exponential@5": 0.5275673656588401,
465
+ "ndcg_exponential@10": 0.5626365394128282,
466
+ "precision@1": 0.382,
467
+ "precision@5": 0.1324,
468
+ "precision@10": 0.07709999999999999,
469
+ "recall@1": 0.382,
470
+ "recall@5": 0.662,
471
+ "recall@10": 0.771,
472
+ "f1@1": 0.382,
473
+ "f1@5": 0.2206666666666667,
474
+ "f1@10": 0.14018181818181819,
475
+ "map@1": 0.382,
476
+ "map@5": 0.4832666666666667,
477
+ "map@10": 0.49763412698412696,
478
+ "mrr@1": 0.382,
479
+ "mrr@5": 0.4832666666666667,
480
+ "mrr@10": 0.49763412698412696,
481
+ "num_pred": 1000,
482
+ "num_data": 1000
483
+ },
484
+ "VizWiz": {
485
+ "hit@1": 0.433,
486
+ "hit@5": 0.61,
487
+ "hit@10": 0.671,
488
+ "ndcg_linear@1": 0.433,
489
+ "ndcg_linear@5": 0.5297118471987433,
490
+ "ndcg_linear@10": 0.5497377057138165,
491
+ "ndcg_exponential@1": 0.433,
492
+ "ndcg_exponential@5": 0.5297118471987433,
493
+ "ndcg_exponential@10": 0.5497377057138165,
494
+ "precision@1": 0.433,
495
+ "precision@5": 0.12199999999999997,
496
+ "precision@10": 0.06709999999999999,
497
+ "recall@1": 0.433,
498
+ "recall@5": 0.61,
499
+ "recall@10": 0.671,
500
+ "f1@1": 0.433,
501
+ "f1@5": 0.20333333333333337,
502
+ "f1@10": 0.12200000000000003,
503
+ "map@1": 0.433,
504
+ "map@5": 0.5027333333333334,
505
+ "map@10": 0.5111761904761905,
506
+ "mrr@1": 0.433,
507
+ "mrr@5": 0.5027333333333334,
508
+ "mrr@10": 0.5111761904761905,
509
+ "num_pred": 1000,
510
+ "num_data": 1000
511
+ },
512
+ "GQA": {
513
+ "hit@1": 0.649,
514
+ "hit@5": 0.886,
515
+ "hit@10": 0.927,
516
+ "ndcg_linear@1": 0.649,
517
+ "ndcg_linear@5": 0.7797599318993801,
518
+ "ndcg_linear@10": 0.7931564189677488,
519
+ "ndcg_exponential@1": 0.649,
520
+ "ndcg_exponential@5": 0.7797599318993801,
521
+ "ndcg_exponential@10": 0.7931564189677488,
522
+ "precision@1": 0.649,
523
+ "precision@5": 0.17720000000000005,
524
+ "precision@10": 0.09270000000000002,
525
+ "recall@1": 0.649,
526
+ "recall@5": 0.886,
527
+ "recall@10": 0.927,
528
+ "f1@1": 0.649,
529
+ "f1@5": 0.2953333333333334,
530
+ "f1@10": 0.16854545454545455,
531
+ "map@1": 0.649,
532
+ "map@5": 0.7439666666666667,
533
+ "map@10": 0.7495777777777778,
534
+ "mrr@1": 0.649,
535
+ "mrr@5": 0.7439666666666667,
536
+ "mrr@10": 0.7495777777777778,
537
+ "num_pred": 1000,
538
+ "num_data": 1000
539
+ },
540
+ "TextVQA": {
541
+ "hit@1": 0.722,
542
+ "hit@5": 0.833,
543
+ "hit@10": 0.863,
544
+ "ndcg_linear@1": 0.722,
545
+ "ndcg_linear@5": 0.7819030121133494,
546
+ "ndcg_linear@10": 0.7918381023735301,
547
+ "ndcg_exponential@1": 0.722,
548
+ "ndcg_exponential@5": 0.7819030121133494,
549
+ "ndcg_exponential@10": 0.7918381023735301,
550
+ "precision@1": 0.722,
551
+ "precision@5": 0.16660000000000003,
552
+ "precision@10": 0.08630000000000002,
553
+ "recall@1": 0.722,
554
+ "recall@5": 0.833,
555
+ "recall@10": 0.863,
556
+ "f1@1": 0.722,
557
+ "f1@5": 0.2776666666666667,
558
+ "f1@10": 0.15690909090909091,
559
+ "map@1": 0.722,
560
+ "map@5": 0.7648166666666666,
561
+ "map@10": 0.7690543650793651,
562
+ "mrr@1": 0.722,
563
+ "mrr@5": 0.7648166666666666,
564
+ "mrr@10": 0.7690543650793651,
565
+ "num_pred": 1000,
566
+ "num_data": 1000
567
+ },
568
+ "VisDial": {
569
+ "hit@1": 0.827,
570
+ "hit@5": 0.968,
571
+ "hit@10": 0.986,
572
+ "ndcg_linear@1": 0.827,
573
+ "ndcg_linear@5": 0.9045672377369148,
574
+ "ndcg_linear@10": 0.9104807612339774,
575
+ "ndcg_exponential@1": 0.827,
576
+ "ndcg_exponential@5": 0.9045672377369148,
577
+ "ndcg_exponential@10": 0.9104807612339774,
578
+ "precision@1": 0.827,
579
+ "precision@5": 0.19360000000000002,
580
+ "precision@10": 0.09860000000000002,
581
+ "recall@1": 0.827,
582
+ "recall@5": 0.968,
583
+ "recall@10": 0.986,
584
+ "f1@1": 0.827,
585
+ "f1@5": 0.3226666666666667,
586
+ "f1@10": 0.17927272727272725,
587
+ "map@1": 0.827,
588
+ "map@5": 0.88325,
589
+ "map@10": 0.8857444444444444,
590
+ "mrr@1": 0.827,
591
+ "mrr@5": 0.88325,
592
+ "mrr@10": 0.8857444444444444,
593
+ "num_pred": 1000,
594
+ "num_data": 1000
595
+ },
596
+ "CIRR": {
597
+ "hit@1": 0.575,
598
+ "hit@5": 0.899,
599
+ "hit@10": 0.953,
600
+ "ndcg_linear@1": 0.575,
601
+ "ndcg_linear@5": 0.7551683396424022,
602
+ "ndcg_linear@10": 0.7727898661723096,
603
+ "ndcg_exponential@1": 0.575,
604
+ "ndcg_exponential@5": 0.7551683396424022,
605
+ "ndcg_exponential@10": 0.7727898661723096,
606
+ "precision@1": 0.575,
607
+ "precision@5": 0.17980000000000002,
608
+ "precision@10": 0.09530000000000001,
609
+ "recall@1": 0.575,
610
+ "recall@5": 0.899,
611
+ "recall@10": 0.953,
612
+ "f1@1": 0.575,
613
+ "f1@5": 0.2996666666666667,
614
+ "f1@10": 0.17327272727272727,
615
+ "map@1": 0.575,
616
+ "map@5": 0.7066166666666667,
617
+ "map@10": 0.7139825396825397,
618
+ "mrr@1": 0.575,
619
+ "mrr@5": 0.7066166666666667,
620
+ "mrr@10": 0.7139825396825397,
621
+ "num_pred": 1000,
622
+ "num_data": 1000
623
+ },
624
+ "VisualNews_t2i": {
625
+ "hit@1": 0.745,
626
+ "hit@5": 0.895,
627
+ "hit@10": 0.928,
628
+ "ndcg_linear@1": 0.745,
629
+ "ndcg_linear@5": 0.8286638944708601,
630
+ "ndcg_linear@10": 0.8393509120511464,
631
+ "ndcg_exponential@1": 0.745,
632
+ "ndcg_exponential@5": 0.8286638944708601,
633
+ "ndcg_exponential@10": 0.8393509120511464,
634
+ "precision@1": 0.745,
635
+ "precision@5": 0.17900000000000002,
636
+ "precision@10": 0.09280000000000001,
637
+ "recall@1": 0.745,
638
+ "recall@5": 0.895,
639
+ "recall@10": 0.928,
640
+ "f1@1": 0.745,
641
+ "f1@5": 0.2983333333333334,
642
+ "f1@10": 0.1687272727272727,
643
+ "map@1": 0.745,
644
+ "map@5": 0.8062833333333334,
645
+ "map@10": 0.8107011904761905,
646
+ "mrr@1": 0.745,
647
+ "mrr@5": 0.8062833333333334,
648
+ "mrr@10": 0.8107011904761905,
649
+ "num_pred": 1000,
650
+ "num_data": 1000
651
+ },
652
+ "VisualNews_i2t": {
653
+ "hit@1": 0.782,
654
+ "hit@5": 0.906,
655
+ "hit@10": 0.935,
656
+ "ndcg_linear@1": 0.782,
657
+ "ndcg_linear@5": 0.8486488958609838,
658
+ "ndcg_linear@10": 0.8583163159480872,
659
+ "ndcg_exponential@1": 0.782,
660
+ "ndcg_exponential@5": 0.8486488958609838,
661
+ "ndcg_exponential@10": 0.8583163159480872,
662
+ "precision@1": 0.782,
663
+ "precision@5": 0.18120000000000003,
664
+ "precision@10": 0.09350000000000001,
665
+ "recall@1": 0.782,
666
+ "recall@5": 0.906,
667
+ "recall@10": 0.935,
668
+ "f1@1": 0.782,
669
+ "f1@5": 0.302,
670
+ "f1@10": 0.17,
671
+ "map@1": 0.782,
672
+ "map@5": 0.8295,
673
+ "map@10": 0.833656746031746,
674
+ "mrr@1": 0.782,
675
+ "mrr@5": 0.8295,
676
+ "mrr@10": 0.833656746031746,
677
+ "num_pred": 1000,
678
+ "num_data": 1000
679
+ },
680
+ "MSCOCO_t2i": {
681
+ "hit@1": 0.753,
682
+ "hit@5": 0.949,
683
+ "hit@10": 0.981,
684
+ "ndcg_linear@1": 0.753,
685
+ "ndcg_linear@5": 0.8611598177428067,
686
+ "ndcg_linear@10": 0.8714056173186473,
687
+ "ndcg_exponential@1": 0.753,
688
+ "ndcg_exponential@5": 0.8611598177428067,
689
+ "ndcg_exponential@10": 0.8714056173186473,
690
+ "precision@1": 0.753,
691
+ "precision@5": 0.18980000000000002,
692
+ "precision@10": 0.0981,
693
+ "recall@1": 0.753,
694
+ "recall@5": 0.949,
695
+ "recall@10": 0.981,
696
+ "f1@1": 0.753,
697
+ "f1@5": 0.3163333333333333,
698
+ "f1@10": 0.1783636363636363,
699
+ "map@1": 0.753,
700
+ "map@5": 0.8315833333333333,
701
+ "map@10": 0.83575,
702
+ "mrr@1": 0.753,
703
+ "mrr@5": 0.8315833333333333,
704
+ "mrr@10": 0.83575,
705
+ "num_pred": 1000,
706
+ "num_data": 1000
707
+ },
708
+ "MSCOCO_i2t": {
709
+ "hit@1": 0.714,
710
+ "hit@5": 0.94,
711
+ "hit@10": 0.987,
712
+ "ndcg_linear@1": 0.714,
713
+ "ndcg_linear@5": 0.8382480589924204,
714
+ "ndcg_linear@10": 0.8536803755951516,
715
+ "ndcg_exponential@1": 0.714,
716
+ "ndcg_exponential@5": 0.8382480589924204,
717
+ "ndcg_exponential@10": 0.8536803755951516,
718
+ "precision@1": 0.714,
719
+ "precision@5": 0.18800000000000003,
720
+ "precision@10": 0.09870000000000002,
721
+ "recall@1": 0.714,
722
+ "recall@5": 0.94,
723
+ "recall@10": 0.987,
724
+ "f1@1": 0.714,
725
+ "f1@5": 0.31333333333333335,
726
+ "f1@10": 0.17945454545454545,
727
+ "map@1": 0.714,
728
+ "map@5": 0.8040333333333333,
729
+ "map@10": 0.8105345238095237,
730
+ "mrr@1": 0.714,
731
+ "mrr@5": 0.8040333333333333,
732
+ "mrr@10": 0.8105345238095237,
733
+ "num_pred": 1000,
734
+ "num_data": 1000
735
+ },
736
+ "NIGHTS": {
737
+ "hit@1": 0.686,
738
+ "hit@5": 0.98,
739
+ "hit@10": 0.996,
740
+ "ndcg_linear@1": 0.686,
741
+ "ndcg_linear@5": 0.8539747226047097,
742
+ "ndcg_linear@10": 0.8594110413481301,
743
+ "ndcg_exponential@1": 0.686,
744
+ "ndcg_exponential@5": 0.8539747226047097,
745
+ "ndcg_exponential@10": 0.8594110413481301,
746
+ "precision@1": 0.686,
747
+ "precision@5": 0.196,
748
+ "precision@10": 0.09960000000000002,
749
+ "recall@1": 0.686,
750
+ "recall@5": 0.98,
751
+ "recall@10": 0.996,
752
+ "f1@1": 0.686,
753
+ "f1@5": 0.3266666666666666,
754
+ "f1@10": 0.18109090909090905,
755
+ "map@1": 0.686,
756
+ "map@5": 0.81095,
757
+ "map@10": 0.813347619047619,
758
+ "mrr@1": 0.686,
759
+ "mrr@5": 0.81095,
760
+ "mrr@10": 0.813347619047619,
761
+ "num_pred": 1000,
762
+ "num_data": 1000
763
+ },
764
+ "WebQA": {
765
+ "hit@1": 0.906,
766
+ "hit@5": 0.988,
767
+ "hit@10": 0.993,
768
+ "ndcg_linear@1": 0.906,
769
+ "ndcg_linear@5": 0.953453471346856,
770
+ "ndcg_linear@10": 0.9551658857210721,
771
+ "ndcg_exponential@1": 0.906,
772
+ "ndcg_exponential@5": 0.953453471346856,
773
+ "ndcg_exponential@10": 0.9551658857210721,
774
+ "precision@1": 0.906,
775
+ "precision@5": 0.19760000000000003,
776
+ "precision@10": 0.09930000000000001,
777
+ "recall@1": 0.906,
778
+ "recall@5": 0.988,
779
+ "recall@10": 0.993,
780
+ "f1@1": 0.906,
781
+ "f1@5": 0.3293333333333333,
782
+ "f1@10": 0.18054545454545454,
783
+ "map@1": 0.906,
784
+ "map@5": 0.9415999999999999,
785
+ "map@10": 0.9423619047619047,
786
+ "mrr@1": 0.906,
787
+ "mrr@5": 0.9415999999999999,
788
+ "mrr@10": 0.9423619047619047,
789
+ "num_pred": 1000,
790
+ "num_data": 1000
791
+ },
792
+ "FashionIQ": {
793
+ "hit@1": 0.195,
794
+ "hit@5": 0.434,
795
+ "hit@10": 0.567,
796
+ "ndcg_linear@1": 0.195,
797
+ "ndcg_linear@5": 0.3199008192098037,
798
+ "ndcg_linear@10": 0.36332550239850325,
799
+ "ndcg_exponential@1": 0.195,
800
+ "ndcg_exponential@5": 0.3199008192098037,
801
+ "ndcg_exponential@10": 0.36332550239850325,
802
+ "precision@1": 0.195,
803
+ "precision@5": 0.08680000000000002,
804
+ "precision@10": 0.05669999999999999,
805
+ "recall@1": 0.195,
806
+ "recall@5": 0.434,
807
+ "recall@10": 0.567,
808
+ "f1@1": 0.195,
809
+ "f1@5": 0.1446666666666667,
810
+ "f1@10": 0.10309090909090911,
811
+ "map@1": 0.195,
812
+ "map@5": 0.28218333333333334,
813
+ "map@10": 0.3003369047619047,
814
+ "mrr@1": 0.195,
815
+ "mrr@5": 0.28218333333333334,
816
+ "mrr@10": 0.3003369047619047,
817
+ "num_pred": 1000,
818
+ "num_data": 1000
819
+ },
820
+ "Wiki-SS-NQ": {
821
+ "hit@1": 0.669,
822
+ "hit@5": 0.88,
823
+ "hit@10": 0.921,
824
+ "ndcg_linear@1": 0.669,
825
+ "ndcg_linear@5": 0.787070983987401,
826
+ "ndcg_linear@10": 0.8003663875618333,
827
+ "ndcg_exponential@1": 0.669,
828
+ "ndcg_exponential@5": 0.787070983987401,
829
+ "ndcg_exponential@10": 0.8003663875618333,
830
+ "precision@1": 0.669,
831
+ "precision@5": 0.176,
832
+ "precision@10": 0.09210000000000002,
833
+ "recall@1": 0.669,
834
+ "recall@5": 0.88,
835
+ "recall@10": 0.921,
836
+ "f1@1": 0.669,
837
+ "f1@5": 0.2933333333333334,
838
+ "f1@10": 0.16745454545454547,
839
+ "map@1": 0.669,
840
+ "map@5": 0.7556499999999999,
841
+ "map@10": 0.7611603174603174,
842
+ "mrr@1": 0.669,
843
+ "mrr@5": 0.7556499999999999,
844
+ "mrr@10": 0.7611603174603174,
845
+ "num_pred": 1000,
846
+ "num_data": 1000
847
+ },
848
+ "OVEN": {
849
+ "hit@1": 0.643,
850
+ "hit@5": 0.851,
851
+ "hit@10": 0.907,
852
+ "ndcg_linear@1": 0.643,
853
+ "ndcg_linear@5": 0.75896196577168,
854
+ "ndcg_linear@10": 0.7771824352969045,
855
+ "ndcg_exponential@1": 0.643,
856
+ "ndcg_exponential@5": 0.75896196577168,
857
+ "ndcg_exponential@10": 0.7771824352969045,
858
+ "precision@1": 0.643,
859
+ "precision@5": 0.1702,
860
+ "precision@10": 0.09070000000000002,
861
+ "recall@1": 0.643,
862
+ "recall@5": 0.851,
863
+ "recall@10": 0.907,
864
+ "f1@1": 0.643,
865
+ "f1@5": 0.28366666666666673,
866
+ "f1@10": 0.16490909090909087,
867
+ "map@1": 0.643,
868
+ "map@5": 0.7279166666666668,
869
+ "map@10": 0.7354976190476191,
870
+ "mrr@1": 0.643,
871
+ "mrr@5": 0.7279166666666668,
872
+ "mrr@10": 0.7354976190476191,
873
+ "num_pred": 1000,
874
+ "num_data": 1000
875
+ },
876
+ "EDIS": {
877
+ "hit@1": 0.841,
878
+ "hit@5": 0.982,
879
+ "hit@10": 0.991,
880
+ "ndcg_linear@1": 0.841,
881
+ "ndcg_linear@5": 0.919465963451109,
882
+ "ndcg_linear@10": 0.9224571152777739,
883
+ "ndcg_exponential@1": 0.841,
884
+ "ndcg_exponential@5": 0.919465963451109,
885
+ "ndcg_exponential@10": 0.9224571152777739,
886
+ "precision@1": 0.841,
887
+ "precision@5": 0.19640000000000005,
888
+ "precision@10": 0.09910000000000002,
889
+ "recall@1": 0.841,
890
+ "recall@5": 0.982,
891
+ "recall@10": 0.991,
892
+ "f1@1": 0.841,
893
+ "f1@5": 0.3273333333333333,
894
+ "f1@10": 0.18018181818181817,
895
+ "map@1": 0.841,
896
+ "map@5": 0.8983833333333333,
897
+ "map@10": 0.8996650793650793,
898
+ "mrr@1": 0.841,
899
+ "mrr@5": 0.8983833333333333,
900
+ "mrr@10": 0.8996650793650793,
901
+ "num_pred": 1000,
902
+ "num_data": 1000
903
+ },
904
+ "MSCOCO": {
905
+ "hit@1": 0.671,
906
+ "hit@5": 0.796,
907
+ "hit@10": 0.846,
908
+ "ndcg_linear@1": 0.671,
909
+ "ndcg_linear@5": 0.7385700746119735,
910
+ "ndcg_linear@10": 0.75471044609582,
911
+ "ndcg_exponential@1": 0.671,
912
+ "ndcg_exponential@5": 0.7385700746119735,
913
+ "ndcg_exponential@10": 0.75471044609582,
914
+ "precision@1": 0.671,
915
+ "precision@5": 0.1592,
916
+ "precision@10": 0.0846,
917
+ "recall@1": 0.671,
918
+ "recall@5": 0.796,
919
+ "recall@10": 0.846,
920
+ "f1@1": 0.671,
921
+ "f1@5": 0.26533333333333337,
922
+ "f1@10": 0.15381818181818183,
923
+ "map@1": 0.671,
924
+ "map@5": 0.7193833333333334,
925
+ "map@10": 0.7260313492063492,
926
+ "mrr@1": 0.671,
927
+ "mrr@5": 0.7193833333333334,
928
+ "mrr@10": 0.7260313492063492,
929
+ "num_pred": 1000,
930
+ "num_data": 1000
931
+ },
932
+ "RefCOCO": {
933
+ "hit@1": 0.871,
934
+ "hit@5": 0.978,
935
+ "hit@10": 0.992,
936
+ "ndcg_linear@1": 0.871,
937
+ "ndcg_linear@5": 0.9320666707886123,
938
+ "ndcg_linear@10": 0.9367513120480281,
939
+ "ndcg_exponential@1": 0.871,
940
+ "ndcg_exponential@5": 0.9320666707886123,
941
+ "ndcg_exponential@10": 0.9367513120480281,
942
+ "precision@1": 0.871,
943
+ "precision@5": 0.19560000000000002,
944
+ "precision@10": 0.09920000000000001,
945
+ "recall@1": 0.871,
946
+ "recall@5": 0.978,
947
+ "recall@10": 0.992,
948
+ "f1@1": 0.871,
949
+ "f1@5": 0.326,
950
+ "f1@10": 0.18036363636363634,
951
+ "map@1": 0.871,
952
+ "map@5": 0.9164333333333334,
953
+ "map@10": 0.9184607142857143,
954
+ "mrr@1": 0.871,
955
+ "mrr@5": 0.9164333333333334,
956
+ "mrr@10": 0.9184607142857143,
957
+ "num_pred": 1000,
958
+ "num_data": 1000
959
+ },
960
+ "RefCOCO-Matching": {
961
+ "hit@1": 0.858,
962
+ "hit@5": 1.0,
963
+ "hit@10": 1.0,
964
+ "ndcg_linear@1": 0.858,
965
+ "ndcg_linear@5": 0.948647694865312,
966
+ "ndcg_linear@10": 0.948647694865312,
967
+ "ndcg_exponential@1": 0.858,
968
+ "ndcg_exponential@5": 0.948647694865312,
969
+ "ndcg_exponential@10": 0.948647694865312,
970
+ "precision@1": 0.858,
971
+ "precision@5": 0.20000000000000004,
972
+ "precision@10": 0.10000000000000002,
973
+ "recall@1": 0.858,
974
+ "recall@5": 1.0,
975
+ "recall@10": 1.0,
976
+ "f1@1": 0.858,
977
+ "f1@5": 0.3333333333333333,
978
+ "f1@10": 0.18181818181818182,
979
+ "map@1": 0.858,
980
+ "map@5": 0.93095,
981
+ "map@10": 0.93095,
982
+ "mrr@1": 0.858,
983
+ "mrr@5": 0.92795,
984
+ "mrr@10": 0.92795,
985
+ "num_pred": 1000,
986
+ "num_data": 1000
987
+ },
988
+ "Visual7W-Pointing": {
989
+ "hit@1": 0.692,
990
+ "hit@5": 0.865,
991
+ "hit@10": 0.906,
992
+ "ndcg_linear@1": 0.692,
993
+ "ndcg_linear@5": 0.7886508353101727,
994
+ "ndcg_linear@10": 0.8018399920089694,
995
+ "ndcg_exponential@1": 0.692,
996
+ "ndcg_exponential@5": 0.7886508353101727,
997
+ "ndcg_exponential@10": 0.8018399920089694,
998
+ "precision@1": 0.692,
999
+ "precision@5": 0.173,
1000
+ "precision@10": 0.09060000000000001,
1001
+ "recall@1": 0.692,
1002
+ "recall@5": 0.865,
1003
+ "recall@10": 0.906,
1004
+ "f1@1": 0.692,
1005
+ "f1@5": 0.2883333333333334,
1006
+ "f1@10": 0.16472727272727272,
1007
+ "map@1": 0.692,
1008
+ "map@5": 0.7628499999999999,
1009
+ "map@10": 0.7682543650793651,
1010
+ "mrr@1": 0.692,
1011
+ "mrr@5": 0.7628499999999999,
1012
+ "mrr@10": 0.7682543650793651,
1013
+ "num_pred": 1000,
1014
+ "num_data": 1000
1015
+ }
1016
+ },
1017
+ "video": {
1018
+ "K700": {
1019
+ "hit@1": 0.38,
1020
+ "hit@5": 0.623,
1021
+ "hit@10": 0.697,
1022
+ "ndcg_linear@1": 0.38,
1023
+ "ndcg_linear@5": 0.5087323881529896,
1024
+ "ndcg_linear@10": 0.5328292310353233,
1025
+ "ndcg_exponential@1": 0.38,
1026
+ "ndcg_exponential@5": 0.5087323881529896,
1027
+ "ndcg_exponential@10": 0.5328292310353233,
1028
+ "precision@1": 0.38,
1029
+ "precision@5": 0.12459999999999999,
1030
+ "precision@10": 0.06969999999999998,
1031
+ "recall@1": 0.38,
1032
+ "recall@5": 0.623,
1033
+ "recall@10": 0.697,
1034
+ "f1@1": 0.38,
1035
+ "f1@5": 0.20766666666666675,
1036
+ "f1@10": 0.12672727272727274,
1037
+ "map@1": 0.38,
1038
+ "map@5": 0.4706833333333333,
1039
+ "map@10": 0.4807186507936508,
1040
+ "mrr@1": 0.38,
1041
+ "mrr@5": 0.4706833333333333,
1042
+ "mrr@10": 0.4807186507936508,
1043
+ "num_pred": 1000,
1044
+ "num_data": 1000
1045
+ },
1046
+ "SmthSmthV2": {
1047
+ "hit@1": 0.428,
1048
+ "hit@5": 0.692,
1049
+ "hit@10": 0.786,
1050
+ "ndcg_linear@1": 0.428,
1051
+ "ndcg_linear@5": 0.5672834391090181,
1052
+ "ndcg_linear@10": 0.5981163502873708,
1053
+ "ndcg_exponential@1": 0.428,
1054
+ "ndcg_exponential@5": 0.5672834391090181,
1055
+ "ndcg_exponential@10": 0.5981163502873708,
1056
+ "precision@1": 0.428,
1057
+ "precision@5": 0.13839999999999997,
1058
+ "precision@10": 0.07859999999999999,
1059
+ "recall@1": 0.428,
1060
+ "recall@5": 0.692,
1061
+ "recall@10": 0.786,
1062
+ "f1@1": 0.428,
1063
+ "f1@5": 0.23066666666666674,
1064
+ "f1@10": 0.14290909090909093,
1065
+ "map@1": 0.428,
1066
+ "map@5": 0.5259333333333333,
1067
+ "map@10": 0.5389079365079364,
1068
+ "mrr@1": 0.428,
1069
+ "mrr@5": 0.5259333333333333,
1070
+ "mrr@10": 0.5389079365079364,
1071
+ "num_pred": 1000,
1072
+ "num_data": 1000
1073
+ },
1074
+ "HMDB51": {
1075
+ "hit@1": 0.409,
1076
+ "hit@5": 0.638,
1077
+ "hit@10": 0.713,
1078
+ "ndcg_linear@1": 0.409,
1079
+ "ndcg_linear@5": 0.5335348498920724,
1080
+ "ndcg_linear@10": 0.5576824580140078,
1081
+ "ndcg_exponential@1": 0.409,
1082
+ "ndcg_exponential@5": 0.5335348498920724,
1083
+ "ndcg_exponential@10": 0.5576824580140078,
1084
+ "precision@1": 0.409,
1085
+ "precision@5": 0.12760000000000002,
1086
+ "precision@10": 0.0713,
1087
+ "recall@1": 0.409,
1088
+ "recall@5": 0.638,
1089
+ "recall@10": 0.713,
1090
+ "f1@1": 0.409,
1091
+ "f1@5": 0.21266666666666673,
1092
+ "f1@10": 0.12963636363636366,
1093
+ "map@1": 0.409,
1094
+ "map@5": 0.49854999999999994,
1095
+ "map@10": 0.5084662698412699,
1096
+ "mrr@1": 0.409,
1097
+ "mrr@5": 0.49854999999999994,
1098
+ "mrr@10": 0.5084662698412699,
1099
+ "num_pred": 1000,
1100
+ "num_data": 1000
1101
+ },
1102
+ "UCF101": {
1103
+ "hit@1": 0.6,
1104
+ "hit@5": 0.831,
1105
+ "hit@10": 0.888,
1106
+ "ndcg_linear@1": 0.6,
1107
+ "ndcg_linear@5": 0.728875610371988,
1108
+ "ndcg_linear@10": 0.7473187422682429,
1109
+ "ndcg_exponential@1": 0.6,
1110
+ "ndcg_exponential@5": 0.728875610371988,
1111
+ "ndcg_exponential@10": 0.7473187422682429,
1112
+ "precision@1": 0.6,
1113
+ "precision@5": 0.16620000000000001,
1114
+ "precision@10": 0.08880000000000002,
1115
+ "recall@1": 0.6,
1116
+ "recall@5": 0.831,
1117
+ "recall@10": 0.888,
1118
+ "f1@1": 0.6,
1119
+ "f1@5": 0.277,
1120
+ "f1@10": 0.16145454545454543,
1121
+ "map@1": 0.6,
1122
+ "map@5": 0.6944166666666668,
1123
+ "map@10": 0.7020325396825396,
1124
+ "mrr@1": 0.6,
1125
+ "mrr@5": 0.6944166666666668,
1126
+ "mrr@10": 0.7020325396825396,
1127
+ "num_pred": 1000,
1128
+ "num_data": 1000
1129
+ },
1130
+ "Breakfast": {
1131
+ "hit@1": 0.14780600461893764,
1132
+ "hit@5": 0.6327944572748267,
1133
+ "hit@10": 1.0,
1134
+ "ndcg_linear@1": 0.14780600461893764,
1135
+ "ndcg_linear@5": 0.3858298763211173,
1136
+ "ndcg_linear@10": 0.5069598731135728,
1137
+ "ndcg_exponential@1": 0.14780600461893764,
1138
+ "ndcg_exponential@5": 0.3858298763211173,
1139
+ "ndcg_exponential@10": 0.5069598731135728,
1140
+ "precision@1": 0.14780600461893764,
1141
+ "precision@5": 0.12655889145496535,
1142
+ "precision@10": 0.1,
1143
+ "recall@1": 0.14780600461893764,
1144
+ "recall@5": 0.6327944572748267,
1145
+ "recall@10": 1.0,
1146
+ "f1@1": 0.14780600461893764,
1147
+ "f1@5": 0.21093148575827564,
1148
+ "f1@10": 0.1818181818181818,
1149
+ "map@1": 0.14780600461893764,
1150
+ "map@5": 0.30546574287913775,
1151
+ "map@10": 0.3568477583489131,
1152
+ "mrr@1": 0.14780600461893764,
1153
+ "mrr@5": 0.30546574287913775,
1154
+ "mrr@10": 0.3568477583489131,
1155
+ "num_pred": 433,
1156
+ "num_data": 433
1157
+ },
1158
+ "MVBench": {
1159
+ "hit@1": 0.337,
1160
+ "hit@5": 1.0,
1161
+ "hit@10": 1.0,
1162
+ "ndcg_linear@1": 0.337,
1163
+ "ndcg_linear@5": 0.7011998180757394,
1164
+ "ndcg_linear@10": 0.7011998180757394,
1165
+ "ndcg_exponential@1": 0.337,
1166
+ "ndcg_exponential@5": 0.7011998180757394,
1167
+ "ndcg_exponential@10": 0.7011998180757394,
1168
+ "precision@1": 0.337,
1169
+ "precision@5": 0.20000000000000004,
1170
+ "precision@10": 0.10000000000000002,
1171
+ "recall@1": 0.337,
1172
+ "recall@5": 1.0,
1173
+ "recall@10": 1.0,
1174
+ "f1@1": 0.337,
1175
+ "f1@5": 0.3333333333333333,
1176
+ "f1@10": 0.18181818181818182,
1177
+ "map@1": 0.337,
1178
+ "map@5": 0.6002625,
1179
+ "map@10": 0.6002625,
1180
+ "mrr@1": 0.337,
1181
+ "mrr@5": 0.6002625,
1182
+ "mrr@10": 0.6002625,
1183
+ "num_pred": 4000,
1184
+ "num_data": 4000
1185
+ },
1186
+ "Video-MME": {
1187
+ "hit@1": 0.30703703703703705,
1188
+ "hit@5": 1.0,
1189
+ "hit@10": 1.0,
1190
+ "ndcg_linear@1": 0.30703703703703705,
1191
+ "ndcg_linear@5": 0.6745941548531916,
1192
+ "ndcg_linear@10": 0.6745941548531916,
1193
+ "ndcg_exponential@1": 0.30703703703703705,
1194
+ "ndcg_exponential@5": 0.6745941548531916,
1195
+ "ndcg_exponential@10": 0.6745941548531916,
1196
+ "precision@1": 0.30703703703703705,
1197
+ "precision@5": 0.19999999999999996,
1198
+ "precision@10": 0.09999999999999998,
1199
+ "recall@1": 0.30703703703703705,
1200
+ "recall@5": 1.0,
1201
+ "recall@10": 1.0,
1202
+ "f1@1": 0.30703703703703705,
1203
+ "f1@5": 0.3333333333333334,
1204
+ "f1@10": 0.18181818181818188,
1205
+ "map@1": 0.30703703703703705,
1206
+ "map@5": 0.5658024691358025,
1207
+ "map@10": 0.5658024691358025,
1208
+ "mrr@1": 0.30703703703703705,
1209
+ "mrr@5": 0.5658024691358025,
1210
+ "mrr@10": 0.5658024691358025,
1211
+ "num_pred": 2700,
1212
+ "num_data": 2700
1213
+ },
1214
+ "NExTQA": {
1215
+ "hit@1": 0.20924801494628678,
1216
+ "hit@5": 1.0,
1217
+ "hit@10": 1.0,
1218
+ "ndcg_linear@1": 0.20924801494628678,
1219
+ "ndcg_linear@5": 0.6098815656327321,
1220
+ "ndcg_linear@10": 0.6098815656327321,
1221
+ "ndcg_exponential@1": 0.20924801494628678,
1222
+ "ndcg_exponential@5": 0.6098815656327321,
1223
+ "ndcg_exponential@10": 0.6098815656327321,
1224
+ "precision@1": 0.20924801494628678,
1225
+ "precision@5": 0.20000000000000004,
1226
+ "precision@10": 0.10000000000000002,
1227
+ "recall@1": 0.20924801494628678,
1228
+ "recall@5": 1.0,
1229
+ "recall@10": 1.0,
1230
+ "f1@1": 0.20924801494628678,
1231
+ "f1@5": 0.3333333333333333,
1232
+ "f1@10": 0.1818181818181818,
1233
+ "map@1": 0.20924801494628678,
1234
+ "map@5": 0.4819554725206289,
1235
+ "map@10": 0.4819554725206289,
1236
+ "mrr@1": 0.20924801494628678,
1237
+ "mrr@5": 0.4817803207224038,
1238
+ "mrr@10": 0.4817803207224038,
1239
+ "num_pred": 8564,
1240
+ "num_data": 8564
1241
+ },
1242
+ "EgoSchema": {
1243
+ "hit@1": 0.34,
1244
+ "hit@5": 1.0,
1245
+ "hit@10": 1.0,
1246
+ "ndcg_linear@1": 0.34,
1247
+ "ndcg_linear@5": 0.6804792280158065,
1248
+ "ndcg_linear@10": 0.6804792280158065,
1249
+ "ndcg_exponential@1": 0.34,
1250
+ "ndcg_exponential@5": 0.6804792280158065,
1251
+ "ndcg_exponential@10": 0.6804792280158065,
1252
+ "precision@1": 0.34,
1253
+ "precision@5": 0.2,
1254
+ "precision@10": 0.1,
1255
+ "recall@1": 0.34,
1256
+ "recall@5": 1.0,
1257
+ "recall@10": 1.0,
1258
+ "f1@1": 0.34,
1259
+ "f1@5": 0.3333333333333333,
1260
+ "f1@10": 0.18181818181818182,
1261
+ "map@1": 0.34,
1262
+ "map@5": 0.5750333333333333,
1263
+ "map@10": 0.5750333333333333,
1264
+ "mrr@1": 0.34,
1265
+ "mrr@5": 0.5750333333333333,
1266
+ "mrr@10": 0.5750333333333333,
1267
+ "num_pred": 500,
1268
+ "num_data": 500
1269
+ },
1270
+ "ActivityNetQA": {
1271
+ "hit@1": 0.523,
1272
+ "hit@5": 1.0,
1273
+ "hit@10": 1.0,
1274
+ "ndcg_linear@1": 0.523,
1275
+ "ndcg_linear@5": 0.8239534924535853,
1276
+ "ndcg_linear@10": 0.8239534924535853,
1277
+ "ndcg_exponential@1": 0.523,
1278
+ "ndcg_exponential@5": 0.8239534924535853,
1279
+ "ndcg_exponential@10": 0.8239534924535853,
1280
+ "precision@1": 0.523,
1281
+ "precision@5": 0.20000000000000004,
1282
+ "precision@10": 0.10000000000000002,
1283
+ "recall@1": 0.523,
1284
+ "recall@5": 1.0,
1285
+ "recall@10": 1.0,
1286
+ "f1@1": 0.523,
1287
+ "f1@5": 0.3333333333333333,
1288
+ "f1@10": 0.18181818181818182,
1289
+ "map@1": 0.523,
1290
+ "map@5": 0.7615,
1291
+ "map@10": 0.7615,
1292
+ "mrr@1": 0.523,
1293
+ "mrr@5": 0.7615,
1294
+ "mrr@10": 0.7615,
1295
+ "num_pred": 1000,
1296
+ "num_data": 1000
1297
+ },
1298
+ "DiDeMo": {
1299
+ "hit@1": 0.30378486055776893,
1300
+ "hit@5": 0.5388446215139442,
1301
+ "hit@10": 0.6314741035856574,
1302
+ "ndcg_linear@1": 0.30378486055776893,
1303
+ "ndcg_linear@5": 0.42742924340418204,
1304
+ "ndcg_linear@10": 0.4573351329841821,
1305
+ "ndcg_exponential@1": 0.30378486055776893,
1306
+ "ndcg_exponential@5": 0.42742924340418204,
1307
+ "ndcg_exponential@10": 0.4573351329841821,
1308
+ "precision@1": 0.30378486055776893,
1309
+ "precision@5": 0.10776892430278884,
1310
+ "precision@10": 0.06314741035856573,
1311
+ "recall@1": 0.30378486055776893,
1312
+ "recall@5": 0.5388446215139442,
1313
+ "recall@10": 0.6314741035856574,
1314
+ "f1@1": 0.30378486055776893,
1315
+ "f1@5": 0.17961487383798144,
1316
+ "f1@10": 0.11481347337921044,
1317
+ "map@1": 0.30378486055776893,
1318
+ "map@5": 0.39047144754316065,
1319
+ "map@10": 0.40278568266616077,
1320
+ "mrr@1": 0.30378486055776893,
1321
+ "mrr@5": 0.39047144754316065,
1322
+ "mrr@10": 0.40278568266616077,
1323
+ "num_pred": 1004,
1324
+ "num_data": 1004
1325
+ },
1326
+ "MSR-VTT": {
1327
+ "hit@1": 0.283,
1328
+ "hit@5": 0.504,
1329
+ "hit@10": 0.594,
1330
+ "ndcg_linear@1": 0.283,
1331
+ "ndcg_linear@5": 0.3981240408165469,
1332
+ "ndcg_linear@10": 0.4272757830933265,
1333
+ "ndcg_exponential@1": 0.283,
1334
+ "ndcg_exponential@5": 0.3981240408165469,
1335
+ "ndcg_exponential@10": 0.4272757830933265,
1336
+ "precision@1": 0.283,
1337
+ "precision@5": 0.1008,
1338
+ "precision@10": 0.059399999999999994,
1339
+ "recall@1": 0.283,
1340
+ "recall@5": 0.504,
1341
+ "recall@10": 0.594,
1342
+ "f1@1": 0.283,
1343
+ "f1@5": 0.16800000000000007,
1344
+ "f1@10": 0.10800000000000003,
1345
+ "map@1": 0.283,
1346
+ "map@5": 0.36315000000000003,
1347
+ "map@10": 0.3752111111111111,
1348
+ "mrr@1": 0.283,
1349
+ "mrr@5": 0.36315000000000003,
1350
+ "mrr@10": 0.3752111111111111,
1351
+ "num_pred": 1000,
1352
+ "num_data": 1000
1353
+ },
1354
+ "MSVD": {
1355
+ "hit@1": 0.48059701492537316,
1356
+ "hit@5": 0.7597014925373134,
1357
+ "hit@10": 0.844776119402985,
1358
+ "ndcg_linear@1": 0.48059701492537316,
1359
+ "ndcg_linear@5": 0.63096871065978,
1360
+ "ndcg_linear@10": 0.6588553080260654,
1361
+ "ndcg_exponential@1": 0.48059701492537316,
1362
+ "ndcg_exponential@5": 0.63096871065978,
1363
+ "ndcg_exponential@10": 0.6588553080260654,
1364
+ "precision@1": 0.48059701492537316,
1365
+ "precision@5": 0.15194029850746266,
1366
+ "precision@10": 0.0844776119402985,
1367
+ "recall@1": 0.48059701492537316,
1368
+ "recall@5": 0.7597014925373134,
1369
+ "recall@10": 0.844776119402985,
1370
+ "f1@1": 0.48059701492537316,
1371
+ "f1@5": 0.2532338308457712,
1372
+ "f1@10": 0.15359565807327005,
1373
+ "map@1": 0.48059701492537316,
1374
+ "map@5": 0.5879104477611939,
1375
+ "map@10": 0.5996434494195687,
1376
+ "mrr@1": 0.48059701492537316,
1377
+ "mrr@5": 0.5879104477611939,
1378
+ "mrr@10": 0.5996434494195687,
1379
+ "num_pred": 670,
1380
+ "num_data": 670
1381
+ },
1382
+ "VATEX": {
1383
+ "hit@1": 0.26462706565430993,
1384
+ "hit@5": 0.5015631978561857,
1385
+ "hit@10": 0.6045109423849933,
1386
+ "ndcg_linear@1": 0.26462706565430993,
1387
+ "ndcg_linear@5": 0.3881950217969347,
1388
+ "ndcg_linear@10": 0.4215820887400626,
1389
+ "ndcg_exponential@1": 0.26462706565430993,
1390
+ "ndcg_exponential@5": 0.3881950217969347,
1391
+ "ndcg_exponential@10": 0.4215820887400626,
1392
+ "precision@1": 0.26462706565430993,
1393
+ "precision@5": 0.10031263957123716,
1394
+ "precision@10": 0.06045109423849933,
1395
+ "recall@1": 0.26462706565430993,
1396
+ "recall@5": 0.5015631978561857,
1397
+ "recall@10": 0.6045109423849933,
1398
+ "f1@1": 0.26462706565430993,
1399
+ "f1@5": 0.16718773261872863,
1400
+ "f1@10": 0.10991108043363516,
1401
+ "map@1": 0.26462706565430993,
1402
+ "map@5": 0.35071460473425636,
1403
+ "map@10": 0.364550678094671,
1404
+ "mrr@1": 0.26462706565430993,
1405
+ "mrr@5": 0.35071460473425636,
1406
+ "mrr@10": 0.364550678094671,
1407
+ "num_pred": 4478,
1408
+ "num_data": 4478
1409
+ },
1410
+ "YouCook2": {
1411
+ "hit@1": 0.10632274300094369,
1412
+ "hit@5": 0.23057565272098143,
1413
+ "hit@10": 0.30009436929852157,
1414
+ "ndcg_linear@1": 0.10632274300094369,
1415
+ "ndcg_linear@5": 0.17033555328162955,
1416
+ "ndcg_linear@10": 0.19266164698283084,
1417
+ "ndcg_exponential@1": 0.10632274300094369,
1418
+ "ndcg_exponential@5": 0.17033555328162955,
1419
+ "ndcg_exponential@10": 0.19266164698283084,
1420
+ "precision@1": 0.10632274300094369,
1421
+ "precision@5": 0.04611513054419629,
1422
+ "precision@10": 0.030009436929852158,
1423
+ "recall@1": 0.10632274300094369,
1424
+ "recall@5": 0.23057565272098143,
1425
+ "recall@10": 0.30009436929852157,
1426
+ "f1@1": 0.10632274300094369,
1427
+ "f1@5": 0.07685855090699381,
1428
+ "f1@10": 0.054562612599731185,
1429
+ "map@1": 0.10632274300094369,
1430
+ "map@5": 0.150487574709028,
1431
+ "map@10": 0.15961231194795208,
1432
+ "mrr@1": 0.10632274300094369,
1433
+ "mrr@5": 0.150487574709028,
1434
+ "mrr@10": 0.15961231194795208,
1435
+ "num_pred": 3179,
1436
+ "num_data": 3179
1437
+ },
1438
+ "QVHighlight": {
1439
+ "hit@1": 0.4939981532779317,
1440
+ "hit@5": 0.8679593721144968,
1441
+ "hit@10": 1.0,
1442
+ "ndcg_linear@1": 0.4939981532779317,
1443
+ "ndcg_linear@5": 0.6946135135669718,
1444
+ "ndcg_linear@10": 0.7373262762832604,
1445
+ "ndcg_exponential@1": 0.4939981532779317,
1446
+ "ndcg_exponential@5": 0.6946135135669718,
1447
+ "ndcg_exponential@10": 0.7373262762832604,
1448
+ "precision@1": 0.4939981532779317,
1449
+ "precision@5": 0.17359187442289936,
1450
+ "precision@10": 0.09999999999999998,
1451
+ "recall@1": 0.4939981532779317,
1452
+ "recall@5": 0.8679593721144968,
1453
+ "recall@10": 1.0,
1454
+ "f1@1": 0.4939981532779317,
1455
+ "f1@5": 0.2893197907048323,
1456
+ "f1@10": 0.18181818181818185,
1457
+ "map@1": 0.4939981532779317,
1458
+ "map@5": 0.636734379809172,
1459
+ "map@10": 0.6543771709976696,
1460
+ "mrr@1": 0.4939981532779317,
1461
+ "mrr@5": 0.636734379809172,
1462
+ "mrr@10": 0.6543771709976696,
1463
+ "num_pred": 1083,
1464
+ "num_data": 1083
1465
+ },
1466
+ "Charades-STA": {
1467
+ "hit@1": 0.20220082530949107,
1468
+ "hit@5": 0.6011004126547456,
1469
+ "hit@10": 1.0,
1470
+ "ndcg_linear@1": 0.20220082530949107,
1471
+ "ndcg_linear@5": 0.3987840994710363,
1472
+ "ndcg_linear@10": 0.524544158533619,
1473
+ "ndcg_exponential@1": 0.20220082530949107,
1474
+ "ndcg_exponential@5": 0.3987840994710363,
1475
+ "ndcg_exponential@10": 0.524544158533619,
1476
+ "precision@1": 0.20220082530949107,
1477
+ "precision@5": 0.1202200825309491,
1478
+ "precision@10": 0.09999999999999998,
1479
+ "recall@1": 0.20220082530949107,
1480
+ "recall@5": 0.6011004126547456,
1481
+ "recall@10": 1.0,
1482
+ "f1@1": 0.20220082530949107,
1483
+ "f1@5": 0.20036680421824854,
1484
+ "f1@10": 0.18181818181818185,
1485
+ "map@1": 0.20220082530949107,
1486
+ "map@5": 0.3330353049060064,
1487
+ "map@10": 0.38307897207484554,
1488
+ "mrr@1": 0.20220082530949107,
1489
+ "mrr@5": 0.3330353049060064,
1490
+ "mrr@10": 0.38307897207484554,
1491
+ "num_pred": 727,
1492
+ "num_data": 727
1493
+ },
1494
+ "MomentSeeker": {
1495
+ "hit@1": 0.4083333333333333,
1496
+ "hit@5": 0.8861111111111111,
1497
+ "hit@10": 1.0,
1498
+ "ndcg_linear@1": 0.4083333333333333,
1499
+ "ndcg_linear@5": 0.6586571278564146,
1500
+ "ndcg_linear@10": 0.7020363910751584,
1501
+ "ndcg_exponential@1": 0.4083333333333333,
1502
+ "ndcg_exponential@5": 0.6586571278564146,
1503
+ "ndcg_exponential@10": 0.7020363910751584,
1504
+ "precision@1": 0.4083333333333333,
1505
+ "precision@5": 0.1951111111111111,
1506
+ "precision@10": 0.11277777777777781,
1507
+ "recall@1": 0.3842824074074074,
1508
+ "recall@5": 0.8708564814814814,
1509
+ "recall@10": 0.9982175925925925,
1510
+ "f1@1": 0.39165520282186944,
1511
+ "f1@5": 0.3137015453682121,
1512
+ "f1@10": 0.20007009194509193,
1513
+ "map@1": 0.4083333333333333,
1514
+ "map@5": 0.5822586419753087,
1515
+ "map@10": 0.6026371527777779,
1516
+ "mrr@1": 0.4083333333333333,
1517
+ "mrr@5": 0.5929629629629629,
1518
+ "mrr@10": 0.6089462081128747,
1519
+ "num_pred": 1800,
1520
+ "num_data": 1800
1521
+ }
1522
+ },
1523
+ "visdoc": {
1524
+ "ViDoRe_arxivqa": {
1525
+ "hit@1": 0.734,
1526
+ "hit@5": 0.866,
1527
+ "hit@10": 0.906,
1528
+ "ndcg_linear@1": 0.734,
1529
+ "ndcg_linear@5": 0.8057573987022552,
1530
+ "ndcg_linear@10": 0.8188064742981096,
1531
+ "ndcg_exponential@1": 0.734,
1532
+ "ndcg_exponential@5": 0.8057573987022552,
1533
+ "ndcg_exponential@10": 0.8188064742981096,
1534
+ "precision@1": 0.734,
1535
+ "precision@5": 0.1732,
1536
+ "precision@10": 0.0906,
1537
+ "recall@1": 0.734,
1538
+ "recall@5": 0.866,
1539
+ "recall@10": 0.906,
1540
+ "f1@1": 0.734,
1541
+ "f1@5": 0.28866666666666674,
1542
+ "f1@10": 0.16472727272727275,
1543
+ "map@1": 0.734,
1544
+ "map@5": 0.7856000000000001,
1545
+ "map@10": 0.7910603174603175,
1546
+ "mrr@1": 0.734,
1547
+ "mrr@5": 0.7856000000000001,
1548
+ "mrr@10": 0.7910603174603175,
1549
+ "num_pred": 500,
1550
+ "num_data": 500
1551
+ },
1552
+ "ViDoRe_docvqa": {
1553
+ "hit@1": 0.35033259423503327,
1554
+ "hit@5": 0.541019955654102,
1555
+ "hit@10": 0.6208425720620843,
1556
+ "ndcg_linear@1": 0.35033259423503327,
1557
+ "ndcg_linear@5": 0.4484886950768515,
1558
+ "ndcg_linear@10": 0.47338485947788617,
1559
+ "ndcg_exponential@1": 0.35033259423503327,
1560
+ "ndcg_exponential@5": 0.4484886950768515,
1561
+ "ndcg_exponential@10": 0.47338485947788617,
1562
+ "precision@1": 0.35033259423503327,
1563
+ "precision@5": 0.10953436807095342,
1564
+ "precision@10": 0.06341463414634146,
1565
+ "recall@1": 0.34320029563932003,
1566
+ "recall@5": 0.5335920177383592,
1567
+ "recall@10": 0.6106060606060606,
1568
+ "f1@1": 0.34476093012678377,
1569
+ "f1@5": 0.18059028489444562,
1570
+ "f1@10": 0.11417931661834103,
1571
+ "map@1": 0.35033259423503327,
1572
+ "map@5": 0.41779995072678,
1573
+ "map@10": 0.42790588814979064,
1574
+ "mrr@1": 0.35033259423503327,
1575
+ "mrr@5": 0.4246119733924612,
1576
+ "mrr@10": 0.4349144757681343,
1577
+ "num_pred": 451,
1578
+ "num_data": 451
1579
+ },
1580
+ "ViDoRe_infovqa": {
1581
+ "hit@1": 0.7732793522267206,
1582
+ "hit@5": 0.8947368421052632,
1583
+ "hit@10": 0.9412955465587044,
1584
+ "ndcg_linear@1": 0.7732793522267206,
1585
+ "ndcg_linear@5": 0.836933803347616,
1586
+ "ndcg_linear@10": 0.852452939253696,
1587
+ "ndcg_exponential@1": 0.7732793522267206,
1588
+ "ndcg_exponential@5": 0.836933803347616,
1589
+ "ndcg_exponential@10": 0.852452939253696,
1590
+ "precision@1": 0.7732793522267206,
1591
+ "precision@5": 0.17894736842105263,
1592
+ "precision@10": 0.09433198380566803,
1593
+ "recall@1": 0.7732793522267206,
1594
+ "recall@5": 0.8937246963562753,
1595
+ "recall@10": 0.9412955465587044,
1596
+ "f1@1": 0.7732793522267206,
1597
+ "f1@5": 0.29814921920185083,
1598
+ "f1@10": 0.17145135566188197,
1599
+ "map@1": 0.7732793522267206,
1600
+ "map@5": 0.817914979757085,
1601
+ "map@10": 0.8244569757727652,
1602
+ "mrr@1": 0.7732793522267206,
1603
+ "mrr@5": 0.8182523616734144,
1604
+ "mrr@10": 0.8245051731893837,
1605
+ "num_pred": 494,
1606
+ "num_data": 494
1607
+ },
1608
+ "ViDoRe_tabfquad": {
1609
+ "hit@1": 0.8107142857142857,
1610
+ "hit@5": 0.9571428571428572,
1611
+ "hit@10": 0.975,
1612
+ "ndcg_linear@1": 0.8107142857142857,
1613
+ "ndcg_linear@5": 0.8920767921191974,
1614
+ "ndcg_linear@10": 0.8982104341600656,
1615
+ "ndcg_exponential@1": 0.8107142857142857,
1616
+ "ndcg_exponential@5": 0.8920767921191974,
1617
+ "ndcg_exponential@10": 0.8982104341600656,
1618
+ "precision@1": 0.8107142857142857,
1619
+ "precision@5": 0.19142857142857142,
1620
+ "precision@10": 0.09749999999999999,
1621
+ "recall@1": 0.8107142857142857,
1622
+ "recall@5": 0.9571428571428572,
1623
+ "recall@10": 0.975,
1624
+ "f1@1": 0.8107142857142857,
1625
+ "f1@5": 0.31904761904761914,
1626
+ "f1@10": 0.1772727272727273,
1627
+ "map@1": 0.8107142857142857,
1628
+ "map@5": 0.8701190476190476,
1629
+ "map@10": 0.8728613945578231,
1630
+ "mrr@1": 0.8107142857142857,
1631
+ "mrr@5": 0.8701190476190476,
1632
+ "mrr@10": 0.8728613945578231,
1633
+ "num_pred": 280,
1634
+ "num_data": 280
1635
+ },
1636
+ "ViDoRe_tatdqa": {
1637
+ "hit@1": 0.30741190765492105,
1638
+ "hit@5": 0.5577156743620899,
1639
+ "hit@10": 0.6433778857837181,
1640
+ "ndcg_linear@1": 0.30741190765492105,
1641
+ "ndcg_linear@5": 0.4382195288905396,
1642
+ "ndcg_linear@10": 0.4658056006683759,
1643
+ "ndcg_exponential@1": 0.30741190765492105,
1644
+ "ndcg_exponential@5": 0.4382195288905396,
1645
+ "ndcg_exponential@10": 0.4658056006683759,
1646
+ "precision@1": 0.30741190765492105,
1647
+ "precision@5": 0.1117861482381531,
1648
+ "precision@10": 0.06452004860267314,
1649
+ "recall@1": 0.30650060753341435,
1650
+ "recall@5": 0.5565613608748481,
1651
+ "recall@10": 0.6422235722964762,
1652
+ "f1@1": 0.3068043742405832,
1653
+ "f1@5": 0.18601515940519592,
1654
+ "f1@10": 0.11718583158437353,
1655
+ "map@1": 0.30741190765492105,
1656
+ "map@5": 0.39878898339408664,
1657
+ "map@10": 0.41010757198788794,
1658
+ "mrr@1": 0.30741190765492105,
1659
+ "mrr@5": 0.39935196435803966,
1660
+ "mrr@10": 0.41067257806322205,
1661
+ "num_pred": 1646,
1662
+ "num_data": 1646
1663
+ },
1664
+ "ViDoRe_shiftproject": {
1665
+ "hit@1": 0.45,
1666
+ "hit@5": 0.74,
1667
+ "hit@10": 0.87,
1668
+ "ndcg_linear@1": 0.45,
1669
+ "ndcg_linear@5": 0.608217112664813,
1670
+ "ndcg_linear@10": 0.650000125092289,
1671
+ "ndcg_exponential@1": 0.45,
1672
+ "ndcg_exponential@5": 0.608217112664813,
1673
+ "ndcg_exponential@10": 0.650000125092289,
1674
+ "precision@1": 0.45,
1675
+ "precision@5": 0.14799999999999996,
1676
+ "precision@10": 0.08699999999999998,
1677
+ "recall@1": 0.45,
1678
+ "recall@5": 0.74,
1679
+ "recall@10": 0.87,
1680
+ "f1@1": 0.45,
1681
+ "f1@5": 0.24666666666666667,
1682
+ "f1@10": 0.1581818181818182,
1683
+ "map@1": 0.45,
1684
+ "map@5": 0.564,
1685
+ "map@10": 0.5810912698412699,
1686
+ "mrr@1": 0.45,
1687
+ "mrr@5": 0.564,
1688
+ "mrr@10": 0.5810912698412699,
1689
+ "num_pred": 100,
1690
+ "num_data": 100
1691
+ },
1692
+ "ViDoRe_syntheticDocQA_artificial_intelligence": {
1693
+ "hit@1": 0.76,
1694
+ "hit@5": 0.97,
1695
+ "hit@10": 0.98,
1696
+ "ndcg_linear@1": 0.76,
1697
+ "ndcg_linear@5": 0.8852555261521673,
1698
+ "ndcg_linear@10": 0.8882658261088071,
1699
+ "ndcg_exponential@1": 0.76,
1700
+ "ndcg_exponential@5": 0.8852555261521673,
1701
+ "ndcg_exponential@10": 0.8882658261088071,
1702
+ "precision@1": 0.76,
1703
+ "precision@5": 0.19399999999999995,
1704
+ "precision@10": 0.09799999999999998,
1705
+ "recall@1": 0.76,
1706
+ "recall@5": 0.97,
1707
+ "recall@10": 0.98,
1708
+ "f1@1": 0.76,
1709
+ "f1@5": 0.3233333333333334,
1710
+ "f1@10": 0.17818181818181827,
1711
+ "map@1": 0.76,
1712
+ "map@5": 0.8558333333333333,
1713
+ "map@10": 0.8569444444444444,
1714
+ "mrr@1": 0.76,
1715
+ "mrr@5": 0.8558333333333333,
1716
+ "mrr@10": 0.8569444444444444,
1717
+ "num_pred": 100,
1718
+ "num_data": 100
1719
+ },
1720
+ "ViDoRe_syntheticDocQA_energy": {
1721
+ "hit@1": 0.79,
1722
+ "hit@5": 0.93,
1723
+ "hit@10": 0.97,
1724
+ "ndcg_linear@1": 0.79,
1725
+ "ndcg_linear@5": 0.8650828475372231,
1726
+ "ndcg_linear@10": 0.8780588117396043,
1727
+ "ndcg_exponential@1": 0.79,
1728
+ "ndcg_exponential@5": 0.8650828475372231,
1729
+ "ndcg_exponential@10": 0.8780588117396043,
1730
+ "precision@1": 0.79,
1731
+ "precision@5": 0.18599999999999994,
1732
+ "precision@10": 0.09699999999999999,
1733
+ "recall@1": 0.79,
1734
+ "recall@5": 0.93,
1735
+ "recall@10": 0.97,
1736
+ "f1@1": 0.79,
1737
+ "f1@5": 0.31000000000000005,
1738
+ "f1@10": 0.17636363636363647,
1739
+ "map@1": 0.79,
1740
+ "map@5": 0.8433333333333333,
1741
+ "map@10": 0.8486904761904762,
1742
+ "mrr@1": 0.79,
1743
+ "mrr@5": 0.8433333333333333,
1744
+ "mrr@10": 0.8486904761904762,
1745
+ "num_pred": 100,
1746
+ "num_data": 100
1747
+ },
1748
+ "ViDoRe_syntheticDocQA_government_reports": {
1749
+ "hit@1": 0.74,
1750
+ "hit@5": 0.94,
1751
+ "hit@10": 0.98,
1752
+ "ndcg_linear@1": 0.74,
1753
+ "ndcg_linear@5": 0.8501367970825706,
1754
+ "ndcg_linear@10": 0.8630184664460052,
1755
+ "ndcg_exponential@1": 0.74,
1756
+ "ndcg_exponential@5": 0.8501367970825706,
1757
+ "ndcg_exponential@10": 0.8630184664460052,
1758
+ "precision@1": 0.74,
1759
+ "precision@5": 0.18799999999999997,
1760
+ "precision@10": 0.09799999999999999,
1761
+ "recall@1": 0.74,
1762
+ "recall@5": 0.94,
1763
+ "recall@10": 0.98,
1764
+ "f1@1": 0.74,
1765
+ "f1@5": 0.3133333333333334,
1766
+ "f1@10": 0.17818181818181825,
1767
+ "map@1": 0.74,
1768
+ "map@5": 0.8198333333333332,
1769
+ "map@10": 0.825111111111111,
1770
+ "mrr@1": 0.74,
1771
+ "mrr@5": 0.8198333333333332,
1772
+ "mrr@10": 0.825111111111111,
1773
+ "num_pred": 100,
1774
+ "num_data": 100
1775
+ },
1776
+ "ViDoRe_syntheticDocQA_healthcare_industry": {
1777
+ "hit@1": 0.84,
1778
+ "hit@5": 0.98,
1779
+ "hit@10": 0.99,
1780
+ "ndcg_linear@1": 0.84,
1781
+ "ndcg_linear@5": 0.9217065065186136,
1782
+ "ndcg_linear@10": 0.9252685783896938,
1783
+ "ndcg_exponential@1": 0.84,
1784
+ "ndcg_exponential@5": 0.9217065065186136,
1785
+ "ndcg_exponential@10": 0.9252685783896938,
1786
+ "precision@1": 0.84,
1787
+ "precision@5": 0.19599999999999998,
1788
+ "precision@10": 0.09899999999999999,
1789
+ "recall@1": 0.84,
1790
+ "recall@5": 0.98,
1791
+ "recall@10": 0.99,
1792
+ "f1@1": 0.84,
1793
+ "f1@5": 0.32666666666666677,
1794
+ "f1@10": 0.18000000000000008,
1795
+ "map@1": 0.84,
1796
+ "map@5": 0.9016666666666667,
1797
+ "map@10": 0.9033333333333334,
1798
+ "mrr@1": 0.84,
1799
+ "mrr@5": 0.9016666666666667,
1800
+ "mrr@10": 0.9033333333333334,
1801
+ "num_pred": 100,
1802
+ "num_data": 100
1803
+ },
1804
+ "ViDoRe_esg_reports_human_labeled_v2": {
1805
+ "hit@1": 0.38461538461538464,
1806
+ "hit@5": 0.6730769230769231,
1807
+ "hit@10": 0.8461538461538461,
1808
+ "ndcg_linear@1": 0.375,
1809
+ "ndcg_linear@5": 0.4555552886561195,
1810
+ "ndcg_linear@10": 0.511493540486886,
1811
+ "ndcg_exponential@1": 0.37179487179487186,
1812
+ "ndcg_exponential@5": 0.4541859231025376,
1813
+ "ndcg_exponential@10": 0.5099104815026472,
1814
+ "precision@1": 0.38461538461538464,
1815
+ "precision@5": 0.19230769230769226,
1816
+ "precision@10": 0.13076923076923078,
1817
+ "recall@1": 0.23621794871794868,
1818
+ "recall@5": 0.5487179487179487,
1819
+ "recall@10": 0.7033882783882782,
1820
+ "f1@1": 0.2715483234714004,
1821
+ "f1@5": 0.25723492194080433,
1822
+ "f1@10": 0.2026450736292365,
1823
+ "map@1": 0.38461538461538464,
1824
+ "map@5": 0.3914850427350427,
1825
+ "map@10": 0.415758547008547,
1826
+ "mrr@1": 0.38461538461538464,
1827
+ "mrr@5": 0.491025641025641,
1828
+ "mrr@10": 0.5144993894993896,
1829
+ "num_pred": 52,
1830
+ "num_data": 52
1831
+ },
1832
+ "ViDoRe_biomedical_lectures_v2_multilingual": {
1833
+ "hit@1": 0.36875,
1834
+ "hit@5": 0.7171875,
1835
+ "hit@10": 0.8203125,
1836
+ "ndcg_linear@1": 0.36875,
1837
+ "ndcg_linear@5": 0.4426897295015239,
1838
+ "ndcg_linear@10": 0.4850950127175607,
1839
+ "ndcg_exponential@1": 0.36875,
1840
+ "ndcg_exponential@5": 0.4426897295015239,
1841
+ "ndcg_exponential@10": 0.4850950127175607,
1842
+ "precision@1": 0.36875,
1843
+ "precision@5": 0.203125,
1844
+ "precision@10": 0.13968750000000002,
1845
+ "recall@1": 0.23270833333333335,
1846
+ "recall@5": 0.49864999124649856,
1847
+ "recall@10": 0.6150380777310923,
1848
+ "f1@1": 0.2621073457792208,
1849
+ "f1@5": 0.25601551313270066,
1850
+ "f1@10": 0.20543311717898116,
1851
+ "map@1": 0.36875,
1852
+ "map@5": 0.3719822048611111,
1853
+ "map@10": 0.3923365021789966,
1854
+ "mrr@1": 0.36875,
1855
+ "mrr@5": 0.497265625,
1856
+ "mrr@10": 0.5111972966269841,
1857
+ "num_pred": 640,
1858
+ "num_data": 640
1859
+ },
1860
+ "ViDoRe_economics_reports_v2_multilingual": {
1861
+ "hit@1": 0.4525862068965517,
1862
+ "hit@5": 0.8103448275862069,
1863
+ "hit@10": 0.9267241379310345,
1864
+ "ndcg_linear@1": 0.4525862068965517,
1865
+ "ndcg_linear@5": 0.42995014841633666,
1866
+ "ndcg_linear@10": 0.43467280891274934,
1867
+ "ndcg_exponential@1": 0.4525862068965517,
1868
+ "ndcg_exponential@5": 0.4299501484163365,
1869
+ "ndcg_exponential@10": 0.43467280891274934,
1870
+ "precision@1": 0.4525862068965517,
1871
+ "precision@5": 0.38448275862068965,
1872
+ "precision@10": 0.33103448275862074,
1873
+ "recall@1": 0.049016392011628045,
1874
+ "recall@5": 0.22829352926193736,
1875
+ "recall@10": 0.36167397868493684,
1876
+ "f1@1": 0.08115811949451532,
1877
+ "f1@5": 0.22694280671921516,
1878
+ "f1@10": 0.27660068249123476,
1879
+ "map@1": 0.4525862068965517,
1880
+ "map@5": 0.3282327586206897,
1881
+ "map@10": 0.2973695391710324,
1882
+ "mrr@1": 0.4525862068965517,
1883
+ "mrr@5": 0.5951867816091955,
1884
+ "mrr@10": 0.6120929118773947,
1885
+ "num_pred": 232,
1886
+ "num_data": 232
1887
+ },
1888
+ "ViDoRe_esg_reports_v2_multilingual": {
1889
+ "hit@1": 0.4692982456140351,
1890
+ "hit@5": 0.7719298245614035,
1891
+ "hit@10": 0.8640350877192983,
1892
+ "ndcg_linear@1": 0.4692982456140351,
1893
+ "ndcg_linear@5": 0.466179429204456,
1894
+ "ndcg_linear@10": 0.5017617250757785,
1895
+ "ndcg_exponential@1": 0.4692982456140351,
1896
+ "ndcg_exponential@5": 0.466179429204456,
1897
+ "ndcg_exponential@10": 0.5017617250757785,
1898
+ "precision@1": 0.4692982456140351,
1899
+ "precision@5": 0.21929824561403508,
1900
+ "precision@10": 0.15131578947368426,
1901
+ "recall@1": 0.2380325814536341,
1902
+ "recall@5": 0.4968671679197995,
1903
+ "recall@10": 0.6020624477861319,
1904
+ "f1@1": 0.28556649037592774,
1905
+ "f1@5": 0.26698957296533893,
1906
+ "f1@10": 0.21278941819922756,
1907
+ "map@1": 0.4692982456140351,
1908
+ "map@5": 0.38164961013645227,
1909
+ "map@10": 0.39600202763854087,
1910
+ "mrr@1": 0.4692982456140351,
1911
+ "mrr@5": 0.5818713450292398,
1912
+ "mrr@10": 0.594714216095795,
1913
+ "num_pred": 228,
1914
+ "num_data": 228
1915
+ },
1916
+ "VisRAG_ArxivQA": {
1917
+ "hit@1": 0.7022058823529411,
1918
+ "hit@5": 0.821078431372549,
1919
+ "hit@10": 0.8615196078431373,
1920
+ "ndcg_linear@1": 0.7022058823529411,
1921
+ "ndcg_linear@5": 0.7687028213602233,
1922
+ "ndcg_linear@10": 0.7817454060088397,
1923
+ "ndcg_exponential@1": 0.7022058823529411,
1924
+ "ndcg_exponential@5": 0.7687028213602233,
1925
+ "ndcg_exponential@10": 0.7817454060088397,
1926
+ "precision@1": 0.7022058823529411,
1927
+ "precision@5": 0.1642156862745098,
1928
+ "precision@10": 0.08615196078431371,
1929
+ "recall@1": 0.7022058823529411,
1930
+ "recall@5": 0.821078431372549,
1931
+ "recall@10": 0.8615196078431373,
1932
+ "f1@1": 0.7022058823529411,
1933
+ "f1@5": 0.2736928104575164,
1934
+ "f1@10": 0.15663992869875223,
1935
+ "map@1": 0.7022058823529411,
1936
+ "map@5": 0.7510212418300654,
1937
+ "map@10": 0.7563827614379085,
1938
+ "mrr@1": 0.7022058823529411,
1939
+ "mrr@5": 0.7510212418300654,
1940
+ "mrr@10": 0.7563827614379085,
1941
+ "num_pred": 816,
1942
+ "num_data": 816
1943
+ },
1944
+ "VisRAG_ChartQA": {
1945
+ "hit@1": 0.7301587301587301,
1946
+ "hit@5": 0.9206349206349206,
1947
+ "hit@10": 0.9365079365079365,
1948
+ "ndcg_linear@1": 0.7301587301587301,
1949
+ "ndcg_linear@5": 0.8441010759070336,
1950
+ "ndcg_linear@10": 0.849392081198039,
1951
+ "ndcg_exponential@1": 0.7301587301587301,
1952
+ "ndcg_exponential@5": 0.8441010759070336,
1953
+ "ndcg_exponential@10": 0.849392081198039,
1954
+ "precision@1": 0.7301587301587301,
1955
+ "precision@5": 0.18412698412698403,
1956
+ "precision@10": 0.0936507936507936,
1957
+ "recall@1": 0.7301587301587301,
1958
+ "recall@5": 0.9206349206349206,
1959
+ "recall@10": 0.9365079365079365,
1960
+ "f1@1": 0.7301587301587301,
1961
+ "f1@5": 0.3068783068783068,
1962
+ "f1@10": 0.1702741702741703,
1963
+ "map@1": 0.7301587301587301,
1964
+ "map@5": 0.8174603174603174,
1965
+ "map@10": 0.8197278911564626,
1966
+ "mrr@1": 0.7301587301587301,
1967
+ "mrr@5": 0.8174603174603174,
1968
+ "mrr@10": 0.8197278911564626,
1969
+ "num_pred": 63,
1970
+ "num_data": 63
1971
+ },
1972
+ "VisRAG_MP-DocVQA": {
1973
+ "hit@1": 0.5922165820642978,
1974
+ "hit@5": 0.8206429780033841,
1975
+ "hit@10": 0.8663282571912013,
1976
+ "ndcg_linear@1": 0.5922165820642978,
1977
+ "ndcg_linear@5": 0.717924714040525,
1978
+ "ndcg_linear@10": 0.7327402059542735,
1979
+ "ndcg_exponential@1": 0.5922165820642978,
1980
+ "ndcg_exponential@5": 0.717924714040525,
1981
+ "ndcg_exponential@10": 0.7327402059542735,
1982
+ "precision@1": 0.5922165820642978,
1983
+ "precision@5": 0.16412859560067683,
1984
+ "precision@10": 0.08663282571912012,
1985
+ "recall@1": 0.5922165820642978,
1986
+ "recall@5": 0.8206429780033841,
1987
+ "recall@10": 0.8663282571912013,
1988
+ "f1@1": 0.5922165820642978,
1989
+ "f1@5": 0.2735476593344614,
1990
+ "f1@10": 0.15751422858021846,
1991
+ "map@1": 0.5922165820642978,
1992
+ "map@5": 0.6833051325437113,
1993
+ "map@10": 0.6894455187602395,
1994
+ "mrr@1": 0.5922165820642978,
1995
+ "mrr@5": 0.6833051325437113,
1996
+ "mrr@10": 0.6894455187602395,
1997
+ "num_pred": 591,
1998
+ "num_data": 591
1999
+ },
2000
+ "VisRAG_SlideVQA": {
2001
+ "hit@1": 0.8794964028776978,
2002
+ "hit@5": 0.9748201438848921,
2003
+ "hit@10": 0.9802158273381295,
2004
+ "ndcg_linear@1": 0.8794964028776978,
2005
+ "ndcg_linear@5": 0.9150078016078801,
2006
+ "ndcg_linear@10": 0.9207838812109942,
2007
+ "ndcg_exponential@1": 0.8794964028776978,
2008
+ "ndcg_exponential@5": 0.9150078016078801,
2009
+ "ndcg_exponential@10": 0.9207838812109942,
2010
+ "precision@1": 0.8794964028776978,
2011
+ "precision@5": 0.2384892086330935,
2012
+ "precision@10": 0.12176258992805757,
2013
+ "recall@1": 0.7598920863309353,
2014
+ "recall@5": 0.954136690647482,
2015
+ "recall@10": 0.9694244604316546,
2016
+ "f1@1": 0.7997601918465228,
2017
+ "f1@5": 0.37478588557725256,
2018
+ "f1@10": 0.2138652714192283,
2019
+ "map@1": 0.8794964028776978,
2020
+ "map@5": 0.8905575539568344,
2021
+ "map@10": 0.894137547105173,
2022
+ "mrr@1": 0.8794964028776978,
2023
+ "mrr@5": 0.9226618705035972,
2024
+ "mrr@10": 0.9233213429256595,
2025
+ "num_pred": 556,
2026
+ "num_data": 556
2027
+ },
2028
+ "VisRAG_InfoVQA": {
2029
+ "hit@1": 0.7465181058495822,
2030
+ "hit@5": 0.9415041782729805,
2031
+ "hit@10": 0.9665738161559888,
2032
+ "ndcg_linear@1": 0.7465181058495822,
2033
+ "ndcg_linear@5": 0.8565495992280632,
2034
+ "ndcg_linear@10": 0.8647865140019099,
2035
+ "ndcg_exponential@1": 0.7465181058495822,
2036
+ "ndcg_exponential@5": 0.8565495992280632,
2037
+ "ndcg_exponential@10": 0.8647865140019099,
2038
+ "precision@1": 0.7465181058495822,
2039
+ "precision@5": 0.18830083565459607,
2040
+ "precision@10": 0.09665738161559885,
2041
+ "recall@1": 0.7465181058495822,
2042
+ "recall@5": 0.9415041782729805,
2043
+ "recall@10": 0.9665738161559888,
2044
+ "f1@1": 0.7465181058495822,
2045
+ "f1@5": 0.31383472609099355,
2046
+ "f1@10": 0.1757406938465435,
2047
+ "map@1": 0.7465181058495822,
2048
+ "map@5": 0.827669452181987,
2049
+ "map@10": 0.8311491356059602,
2050
+ "mrr@1": 0.7465181058495822,
2051
+ "mrr@5": 0.827669452181987,
2052
+ "mrr@10": 0.8311491356059602,
2053
+ "num_pred": 718,
2054
+ "num_data": 718
2055
+ },
2056
+ "VisRAG_PlotQA": {
2057
+ "hit@1": 0.5052143684820394,
2058
+ "hit@5": 0.7937427578215527,
2059
+ "hit@10": 0.8887601390498262,
2060
+ "ndcg_linear@1": 0.5052143684820394,
2061
+ "ndcg_linear@5": 0.6604877574932249,
2062
+ "ndcg_linear@10": 0.6916336549342924,
2063
+ "ndcg_exponential@1": 0.5052143684820394,
2064
+ "ndcg_exponential@5": 0.6604877574932249,
2065
+ "ndcg_exponential@10": 0.6916336549342924,
2066
+ "precision@1": 0.5052143684820394,
2067
+ "precision@5": 0.15874855156431056,
2068
+ "precision@10": 0.08887601390498262,
2069
+ "recall@1": 0.5052143684820394,
2070
+ "recall@5": 0.7937427578215527,
2071
+ "recall@10": 0.8887601390498262,
2072
+ "f1@1": 0.5052143684820394,
2073
+ "f1@5": 0.26458091927385097,
2074
+ "f1@10": 0.1615927525545139,
2075
+ "map@1": 0.5052143684820394,
2076
+ "map@5": 0.6159907300115876,
2077
+ "map@10": 0.629089646673656,
2078
+ "mrr@1": 0.5052143684820394,
2079
+ "mrr@5": 0.6159907300115876,
2080
+ "mrr@10": 0.629089646673656,
2081
+ "num_pred": 863,
2082
+ "num_data": 863
2083
+ },
2084
+ "ViDoSeek-page": {
2085
+ "hit@1": 0.03502626970227671,
2086
+ "hit@5": 0.3975481611208406,
2087
+ "hit@10": 0.5674255691768827,
2088
+ "ndcg_linear@1": 0.03502626970227671,
2089
+ "ndcg_linear@5": 0.21944808482459283,
2090
+ "ndcg_linear@10": 0.2752564930475152,
2091
+ "ndcg_exponential@1": 0.03502626970227671,
2092
+ "ndcg_exponential@5": 0.21944808482459285,
2093
+ "ndcg_exponential@10": 0.2752564930475153,
2094
+ "precision@1": 0.03502626970227671,
2095
+ "precision@5": 0.07950963222416814,
2096
+ "precision@10": 0.05674255691768828,
2097
+ "recall@1": 0.03502626970227671,
2098
+ "recall@5": 0.3975481611208406,
2099
+ "recall@10": 0.5674255691768827,
2100
+ "f1@1": 0.03502626970227671,
2101
+ "f1@5": 0.13251605370694688,
2102
+ "f1@10": 0.10316828530488775,
2103
+ "map@1": 0.03502626970227671,
2104
+ "map@5": 0.16103327495621714,
2105
+ "map@10": 0.184575236983293,
2106
+ "mrr@1": 0.03502626970227671,
2107
+ "mrr@5": 0.16103327495621714,
2108
+ "mrr@10": 0.184575236983293,
2109
+ "num_pred": 1142,
2110
+ "num_data": 1142
2111
+ },
2112
+ "ViDoSeek-doc": {
2113
+ "hit@1": 0.9903677758318739,
2114
+ "hit@5": 0.9973730297723292,
2115
+ "hit@10": 0.9982486865148862,
2116
+ "ndcg_linear@1": 0.6762988908347927,
2117
+ "ndcg_linear@5": 0.8018406693375459,
2118
+ "ndcg_linear@10": 0.767343136404217,
2119
+ "ndcg_exponential@1": 0.4519639729797348,
2120
+ "ndcg_exponential@5": 0.6874729261482034,
2121
+ "ndcg_exponential@10": 0.6978420362198057,
2122
+ "precision@1": 0.9903677758318739,
2123
+ "precision@5": 0.8740805604203151,
2124
+ "precision@10": 0.7643607705779335,
2125
+ "recall@1": 0.05845834634908238,
2126
+ "recall@5": 0.2559977615058973,
2127
+ "recall@10": 0.4381450224554127,
2128
+ "f1@1": 0.1096528022965413,
2129
+ "f1@5": 0.388099043607817,
2130
+ "f1@10": 0.5446572421004792,
2131
+ "map@1": 0.9903677758318739,
2132
+ "map@5": 0.8628546409807355,
2133
+ "map@10": 0.7436259056064535,
2134
+ "mrr@1": 0.9903677758318739,
2135
+ "mrr@5": 0.9936077057793345,
2136
+ "mrr@10": 0.9937327995996997,
2137
+ "num_pred": 1142,
2138
+ "num_data": 1142
2139
+ },
2140
+ "MMLongBench-page": {
2141
+ "hit@1": 0.05250596658711217,
2142
+ "hit@5": 0.24224343675417662,
2143
+ "hit@10": 0.33890214797136037,
2144
+ "ndcg_linear@1": 0.05250596658711217,
2145
+ "ndcg_linear@5": 0.11893466223008214,
2146
+ "ndcg_linear@10": 0.15008296554980238,
2147
+ "ndcg_exponential@1": 0.05250596658711217,
2148
+ "ndcg_exponential@5": 0.11893466223008214,
2149
+ "ndcg_exponential@10": 0.15008296554980238,
2150
+ "precision@1": 0.05250596658711217,
2151
+ "precision@5": 0.056324582338902154,
2152
+ "precision@10": 0.04307875894988067,
2153
+ "recall@1": 0.028838504375497214,
2154
+ "recall@5": 0.1757174110694397,
2155
+ "recall@10": 0.2610182975338106,
2156
+ "f1@1": 0.03586377822654672,
2157
+ "f1@5": 0.08071268195513599,
2158
+ "f1@10": 0.07038494595369645,
2159
+ "map@1": 0.05250596658711217,
2160
+ "map@5": 0.08618237867939538,
2161
+ "map@10": 0.10006671765099569,
2162
+ "mrr@1": 0.05250596658711217,
2163
+ "mrr@5": 0.12171837708830548,
2164
+ "mrr@10": 0.13489174906239346,
2165
+ "num_pred": 838,
2166
+ "num_data": 838
2167
+ },
2168
+ "MMLongBench-doc": {
2169
+ "hit@1": 0.6157517899761337,
2170
+ "hit@5": 0.7482100238663485,
2171
+ "hit@10": 0.7947494033412887,
2172
+ "ndcg_linear@1": 0.4287987271280827,
2173
+ "ndcg_linear@5": 0.43709371712705786,
2174
+ "ndcg_linear@10": 0.4147091530579679,
2175
+ "ndcg_exponential@1": 0.2952608250937606,
2176
+ "ndcg_exponential@5": 0.3633856276662273,
2177
+ "ndcg_exponential@10": 0.36808988125041325,
2178
+ "precision@1": 0.6157517899761337,
2179
+ "precision@5": 0.4797136038186158,
2180
+ "precision@10": 0.41563245823389017,
2181
+ "recall@1": 0.01970187328257191,
2182
+ "recall@5": 0.07488813025872536,
2183
+ "recall@10": 0.12545835862481708,
2184
+ "f1@1": 0.03781026144552173,
2185
+ "f1@5": 0.12459954660237356,
2186
+ "f1@10": 0.18139093061449052,
2187
+ "map@1": 0.6157517899761337,
2188
+ "map@5": 0.44125696101829753,
2189
+ "map@10": 0.36061324308738785,
2190
+ "mrr@1": 0.6157517899761337,
2191
+ "mrr@5": 0.6687947494033414,
2192
+ "mrr@10": 0.6751861006932606,
2193
+ "num_pred": 838,
2194
+ "num_data": 838
2195
+ }
2196
+ }
2197
+ }
2198
+ }