yydxlv commited on
Commit
baabfbf
1 Parent(s): 2b1b168

Upload 7 files

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
preprocessor_config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_convert_rgb": true,
3
+ "do_normalize": true,
4
+ "do_rescale": true,
5
+ "do_resize": true,
6
+ "image_mean": [
7
+ 0.48145466,
8
+ 0.4578275,
9
+ 0.40821073
10
+ ],
11
+ "image_processor_type": "Qwen2VLImageProcessor",
12
+ "image_std": [
13
+ 0.26862954,
14
+ 0.26130258,
15
+ 0.27577711
16
+ ],
17
+ "max_pixels": 12845056,
18
+ "merge_size": 2,
19
+ "min_pixels": 3136,
20
+ "patch_size": 14,
21
+ "processor_class": "ColQwen2Processor",
22
+ "resample": 3,
23
+ "rescale_factor": 0.00392156862745098,
24
+ "size": {
25
+ "max_pixels": 12845056,
26
+ "min_pixels": 3136
27
+ },
28
+ "temporal_patch_size": 2
29
+ }
results.json ADDED
@@ -0,0 +1,583 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "metrics": {
3
+ "syntheticDocQA_artificial_intelligence_test": {
4
+ "ndcg_at_1": 0.97,
5
+ "ndcg_at_3": 0.98893,
6
+ "ndcg_at_5": 0.98893,
7
+ "ndcg_at_10": 0.98893,
8
+ "ndcg_at_20": 0.98893,
9
+ "ndcg_at_50": 0.98893,
10
+ "ndcg_at_100": 0.98893,
11
+ "map_at_1": 0.97,
12
+ "map_at_3": 0.985,
13
+ "map_at_5": 0.985,
14
+ "map_at_10": 0.985,
15
+ "map_at_20": 0.985,
16
+ "map_at_50": 0.985,
17
+ "map_at_100": 0.985,
18
+ "recall_at_1": 0.97,
19
+ "recall_at_3": 1.0,
20
+ "recall_at_5": 1.0,
21
+ "recall_at_10": 1.0,
22
+ "recall_at_20": 1.0,
23
+ "recall_at_50": 1.0,
24
+ "recall_at_100": 1.0,
25
+ "precision_at_1": 0.97,
26
+ "precision_at_3": 0.33333,
27
+ "precision_at_5": 0.2,
28
+ "precision_at_10": 0.1,
29
+ "precision_at_20": 0.05,
30
+ "precision_at_50": 0.02,
31
+ "precision_at_100": 0.01,
32
+ "mrr_at_1": 0.98,
33
+ "mrr_at_3": 0.99,
34
+ "mrr_at_5": 0.99,
35
+ "mrr_at_10": 0.99,
36
+ "mrr_at_20": 0.99,
37
+ "mrr_at_50": 0.99,
38
+ "mrr_at_100": 0.99,
39
+ "naucs_at_1_max": 0.6661998132586402,
40
+ "naucs_at_1_std": -0.2198879551820713,
41
+ "naucs_at_1_diff1": 1.0,
42
+ "naucs_at_3_max": 1.0,
43
+ "naucs_at_3_std": 1.0,
44
+ "naucs_at_3_diff1": 1.0,
45
+ "naucs_at_5_max": 1.0,
46
+ "naucs_at_5_std": 1.0,
47
+ "naucs_at_5_diff1": 1.0,
48
+ "naucs_at_10_max": 1.0,
49
+ "naucs_at_10_std": 1.0,
50
+ "naucs_at_10_diff1": 1.0,
51
+ "naucs_at_20_max": 1.0,
52
+ "naucs_at_20_std": 1.0,
53
+ "naucs_at_20_diff1": 1.0,
54
+ "naucs_at_50_max": null,
55
+ "naucs_at_50_std": null,
56
+ "naucs_at_50_diff1": null,
57
+ "naucs_at_100_max": null,
58
+ "naucs_at_100_std": null,
59
+ "naucs_at_100_diff1": null
60
+ },
61
+ "tabfquad_test_subsampled": {
62
+ "ndcg_at_1": 0.86786,
63
+ "ndcg_at_3": 0.91012,
64
+ "ndcg_at_5": 0.92026,
65
+ "ndcg_at_10": 0.92608,
66
+ "ndcg_at_20": 0.92787,
67
+ "ndcg_at_50": 0.93015,
68
+ "ndcg_at_100": 0.93015,
69
+ "map_at_1": 0.86786,
70
+ "map_at_3": 0.9,
71
+ "map_at_5": 0.90554,
72
+ "map_at_10": 0.90797,
73
+ "map_at_20": 0.90845,
74
+ "map_at_50": 0.90888,
75
+ "map_at_100": 0.90888,
76
+ "recall_at_1": 0.86786,
77
+ "recall_at_3": 0.93929,
78
+ "recall_at_5": 0.96429,
79
+ "recall_at_10": 0.98214,
80
+ "recall_at_20": 0.98929,
81
+ "recall_at_50": 1.0,
82
+ "recall_at_100": 1.0,
83
+ "precision_at_1": 0.86786,
84
+ "precision_at_3": 0.3131,
85
+ "precision_at_5": 0.19286,
86
+ "precision_at_10": 0.09821,
87
+ "precision_at_20": 0.04946,
88
+ "precision_at_50": 0.02,
89
+ "precision_at_100": 0.01,
90
+ "mrr_at_1": 0.8714285714285714,
91
+ "mrr_at_3": 0.9017857142857143,
92
+ "mrr_at_5": 0.9073214285714286,
93
+ "mrr_at_10": 0.9097123015873015,
94
+ "mrr_at_20": 0.9102083333333333,
95
+ "mrr_at_50": 0.9106373626373626,
96
+ "mrr_at_100": 0.9106373626373626,
97
+ "naucs_at_1_max": 0.5190267677952406,
98
+ "naucs_at_1_std": 0.20565850861417337,
99
+ "naucs_at_1_diff1": 0.8928115307425651,
100
+ "naucs_at_3_max": 0.6486790794749274,
101
+ "naucs_at_3_std": 0.4622947218102944,
102
+ "naucs_at_3_diff1": 0.9004503762289242,
103
+ "naucs_at_5_max": 0.8830532212885142,
104
+ "naucs_at_5_std": 0.6742296918767519,
105
+ "naucs_at_5_diff1": 0.9460784313725463,
106
+ "naucs_at_10_max": 0.8216619981325874,
107
+ "naucs_at_10_std": 0.4857142857142915,
108
+ "naucs_at_10_diff1": 0.9183006535947714,
109
+ "naucs_at_20_max": 1.0,
110
+ "naucs_at_20_std": 0.9564270152505505,
111
+ "naucs_at_20_diff1": 1.0,
112
+ "naucs_at_50_max": 1.0,
113
+ "naucs_at_50_std": 1.0,
114
+ "naucs_at_50_diff1": 1.0,
115
+ "naucs_at_100_max": 1.0,
116
+ "naucs_at_100_std": 1.0,
117
+ "naucs_at_100_diff1": 1.0
118
+ },
119
+ "shiftproject_test": {
120
+ "ndcg_at_1": 0.76,
121
+ "ndcg_at_3": 0.87833,
122
+ "ndcg_at_5": 0.88651,
123
+ "ndcg_at_10": 0.8894,
124
+ "ndcg_at_20": 0.8894,
125
+ "ndcg_at_50": 0.89133,
126
+ "ndcg_at_100": 0.89133,
127
+ "map_at_1": 0.76,
128
+ "map_at_3": 0.85,
129
+ "map_at_5": 0.8545,
130
+ "map_at_10": 0.8555,
131
+ "map_at_20": 0.8555,
132
+ "map_at_50": 0.85579,
133
+ "map_at_100": 0.85579,
134
+ "recall_at_1": 0.76,
135
+ "recall_at_3": 0.96,
136
+ "recall_at_5": 0.98,
137
+ "recall_at_10": 0.99,
138
+ "recall_at_20": 0.99,
139
+ "recall_at_50": 1.0,
140
+ "recall_at_100": 1.0,
141
+ "precision_at_1": 0.76,
142
+ "precision_at_3": 0.32,
143
+ "precision_at_5": 0.196,
144
+ "precision_at_10": 0.099,
145
+ "precision_at_20": 0.0495,
146
+ "precision_at_50": 0.02,
147
+ "precision_at_100": 0.01,
148
+ "mrr_at_1": 0.77,
149
+ "mrr_at_3": 0.86,
150
+ "mrr_at_5": 0.8645,
151
+ "mrr_at_10": 0.8656111111111112,
152
+ "mrr_at_20": 0.8656111111111112,
153
+ "mrr_at_50": 0.86590522875817,
154
+ "mrr_at_100": 0.86590522875817,
155
+ "naucs_at_1_max": 0.19752098295405382,
156
+ "naucs_at_1_std": -0.1442415851864674,
157
+ "naucs_at_1_diff1": 0.8336722332785322,
158
+ "naucs_at_3_max": 0.19946311858076338,
159
+ "naucs_at_3_std": -0.029178338001868868,
160
+ "naucs_at_3_diff1": 0.8978758169934614,
161
+ "naucs_at_5_max": 0.540149393090577,
162
+ "naucs_at_5_std": 0.24042950513538955,
163
+ "naucs_at_5_diff1": 0.861111111111116,
164
+ "naucs_at_10_max": 0.7222222222222276,
165
+ "naucs_at_10_std": 0.35807656395891135,
166
+ "naucs_at_10_diff1": 0.7222222222222276,
167
+ "naucs_at_20_max": 0.7222222222222276,
168
+ "naucs_at_20_std": 0.35807656395891135,
169
+ "naucs_at_20_diff1": 0.7222222222222276,
170
+ "naucs_at_50_max": null,
171
+ "naucs_at_50_std": null,
172
+ "naucs_at_50_diff1": null,
173
+ "naucs_at_100_max": null,
174
+ "naucs_at_100_std": null,
175
+ "naucs_at_100_diff1": null
176
+ },
177
+ "syntheticDocQA_government_reports_test": {
178
+ "ndcg_at_1": 0.92,
179
+ "ndcg_at_3": 0.96286,
180
+ "ndcg_at_5": 0.96286,
181
+ "ndcg_at_10": 0.96286,
182
+ "ndcg_at_20": 0.96565,
183
+ "ndcg_at_50": 0.96565,
184
+ "ndcg_at_100": 0.96565,
185
+ "map_at_1": 0.92,
186
+ "map_at_3": 0.95333,
187
+ "map_at_5": 0.95333,
188
+ "map_at_10": 0.95333,
189
+ "map_at_20": 0.95424,
190
+ "map_at_50": 0.95424,
191
+ "map_at_100": 0.95424,
192
+ "recall_at_1": 0.92,
193
+ "recall_at_3": 0.99,
194
+ "recall_at_5": 0.99,
195
+ "recall_at_10": 0.99,
196
+ "recall_at_20": 1.0,
197
+ "recall_at_50": 1.0,
198
+ "recall_at_100": 1.0,
199
+ "precision_at_1": 0.92,
200
+ "precision_at_3": 0.33,
201
+ "precision_at_5": 0.198,
202
+ "precision_at_10": 0.099,
203
+ "precision_at_20": 0.05,
204
+ "precision_at_50": 0.02,
205
+ "precision_at_100": 0.01,
206
+ "mrr_at_1": 0.93,
207
+ "mrr_at_3": 0.96,
208
+ "mrr_at_5": 0.96,
209
+ "mrr_at_10": 0.961,
210
+ "mrr_at_20": 0.961,
211
+ "mrr_at_50": 0.961,
212
+ "mrr_at_100": 0.961,
213
+ "naucs_at_1_max": 0.4417016806722691,
214
+ "naucs_at_1_std": 0.09599673202614255,
215
+ "naucs_at_1_diff1": 0.8999183006535953,
216
+ "naucs_at_3_max": 1.0,
217
+ "naucs_at_3_std": 0.12278244631183229,
218
+ "naucs_at_3_diff1": 1.0,
219
+ "naucs_at_5_max": 1.0,
220
+ "naucs_at_5_std": 0.12278244631185926,
221
+ "naucs_at_5_diff1": 1.0,
222
+ "naucs_at_10_max": 1.0,
223
+ "naucs_at_10_std": 0.12278244631185926,
224
+ "naucs_at_10_diff1": 1.0,
225
+ "naucs_at_20_max": 1.0,
226
+ "naucs_at_20_std": 1.0,
227
+ "naucs_at_20_diff1": 1.0,
228
+ "naucs_at_50_max": null,
229
+ "naucs_at_50_std": null,
230
+ "naucs_at_50_diff1": null,
231
+ "naucs_at_100_max": null,
232
+ "naucs_at_100_std": null,
233
+ "naucs_at_100_diff1": null
234
+ },
235
+ "infovqa_test_subsampled": {
236
+ "ndcg_at_1": 0.90283,
237
+ "ndcg_at_3": 0.92859,
238
+ "ndcg_at_5": 0.93539,
239
+ "ndcg_at_10": 0.93877,
240
+ "ndcg_at_20": 0.94183,
241
+ "ndcg_at_50": 0.94346,
242
+ "ndcg_at_100": 0.94378,
243
+ "map_at_1": 0.90283,
244
+ "map_at_3": 0.92274,
245
+ "map_at_5": 0.92659,
246
+ "map_at_10": 0.92804,
247
+ "map_at_20": 0.92887,
248
+ "map_at_50": 0.92915,
249
+ "map_at_100": 0.92917,
250
+ "recall_at_1": 0.90283,
251
+ "recall_at_3": 0.94534,
252
+ "recall_at_5": 0.96154,
253
+ "recall_at_10": 0.97166,
254
+ "recall_at_20": 0.98381,
255
+ "recall_at_50": 0.9919,
256
+ "recall_at_100": 0.99393,
257
+ "precision_at_1": 0.90283,
258
+ "precision_at_3": 0.31511,
259
+ "precision_at_5": 0.19231,
260
+ "precision_at_10": 0.09717,
261
+ "precision_at_20": 0.04919,
262
+ "precision_at_50": 0.01984,
263
+ "precision_at_100": 0.00994,
264
+ "mrr_at_1": 0.8967611336032388,
265
+ "mrr_at_3": 0.918353576248313,
266
+ "mrr_at_5": 0.9223009446693656,
267
+ "mrr_at_10": 0.924116380695328,
268
+ "mrr_at_20": 0.9248166923205465,
269
+ "mrr_at_50": 0.9251925733928332,
270
+ "mrr_at_100": 0.9252178770365579,
271
+ "naucs_at_1_max": 0.7032099887107416,
272
+ "naucs_at_1_std": 0.0019003151834775542,
273
+ "naucs_at_1_diff1": 0.9557773557438912,
274
+ "naucs_at_3_max": 0.8288721769160055,
275
+ "naucs_at_3_std": 0.21068169315514182,
276
+ "naucs_at_3_diff1": 0.9504045111146412,
277
+ "naucs_at_5_max": 0.8647951304327424,
278
+ "naucs_at_5_std": 0.5047446344096794,
279
+ "naucs_at_5_diff1": 0.9570172429660248,
280
+ "naucs_at_10_max": 0.9308492405555852,
281
+ "naucs_at_10_std": 0.6471514357346168,
282
+ "naucs_at_10_diff1": 0.9603236088917129,
283
+ "naucs_at_20_max": 0.9673496364838108,
284
+ "naucs_at_20_std": 0.9305663155604971,
285
+ "naucs_at_20_diff1": 1.0,
286
+ "naucs_at_50_max": 0.9346992729676393,
287
+ "naucs_at_50_std": 0.8611326311210196,
288
+ "naucs_at_50_diff1": 1.0,
289
+ "naucs_at_100_max": 0.9564661819784259,
290
+ "naucs_at_100_std": 0.8148435081613579,
291
+ "naucs_at_100_diff1": 1.0
292
+ },
293
+ "syntheticDocQA_healthcare_industry_test": {
294
+ "ndcg_at_1": 0.99,
295
+ "ndcg_at_3": 0.99631,
296
+ "ndcg_at_5": 0.99631,
297
+ "ndcg_at_10": 0.99631,
298
+ "ndcg_at_20": 0.99631,
299
+ "ndcg_at_50": 0.99631,
300
+ "ndcg_at_100": 0.99631,
301
+ "map_at_1": 0.99,
302
+ "map_at_3": 0.995,
303
+ "map_at_5": 0.995,
304
+ "map_at_10": 0.995,
305
+ "map_at_20": 0.995,
306
+ "map_at_50": 0.995,
307
+ "map_at_100": 0.995,
308
+ "recall_at_1": 0.99,
309
+ "recall_at_3": 1.0,
310
+ "recall_at_5": 1.0,
311
+ "recall_at_10": 1.0,
312
+ "recall_at_20": 1.0,
313
+ "recall_at_50": 1.0,
314
+ "recall_at_100": 1.0,
315
+ "precision_at_1": 0.99,
316
+ "precision_at_3": 0.33333,
317
+ "precision_at_5": 0.2,
318
+ "precision_at_10": 0.1,
319
+ "precision_at_20": 0.05,
320
+ "precision_at_50": 0.02,
321
+ "precision_at_100": 0.01,
322
+ "mrr_at_1": 0.99,
323
+ "mrr_at_3": 0.995,
324
+ "mrr_at_5": 0.995,
325
+ "mrr_at_10": 0.995,
326
+ "mrr_at_20": 0.995,
327
+ "mrr_at_50": 0.995,
328
+ "mrr_at_100": 0.995,
329
+ "naucs_at_1_max": 0.35807656395891085,
330
+ "naucs_at_1_std": 0.7222222222222201,
331
+ "naucs_at_1_diff1": 1.0,
332
+ "naucs_at_3_max": 1.0,
333
+ "naucs_at_3_std": 1.0,
334
+ "naucs_at_3_diff1": 1.0,
335
+ "naucs_at_5_max": 1.0,
336
+ "naucs_at_5_std": 1.0,
337
+ "naucs_at_5_diff1": 1.0,
338
+ "naucs_at_10_max": 1.0,
339
+ "naucs_at_10_std": 1.0,
340
+ "naucs_at_10_diff1": 1.0,
341
+ "naucs_at_20_max": 1.0,
342
+ "naucs_at_20_std": 1.0,
343
+ "naucs_at_20_diff1": 1.0,
344
+ "naucs_at_50_max": null,
345
+ "naucs_at_50_std": null,
346
+ "naucs_at_50_diff1": null,
347
+ "naucs_at_100_max": null,
348
+ "naucs_at_100_std": null,
349
+ "naucs_at_100_diff1": null
350
+ },
351
+ "syntheticDocQA_energy_test": {
352
+ "ndcg_at_1": 0.94,
353
+ "ndcg_at_3": 0.95762,
354
+ "ndcg_at_5": 0.95762,
355
+ "ndcg_at_10": 0.96411,
356
+ "ndcg_at_20": 0.96411,
357
+ "ndcg_at_50": 0.96621,
358
+ "ndcg_at_100": 0.96621,
359
+ "map_at_1": 0.94,
360
+ "map_at_3": 0.95333,
361
+ "map_at_5": 0.95333,
362
+ "map_at_10": 0.95601,
363
+ "map_at_20": 0.95601,
364
+ "map_at_50": 0.9564,
365
+ "map_at_100": 0.9564,
366
+ "recall_at_1": 0.94,
367
+ "recall_at_3": 0.97,
368
+ "recall_at_5": 0.97,
369
+ "recall_at_10": 0.99,
370
+ "recall_at_20": 0.99,
371
+ "recall_at_50": 1.0,
372
+ "recall_at_100": 1.0,
373
+ "precision_at_1": 0.94,
374
+ "precision_at_3": 0.32333,
375
+ "precision_at_5": 0.194,
376
+ "precision_at_10": 0.099,
377
+ "precision_at_20": 0.0495,
378
+ "precision_at_50": 0.02,
379
+ "precision_at_100": 0.01,
380
+ "mrr_at_1": 0.94,
381
+ "mrr_at_3": 0.9533333333333333,
382
+ "mrr_at_5": 0.9533333333333333,
383
+ "mrr_at_10": 0.956190476190476,
384
+ "mrr_at_20": 0.956190476190476,
385
+ "mrr_at_50": 0.9566071428571428,
386
+ "mrr_at_100": 0.9566071428571428,
387
+ "naucs_at_1_max": 0.5553999377528803,
388
+ "naucs_at_1_std": -0.8576097105508842,
389
+ "naucs_at_1_diff1": 1.0,
390
+ "naucs_at_3_max": 0.7424525365701778,
391
+ "naucs_at_3_std": -1.21708683473389,
392
+ "naucs_at_3_diff1": 1.0,
393
+ "naucs_at_5_max": 0.742452536570183,
394
+ "naucs_at_5_std": -1.2170868347338881,
395
+ "naucs_at_5_diff1": 1.0,
396
+ "naucs_at_10_max": 0.8692810457516413,
397
+ "naucs_at_10_std": -1.7399626517273863,
398
+ "naucs_at_10_diff1": 1.0,
399
+ "naucs_at_20_max": 0.8692810457516413,
400
+ "naucs_at_20_std": -1.7399626517273863,
401
+ "naucs_at_20_diff1": 1.0,
402
+ "naucs_at_50_max": null,
403
+ "naucs_at_50_std": null,
404
+ "naucs_at_50_diff1": null,
405
+ "naucs_at_100_max": null,
406
+ "naucs_at_100_std": null,
407
+ "naucs_at_100_diff1": null
408
+ },
409
+ "arxivqa_test_subsampled": {
410
+ "ndcg_at_1": 0.844,
411
+ "ndcg_at_3": 0.89107,
412
+ "ndcg_at_5": 0.90114,
413
+ "ndcg_at_10": 0.90777,
414
+ "ndcg_at_20": 0.91077,
415
+ "ndcg_at_50": 0.91363,
416
+ "ndcg_at_100": 0.91429,
417
+ "map_at_1": 0.844,
418
+ "map_at_3": 0.87967,
419
+ "map_at_5": 0.88537,
420
+ "map_at_10": 0.88818,
421
+ "map_at_20": 0.88899,
422
+ "map_at_50": 0.88948,
423
+ "map_at_100": 0.88954,
424
+ "recall_at_1": 0.844,
425
+ "recall_at_3": 0.924,
426
+ "recall_at_5": 0.948,
427
+ "recall_at_10": 0.968,
428
+ "recall_at_20": 0.98,
429
+ "recall_at_50": 0.994,
430
+ "recall_at_100": 0.998,
431
+ "precision_at_1": 0.844,
432
+ "precision_at_3": 0.308,
433
+ "precision_at_5": 0.1896,
434
+ "precision_at_10": 0.0968,
435
+ "precision_at_20": 0.049,
436
+ "precision_at_50": 0.01988,
437
+ "precision_at_100": 0.00998,
438
+ "mrr_at_1": 0.844,
439
+ "mrr_at_3": 0.8806666666666665,
440
+ "mrr_at_5": 0.8857666666666666,
441
+ "mrr_at_10": 0.888461111111111,
442
+ "mrr_at_20": 0.8893815257841571,
443
+ "mrr_at_50": 0.8897941261308093,
444
+ "mrr_at_100": 0.889852538829222,
445
+ "naucs_at_1_max": 0.8003780552136457,
446
+ "naucs_at_1_std": -0.21850586550779852,
447
+ "naucs_at_1_diff1": 0.9469027104423614,
448
+ "naucs_at_3_max": 0.8196594427244622,
449
+ "naucs_at_3_std": -0.19168018084426927,
450
+ "naucs_at_3_diff1": 0.9294805641554886,
451
+ "naucs_at_5_max": 0.873770020828847,
452
+ "naucs_at_5_std": -0.24251238957121693,
453
+ "naucs_at_5_diff1": 0.9277275012569133,
454
+ "naucs_at_10_max": 0.894228524743232,
455
+ "naucs_at_10_std": -0.20824579831933768,
456
+ "naucs_at_10_diff1": 0.9581290849673211,
457
+ "naucs_at_20_max": 0.9330065359477141,
458
+ "naucs_at_20_std": 0.06372549019607167,
459
+ "naucs_at_20_diff1": 0.9460784313725465,
460
+ "naucs_at_50_max": 0.9074074074073771,
461
+ "naucs_at_50_std": 0.4609399315281356,
462
+ "naucs_at_50_diff1": 0.9128540305010608,
463
+ "naucs_at_100_max": 1.0,
464
+ "naucs_at_100_std": 1.0,
465
+ "naucs_at_100_diff1": 1.0
466
+ },
467
+ "tatdqa_test": {
468
+ "ndcg_at_1": 0.70717,
469
+ "ndcg_at_3": 0.79727,
470
+ "ndcg_at_5": 0.81602,
471
+ "ndcg_at_10": 0.83047,
472
+ "ndcg_at_20": 0.83494,
473
+ "ndcg_at_50": 0.83746,
474
+ "ndcg_at_100": 0.83864,
475
+ "map_at_1": 0.70717,
476
+ "map_at_3": 0.77582,
477
+ "map_at_5": 0.78636,
478
+ "map_at_10": 0.79239,
479
+ "map_at_20": 0.79362,
480
+ "map_at_50": 0.79407,
481
+ "map_at_100": 0.79418,
482
+ "recall_at_1": 0.70717,
483
+ "recall_at_3": 0.85905,
484
+ "recall_at_5": 0.90401,
485
+ "recall_at_10": 0.94836,
486
+ "recall_at_20": 0.96598,
487
+ "recall_at_50": 0.97813,
488
+ "recall_at_100": 0.98542,
489
+ "precision_at_1": 0.70717,
490
+ "precision_at_3": 0.28635,
491
+ "precision_at_5": 0.1808,
492
+ "precision_at_10": 0.09484,
493
+ "precision_at_20": 0.0483,
494
+ "precision_at_50": 0.01956,
495
+ "precision_at_100": 0.00985,
496
+ "mrr_at_1": 0.7023086269744836,
497
+ "mrr_at_3": 0.7742000810044553,
498
+ "mrr_at_5": 0.7843458890238966,
499
+ "mrr_at_10": 0.7906075816312756,
500
+ "mrr_at_20": 0.7916419924247091,
501
+ "mrr_at_50": 0.7921731327579793,
502
+ "mrr_at_100": 0.7922646391503263,
503
+ "naucs_at_1_max": 0.2906046127459578,
504
+ "naucs_at_1_std": -0.09142586663565208,
505
+ "naucs_at_1_diff1": 0.8309895120853787,
506
+ "naucs_at_3_max": 0.3796718885973771,
507
+ "naucs_at_3_std": 0.10482653238007278,
508
+ "naucs_at_3_diff1": 0.7471424147638421,
509
+ "naucs_at_5_max": 0.3864536158297513,
510
+ "naucs_at_5_std": 0.1181445112698976,
511
+ "naucs_at_5_diff1": 0.7150521389103268,
512
+ "naucs_at_10_max": 0.4839255339546331,
513
+ "naucs_at_10_std": 0.31833706007680107,
514
+ "naucs_at_10_diff1": 0.7381822584022644,
515
+ "naucs_at_20_max": 0.5400727292289017,
516
+ "naucs_at_20_std": 0.4498780215876757,
517
+ "naucs_at_20_diff1": 0.7079690151340217,
518
+ "naucs_at_50_max": 0.5474120233459462,
519
+ "naucs_at_50_std": 0.5368176937394507,
520
+ "naucs_at_50_diff1": 0.6888921944972604,
521
+ "naucs_at_100_max": 0.4582633436145468,
522
+ "naucs_at_100_std": 0.418915162414328,
523
+ "naucs_at_100_diff1": 0.6404117260785882
524
+ },
525
+ "docvqa_test_subsampled": {
526
+ "ndcg_at_1": 0.52772,
527
+ "ndcg_at_3": 0.59582,
528
+ "ndcg_at_5": 0.61394,
529
+ "ndcg_at_10": 0.63728,
530
+ "ndcg_at_20": 0.6482,
531
+ "ndcg_at_50": 0.65777,
532
+ "ndcg_at_100": 0.66501,
533
+ "map_at_1": 0.52772,
534
+ "map_at_3": 0.57945,
535
+ "map_at_5": 0.58943,
536
+ "map_at_10": 0.5993,
537
+ "map_at_20": 0.60214,
538
+ "map_at_50": 0.60364,
539
+ "map_at_100": 0.60429,
540
+ "recall_at_1": 0.52772,
541
+ "recall_at_3": 0.64302,
542
+ "recall_at_5": 0.68736,
543
+ "recall_at_10": 0.75831,
544
+ "recall_at_20": 0.80266,
545
+ "recall_at_50": 0.85144,
546
+ "recall_at_100": 0.89579,
547
+ "precision_at_1": 0.52772,
548
+ "precision_at_3": 0.21434,
549
+ "precision_at_5": 0.13747,
550
+ "precision_at_10": 0.07583,
551
+ "precision_at_20": 0.04013,
552
+ "precision_at_50": 0.01703,
553
+ "precision_at_100": 0.00896,
554
+ "mrr_at_1": 0.5254988913525499,
555
+ "mrr_at_3": 0.5728011825572803,
556
+ "mrr_at_5": 0.584109386548411,
557
+ "mrr_at_10": 0.5947524020694751,
558
+ "mrr_at_20": 0.5975668878612459,
559
+ "mrr_at_50": 0.5990890888004771,
560
+ "mrr_at_100": 0.5996060790906476,
561
+ "naucs_at_1_max": 0.09552367711502079,
562
+ "naucs_at_1_std": 0.4562953212349874,
563
+ "naucs_at_1_diff1": 0.9160946322832428,
564
+ "naucs_at_3_max": -0.044115438920847336,
565
+ "naucs_at_3_std": 0.5742733170326745,
566
+ "naucs_at_3_diff1": 0.8655963522117655,
567
+ "naucs_at_5_max": -0.10576767278069941,
568
+ "naucs_at_5_std": 0.6507173054255285,
569
+ "naucs_at_5_diff1": 0.8353615090128605,
570
+ "naucs_at_10_max": -0.2764424505277048,
571
+ "naucs_at_10_std": 0.7587119579895203,
572
+ "naucs_at_10_diff1": 0.8510524017981272,
573
+ "naucs_at_20_max": -0.43743463755515927,
574
+ "naucs_at_20_std": 0.7826668175451623,
575
+ "naucs_at_20_diff1": 0.8554676478694768,
576
+ "naucs_at_50_max": -0.4574288492202119,
577
+ "naucs_at_50_std": 0.8851253371587365,
578
+ "naucs_at_50_diff1": 0.8465829220076285,
579
+ "naucs_at_100_max": -0.5265892443150121,
580
+ "naucs_at_100_std": 0.8821668553153678,
581
+ "naucs_at_100_diff1": 0.8424554142175609
582
+ }
583
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<|im_start|>",
4
+ "<|im_end|>",
5
+ "<|object_ref_start|>",
6
+ "<|object_ref_end|>",
7
+ "<|box_start|>",
8
+ "<|box_end|>",
9
+ "<|quad_start|>",
10
+ "<|quad_end|>",
11
+ "<|vision_start|>",
12
+ "<|vision_end|>",
13
+ "<|vision_pad|>",
14
+ "<|image_pad|>",
15
+ "<|video_pad|>"
16
+ ],
17
+ "eos_token": {
18
+ "content": "<|im_end|>",
19
+ "lstrip": false,
20
+ "normalized": false,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ },
24
+ "pad_token": {
25
+ "content": "<|endoftext|>",
26
+ "lstrip": false,
27
+ "normalized": false,
28
+ "rstrip": false,
29
+ "single_word": false
30
+ }
31
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:091aa7594dc2fcfbfa06b9e3c22a5f0562ac14f30375c13af7309407a0e67b8a
3
+ size 11420371
tokenizer_config.json ADDED
@@ -0,0 +1,145 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "151643": {
5
+ "content": "<|endoftext|>",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "151644": {
13
+ "content": "<|im_start|>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "151645": {
21
+ "content": "<|im_end|>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "151646": {
29
+ "content": "<|object_ref_start|>",
30
+ "lstrip": false,
31
+ "normalized": false,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "151647": {
37
+ "content": "<|object_ref_end|>",
38
+ "lstrip": false,
39
+ "normalized": false,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": true
43
+ },
44
+ "151648": {
45
+ "content": "<|box_start|>",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false,
50
+ "special": true
51
+ },
52
+ "151649": {
53
+ "content": "<|box_end|>",
54
+ "lstrip": false,
55
+ "normalized": false,
56
+ "rstrip": false,
57
+ "single_word": false,
58
+ "special": true
59
+ },
60
+ "151650": {
61
+ "content": "<|quad_start|>",
62
+ "lstrip": false,
63
+ "normalized": false,
64
+ "rstrip": false,
65
+ "single_word": false,
66
+ "special": true
67
+ },
68
+ "151651": {
69
+ "content": "<|quad_end|>",
70
+ "lstrip": false,
71
+ "normalized": false,
72
+ "rstrip": false,
73
+ "single_word": false,
74
+ "special": true
75
+ },
76
+ "151652": {
77
+ "content": "<|vision_start|>",
78
+ "lstrip": false,
79
+ "normalized": false,
80
+ "rstrip": false,
81
+ "single_word": false,
82
+ "special": true
83
+ },
84
+ "151653": {
85
+ "content": "<|vision_end|>",
86
+ "lstrip": false,
87
+ "normalized": false,
88
+ "rstrip": false,
89
+ "single_word": false,
90
+ "special": true
91
+ },
92
+ "151654": {
93
+ "content": "<|vision_pad|>",
94
+ "lstrip": false,
95
+ "normalized": false,
96
+ "rstrip": false,
97
+ "single_word": false,
98
+ "special": true
99
+ },
100
+ "151655": {
101
+ "content": "<|image_pad|>",
102
+ "lstrip": false,
103
+ "normalized": false,
104
+ "rstrip": false,
105
+ "single_word": false,
106
+ "special": true
107
+ },
108
+ "151656": {
109
+ "content": "<|video_pad|>",
110
+ "lstrip": false,
111
+ "normalized": false,
112
+ "rstrip": false,
113
+ "single_word": false,
114
+ "special": true
115
+ }
116
+ },
117
+ "additional_special_tokens": [
118
+ "<|im_start|>",
119
+ "<|im_end|>",
120
+ "<|object_ref_start|>",
121
+ "<|object_ref_end|>",
122
+ "<|box_start|>",
123
+ "<|box_end|>",
124
+ "<|quad_start|>",
125
+ "<|quad_end|>",
126
+ "<|vision_start|>",
127
+ "<|vision_end|>",
128
+ "<|vision_pad|>",
129
+ "<|image_pad|>",
130
+ "<|video_pad|>"
131
+ ],
132
+ "bos_token": null,
133
+ "chat_template": "{% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n{% endif %}<|im_start|>{{ message['role'] }}\n{% if message['content'] is string %}{{ message['content'] }}<|im_end|>\n{% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>\n{% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant\n{% endif %}",
134
+ "clean_up_tokenization_spaces": false,
135
+ "eos_token": "<|im_end|>",
136
+ "errors": "replace",
137
+ "extra_special_tokens": {},
138
+ "model_max_length": 32768,
139
+ "pad_token": "<|endoftext|>",
140
+ "padding_side": "left",
141
+ "processor_class": "ColQwen2Processor",
142
+ "split_special_tokens": false,
143
+ "tokenizer_class": "Qwen2Tokenizer",
144
+ "unk_token": null
145
+ }
vocab.json ADDED
The diff for this file is too large to render. See raw diff