zpn commited on
Commit
a6a691e
·
verified ·
1 Parent(s): 47ff4dc

Update results.json

Browse files
Files changed (1) hide show
  1. results.json +1100 -1106
results.json CHANGED
@@ -1,1110 +1,1104 @@
1
  {
2
- "metrics": {
3
- "vidore/arxivqa_test_subsampled": {
4
- "ndcg_at_1": 0.824,
5
- "ndcg_at_3": 0.86202,
6
- "ndcg_at_5": 0.87442,
7
- "ndcg_at_10": 0.88303,
8
- "ndcg_at_20": 0.88861,
9
- "ndcg_at_50": 0.8927,
10
- "ndcg_at_100": 0.89339,
11
- "map_at_1": 0.824,
12
- "map_at_3": 0.853,
13
- "map_at_5": 0.8599,
14
- "map_at_10": 0.86358,
15
- "map_at_20": 0.86512,
16
- "map_at_50": 0.86583,
17
- "map_at_100": 0.86591,
18
- "recall_at_1": 0.824,
19
- "recall_at_3": 0.888,
20
- "recall_at_5": 0.918,
21
- "recall_at_10": 0.944,
22
- "recall_at_20": 0.966,
23
- "recall_at_50": 0.986,
24
- "recall_at_100": 0.99,
25
- "precision_at_1": 0.824,
26
- "precision_at_3": 0.296,
27
- "precision_at_5": 0.1836,
28
- "precision_at_10": 0.0944,
29
- "precision_at_20": 0.0483,
30
- "precision_at_50": 0.01972,
31
- "precision_at_100": 0.0099,
32
- "mrr_at_1": 0.832,
33
- "mrr_at_3": 0.856,
34
- "mrr_at_5": 0.8632,
35
- "mrr_at_10": 0.86755,
36
- "mrr_at_20": 0.8687646325896324,
37
- "mrr_at_50": 0.8694855987079559,
38
- "mrr_at_100": 0.8695150104726618,
39
- "naucs_at_1_max": 0.8110100305865411,
40
- "naucs_at_1_std": 0.07361011155091818,
41
- "naucs_at_1_diff1": 0.9603893037063689,
42
- "naucs_at_3_max": 0.7977881493506478,
43
- "naucs_at_3_std": 0.013342126623376577,
44
- "naucs_at_3_diff1": 0.9239464962121198,
45
- "naucs_at_5_max": 0.8150463437407489,
46
- "naucs_at_5_std": 0.14904010384641533,
47
- "naucs_at_5_diff1": 0.9183006535947713,
48
- "naucs_at_10_max": 0.8759670534880637,
49
- "naucs_at_10_std": 0.2408463385354136,
50
- "naucs_at_10_diff1": 0.9323062558356668,
51
- "naucs_at_20_max": 0.9013016971494501,
52
- "naucs_at_20_std": 0.4259076179491429,
53
- "naucs_at_20_diff1": 0.9115724721261116,
54
- "naucs_at_50_max": 0.9229691876750605,
55
- "naucs_at_50_std": 0.7222889155662164,
56
- "naucs_at_50_diff1": 0.9019607843137241,
57
- "naucs_at_100_max": 0.8921568627450854,
58
- "naucs_at_100_std": 0.6373482726423866,
59
- "naucs_at_100_diff1": 0.9183006535947666
60
- },
61
- "vidore/docvqa_test_subsampled": {
62
- "ndcg_at_1": 0.52993,
63
- "ndcg_at_3": 0.59967,
64
- "ndcg_at_5": 0.61961,
65
- "ndcg_at_10": 0.63197,
66
- "ndcg_at_20": 0.64596,
67
- "ndcg_at_50": 0.65515,
68
- "ndcg_at_100": 0.66198,
69
- "map_at_1": 0.52993,
70
- "map_at_3": 0.58241,
71
- "map_at_5": 0.59339,
72
- "map_at_10": 0.59817,
73
- "map_at_20": 0.602,
74
- "map_at_50": 0.60345,
75
- "map_at_100": 0.60405,
76
- "recall_at_1": 0.52993,
77
- "recall_at_3": 0.64967,
78
- "recall_at_5": 0.69845,
79
- "recall_at_10": 0.73836,
80
- "recall_at_20": 0.79379,
81
- "recall_at_50": 0.84035,
82
- "recall_at_100": 0.88248,
83
- "precision_at_1": 0.52993,
84
- "precision_at_3": 0.21656,
85
- "precision_at_5": 0.13969,
86
- "precision_at_10": 0.07384,
87
- "precision_at_20": 0.03969,
88
- "precision_at_50": 0.01681,
89
- "precision_at_100": 0.00882,
90
- "mrr_at_1": 0.5277161862527716,
91
- "mrr_at_3": 0.5776053215077607,
92
- "mrr_at_5": 0.5888026607538803,
93
- "mrr_at_10": 0.5944919579065918,
94
- "mrr_at_20": 0.5983219637865657,
95
- "mrr_at_50": 0.5999309966010471,
96
- "mrr_at_100": 0.6005501639541099,
97
- "naucs_at_1_max": 0.37096765728763215,
98
- "naucs_at_1_std": 0.5363118108228696,
99
- "naucs_at_1_diff1": 0.9084586513989499,
100
- "naucs_at_3_max": 0.28536364371043943,
101
- "naucs_at_3_std": 0.656382780997437,
102
- "naucs_at_3_diff1": 0.8754285629546056,
103
- "naucs_at_5_max": 0.26490606879524303,
104
- "naucs_at_5_std": 0.6794242484186521,
105
- "naucs_at_5_diff1": 0.8670235151833391,
106
- "naucs_at_10_max": 0.17906145941266727,
107
- "naucs_at_10_std": 0.71951378124067,
108
- "naucs_at_10_diff1": 0.8623037540857623,
109
- "naucs_at_20_max": 0.039717430802327786,
110
- "naucs_at_20_std": 0.77907518789845,
111
- "naucs_at_20_diff1": 0.8711346514573685,
112
- "naucs_at_50_max": -0.06591984153859125,
113
- "naucs_at_50_std": 0.8944335077781369,
114
- "naucs_at_50_diff1": 0.872338054901137,
115
- "naucs_at_100_max": -0.18390488993971363,
116
- "naucs_at_100_std": 0.9432351742842897,
117
- "naucs_at_100_diff1": 0.8529357662557685
118
- },
119
- "vidore/infovqa_test_subsampled": {
120
- "ndcg_at_1": 0.89069,
121
- "ndcg_at_3": 0.9279,
122
- "ndcg_at_5": 0.93217,
123
- "ndcg_at_10": 0.93547,
124
- "ndcg_at_20": 0.9379,
125
- "ndcg_at_50": 0.93869,
126
- "ndcg_at_100": 0.93902,
127
- "map_at_1": 0.89069,
128
- "map_at_3": 0.91903,
129
- "map_at_5": 0.92146,
130
- "map_at_10": 0.92284,
131
- "map_at_20": 0.92344,
132
- "map_at_50": 0.92356,
133
- "map_at_100": 0.92359,
134
- "recall_at_1": 0.89069,
135
- "recall_at_3": 0.95344,
136
- "recall_at_5": 0.96356,
137
- "recall_at_10": 0.97368,
138
- "recall_at_20": 0.98381,
139
- "recall_at_50": 0.98785,
140
- "recall_at_100": 0.98988,
141
- "precision_at_1": 0.89069,
142
- "precision_at_3": 0.31781,
143
- "precision_at_5": 0.19271,
144
- "precision_at_10": 0.09737,
145
- "precision_at_20": 0.04919,
146
- "precision_at_50": 0.01976,
147
- "precision_at_100": 0.0099,
148
- "mrr_at_1": 0.8866396761133604,
149
- "mrr_at_3": 0.915991902834008,
150
- "mrr_at_5": 0.9190283400809716,
151
- "mrr_at_10": 0.9202091767881241,
152
- "mrr_at_20": 0.9207680541852368,
153
- "mrr_at_50": 0.9210783259706008,
154
- "mrr_at_100": 0.9211072444205719,
155
- "naucs_at_1_max": 0.6570120332617708,
156
- "naucs_at_1_std": 0.027148367339034946,
157
- "naucs_at_1_diff1": 0.954693725587737,
158
- "naucs_at_3_max": 0.8518572112090398,
159
- "naucs_at_3_std": 0.5033227123520332,
160
- "naucs_at_3_diff1": 0.9410604334985626,
161
- "naucs_at_5_max": 0.9198784015441375,
162
- "naucs_at_5_std": 0.6599441606302139,
163
- "naucs_at_5_diff1": 0.9628033833359825,
164
- "naucs_at_10_max": 0.9585432580086493,
165
- "naucs_at_10_std": 0.7697000086081518,
166
- "naucs_at_10_diff1": 1.0,
167
- "naucs_at_20_max": 0.9673496364838108,
168
- "naucs_at_20_std": 0.8687019487486011,
169
- "naucs_at_20_diff1": 1.0,
170
- "naucs_at_50_max": 0.9564661819783937,
171
- "naucs_at_50_std": 0.9319439680295378,
172
- "naucs_at_50_diff1": 1.0,
173
- "naucs_at_100_max": 0.9477594183740937,
174
- "naucs_at_100_std": 0.9183327616354471,
175
- "naucs_at_100_diff1": 1.0
176
- },
177
- "vidore/tabfquad_test_subsampled": {
178
- "ndcg_at_1": 0.89286,
179
- "ndcg_at_3": 0.93962,
180
- "ndcg_at_5": 0.94408,
181
- "ndcg_at_10": 0.94894,
182
- "ndcg_at_20": 0.94977,
183
- "ndcg_at_50": 0.94977,
184
- "ndcg_at_100": 0.94977,
185
- "map_at_1": 0.89286,
186
- "map_at_3": 0.92857,
187
- "map_at_5": 0.93107,
188
- "map_at_10": 0.93322,
189
- "map_at_20": 0.93341,
190
- "map_at_50": 0.93341,
191
- "map_at_100": 0.93341,
192
- "recall_at_1": 0.89286,
193
- "recall_at_3": 0.97143,
194
- "recall_at_5": 0.98214,
195
- "recall_at_10": 0.99643,
196
- "recall_at_20": 1.0,
197
- "recall_at_50": 1.0,
198
- "recall_at_100": 1.0,
199
- "precision_at_1": 0.89286,
200
- "precision_at_3": 0.32381,
201
- "precision_at_5": 0.19643,
202
- "precision_at_10": 0.09964,
203
- "precision_at_20": 0.05,
204
- "precision_at_50": 0.02,
205
- "precision_at_100": 0.01,
206
- "mrr_at_1": 0.8964285714285715,
207
- "mrr_at_3": 0.930952380952381,
208
- "mrr_at_5": 0.9336309523809524,
209
- "mrr_at_10": 0.9357780612244897,
210
- "mrr_at_20": 0.9359660311493018,
211
- "mrr_at_50": 0.9359660311493018,
212
- "mrr_at_100": 0.9359660311493018,
213
- "naucs_at_1_max": 0.589419152276295,
214
- "naucs_at_1_std": 0.25799058084772386,
215
- "naucs_at_1_diff1": 0.9168759811616957,
216
- "naucs_at_3_max": 0.8952497665732961,
217
- "naucs_at_3_std": 0.5145891690009315,
218
- "naucs_at_3_diff1": 0.8978758169934691,
219
- "naucs_at_5_max": 0.8585434173669502,
220
- "naucs_at_5_std": 0.6536881419234349,
221
- "naucs_at_5_diff1": 0.8627450980392123,
222
- "naucs_at_10_max": 1.0,
223
- "naucs_at_10_std": 1.0,
224
- "naucs_at_10_diff1": 0.72222222222224,
225
- "naucs_at_20_max": 1.0,
226
- "naucs_at_20_std": 1.0,
227
- "naucs_at_20_diff1": 1.0,
228
- "naucs_at_50_max": 1.0,
229
- "naucs_at_50_std": 1.0,
230
- "naucs_at_50_diff1": 1.0,
231
- "naucs_at_100_max": 1.0,
232
- "naucs_at_100_std": 1.0,
233
- "naucs_at_100_diff1": 1.0
234
- },
235
- "vidore/tatdqa_test": {
236
- "ndcg_at_1": 0.70717,
237
- "ndcg_at_3": 0.79456,
238
- "ndcg_at_5": 0.81297,
239
- "ndcg_at_10": 0.82424,
240
- "ndcg_at_20": 0.82919,
241
- "ndcg_at_50": 0.83284,
242
- "ndcg_at_100": 0.83523,
243
- "map_at_1": 0.70717,
244
- "map_at_3": 0.77329,
245
- "map_at_5": 0.78359,
246
- "map_at_10": 0.7884,
247
- "map_at_20": 0.78977,
248
- "map_at_50": 0.79038,
249
- "map_at_100": 0.79059,
250
- "recall_at_1": 0.70717,
251
- "recall_at_3": 0.85601,
252
- "recall_at_5": 0.90036,
253
- "recall_at_10": 0.93439,
254
- "recall_at_20": 0.95383,
255
- "recall_at_50": 0.97205,
256
- "recall_at_100": 0.98663,
257
- "precision_at_1": 0.70717,
258
- "precision_at_3": 0.28534,
259
- "precision_at_5": 0.18007,
260
- "precision_at_10": 0.09344,
261
- "precision_at_20": 0.04769,
262
- "precision_at_50": 0.01944,
263
- "precision_at_100": 0.00987,
264
- "mrr_at_1": 0.7023086269744836,
265
- "mrr_at_3": 0.7717699473471039,
266
- "mrr_at_5": 0.7816727420008102,
267
- "mrr_at_10": 0.7864732203128313,
268
- "mrr_at_20": 0.787759657888834,
269
- "mrr_at_50": 0.788430475412044,
270
- "mrr_at_100": 0.7886237843491343,
271
- "naucs_at_1_max": 0.1976745629949593,
272
- "naucs_at_1_std": -0.07020091579321315,
273
- "naucs_at_1_diff1": 0.8341074480907863,
274
- "naucs_at_3_max": 0.2739593664910223,
275
- "naucs_at_3_std": 0.09719421770368855,
276
- "naucs_at_3_diff1": 0.733605301953241,
277
- "naucs_at_5_max": 0.28947443709217946,
278
- "naucs_at_5_std": 0.1533000171315339,
279
- "naucs_at_5_diff1": 0.6900117830352311,
280
- "naucs_at_10_max": 0.3583991399796331,
281
- "naucs_at_10_std": 0.24841173509752057,
282
- "naucs_at_10_diff1": 0.6368724254679143,
283
- "naucs_at_20_max": 0.3998152332693893,
284
- "naucs_at_20_std": 0.40035275451656677,
285
- "naucs_at_20_diff1": 0.5848768162171684,
286
- "naucs_at_50_max": 0.42687513985337017,
287
- "naucs_at_50_std": 0.41022440172224445,
288
- "naucs_at_50_diff1": 0.6184924487522029,
289
- "naucs_at_100_max": 0.48239198753920115,
290
- "naucs_at_100_std": 0.5542709753617254,
291
- "naucs_at_100_diff1": 0.6801547390328168
292
- },
293
- "vidore/shiftproject_test": {
294
- "ndcg_at_1": 0.83,
295
- "ndcg_at_3": 0.90309,
296
- "ndcg_at_5": 0.91083,
297
- "ndcg_at_10": 0.91439,
298
- "ndcg_at_20": 0.91718,
299
- "ndcg_at_50": 0.91902,
300
- "ndcg_at_100": 0.91902,
301
- "map_at_1": 0.83,
302
- "map_at_3": 0.88667,
303
- "map_at_5": 0.89067,
304
- "map_at_10": 0.89233,
305
- "map_at_20": 0.89324,
306
- "map_at_50": 0.89348,
307
- "map_at_100": 0.89348,
308
- "recall_at_1": 0.83,
309
- "recall_at_3": 0.95,
310
- "recall_at_5": 0.97,
311
- "recall_at_10": 0.98,
312
- "recall_at_20": 0.99,
313
- "recall_at_50": 1.0,
314
- "recall_at_100": 1.0,
315
- "precision_at_1": 0.83,
316
- "precision_at_3": 0.31667,
317
- "precision_at_5": 0.194,
318
- "precision_at_10": 0.098,
319
- "precision_at_20": 0.0495,
320
- "precision_at_50": 0.02,
321
- "precision_at_100": 0.01,
322
- "mrr_at_1": 0.82,
323
- "mrr_at_3": 0.885,
324
- "mrr_at_5": 0.887,
325
- "mrr_at_10": 0.8886666666666666,
326
- "mrr_at_20": 0.8895757575757576,
327
- "mrr_at_50": 0.8898138528138527,
328
- "mrr_at_100": 0.8898138528138527,
329
- "naucs_at_1_max": 0.06597202066523537,
330
- "naucs_at_1_std": -0.5197074360016254,
331
- "naucs_at_1_diff1": 0.6896441632321363,
332
- "naucs_at_3_max": 0.2547152194211014,
333
- "naucs_at_3_std": -0.7438842203548043,
334
- "naucs_at_3_diff1": 0.7722689075630248,
335
- "naucs_at_5_max": 0.3225957049486489,
336
- "naucs_at_5_std": -0.7791783380018631,
337
- "naucs_at_5_diff1": 0.9128540305010848,
338
- "naucs_at_10_max": 0.42250233426704475,
339
- "naucs_at_10_std": -0.2987861811391239,
340
- "naucs_at_10_diff1": 0.8692810457516353,
341
- "naucs_at_20_max": 0.7222222222222276,
342
- "naucs_at_20_std": 0.5541549953314738,
343
- "naucs_at_20_diff1": 0.8692810457516413,
344
- "naucs_at_50_max": null,
345
- "naucs_at_50_std": null,
346
- "naucs_at_50_diff1": null,
347
- "naucs_at_100_max": null,
348
- "naucs_at_100_std": null,
349
- "naucs_at_100_diff1": null
350
- },
351
- "vidore/syntheticDocQA_artificial_intelligence_test": {
352
- "ndcg_at_1": 0.96,
353
- "ndcg_at_3": 0.97893,
354
- "ndcg_at_5": 0.97893,
355
- "ndcg_at_10": 0.98249,
356
- "ndcg_at_20": 0.98249,
357
- "ndcg_at_50": 0.98249,
358
- "ndcg_at_100": 0.98249,
359
- "map_at_1": 0.96,
360
- "map_at_3": 0.975,
361
- "map_at_5": 0.975,
362
- "map_at_10": 0.97667,
363
- "map_at_20": 0.97667,
364
- "map_at_50": 0.97667,
365
- "map_at_100": 0.97667,
366
- "recall_at_1": 0.96,
367
- "recall_at_3": 0.99,
368
- "recall_at_5": 0.99,
369
- "recall_at_10": 1.0,
370
- "recall_at_20": 1.0,
371
- "recall_at_50": 1.0,
372
- "recall_at_100": 1.0,
373
- "precision_at_1": 0.96,
374
- "precision_at_3": 0.33,
375
- "precision_at_5": 0.198,
376
- "precision_at_10": 0.1,
377
- "precision_at_20": 0.05,
378
- "precision_at_50": 0.02,
379
- "precision_at_100": 0.01,
380
- "mrr_at_1": 0.98,
381
- "mrr_at_3": 0.985,
382
- "mrr_at_5": 0.985,
383
- "mrr_at_10": 0.9866666666666667,
384
- "mrr_at_20": 0.9866666666666667,
385
- "mrr_at_50": 0.9866666666666667,
386
- "mrr_at_100": 0.9866666666666667,
387
- "naucs_at_1_max": 0.3437208216620012,
388
- "naucs_at_1_std": -0.1860410830999054,
389
- "naucs_at_1_diff1": 1.0,
390
- "naucs_at_3_max": 0.8692810457516356,
391
- "naucs_at_3_std": -0.5634920634921204,
392
- "naucs_at_3_diff1": 1.0,
393
- "naucs_at_5_max": 0.8692810457516413,
394
- "naucs_at_5_std": -0.5634920634920767,
395
- "naucs_at_5_diff1": 1.0,
396
- "naucs_at_10_max": 1.0,
397
- "naucs_at_10_std": 1.0,
398
- "naucs_at_10_diff1": 1.0,
399
- "naucs_at_20_max": 1.0,
400
- "naucs_at_20_std": 1.0,
401
- "naucs_at_20_diff1": 1.0,
402
- "naucs_at_50_max": null,
403
- "naucs_at_50_std": null,
404
- "naucs_at_50_diff1": null,
405
- "naucs_at_100_max": null,
406
- "naucs_at_100_std": null,
407
- "naucs_at_100_diff1": null
408
- },
409
- "vidore/syntheticDocQA_energy_test": {
410
- "ndcg_at_1": 0.93,
411
- "ndcg_at_3": 0.96024,
412
- "ndcg_at_5": 0.96024,
413
- "ndcg_at_10": 0.96339,
414
- "ndcg_at_20": 0.96618,
415
- "ndcg_at_50": 0.96618,
416
- "ndcg_at_100": 0.96618,
417
- "map_at_1": 0.93,
418
- "map_at_3": 0.95333,
419
- "map_at_5": 0.95333,
420
- "map_at_10": 0.95458,
421
- "map_at_20": 0.95549,
422
- "map_at_50": 0.95549,
423
- "map_at_100": 0.95549,
424
- "recall_at_1": 0.93,
425
- "recall_at_3": 0.98,
426
- "recall_at_5": 0.98,
427
- "recall_at_10": 0.99,
428
- "recall_at_20": 1.0,
429
- "recall_at_50": 1.0,
430
- "recall_at_100": 1.0,
431
- "precision_at_1": 0.93,
432
- "precision_at_3": 0.32667,
433
- "precision_at_5": 0.196,
434
- "precision_at_10": 0.099,
435
- "precision_at_20": 0.05,
436
- "precision_at_50": 0.02,
437
- "precision_at_100": 0.01,
438
- "mrr_at_1": 0.94,
439
- "mrr_at_3": 0.9583333333333333,
440
- "mrr_at_5": 0.9583333333333333,
441
- "mrr_at_10": 0.960873015873016,
442
- "mrr_at_20": 0.960873015873016,
443
- "mrr_at_50": 0.960873015873016,
444
- "mrr_at_100": 0.960873015873016,
445
- "naucs_at_1_max": 0.6919434440442851,
446
- "naucs_at_1_std": -0.4906629318394028,
447
- "naucs_at_1_diff1": 0.9813258636788056,
448
- "naucs_at_3_max": 0.7117180205415458,
449
- "naucs_at_3_std": -1.4458450046685478,
450
- "naucs_at_3_diff1": 1.0,
451
- "naucs_at_5_max": 0.7117180205415541,
452
- "naucs_at_5_std": -1.445845004668519,
453
- "naucs_at_5_diff1": 1.0,
454
- "naucs_at_10_max": 0.8692810457516413,
455
- "naucs_at_10_std": -1.1517273576097316,
456
- "naucs_at_10_diff1": 1.0,
457
- "naucs_at_20_max": 1.0,
458
- "naucs_at_20_std": 1.0,
459
- "naucs_at_20_diff1": 1.0,
460
- "naucs_at_50_max": null,
461
- "naucs_at_50_std": null,
462
- "naucs_at_50_diff1": null,
463
- "naucs_at_100_max": null,
464
- "naucs_at_100_std": null,
465
- "naucs_at_100_diff1": null
466
- },
467
- "vidore/syntheticDocQA_government_reports_test": {
468
- "ndcg_at_1": 0.94,
469
- "ndcg_at_3": 0.97655,
470
- "ndcg_at_5": 0.97655,
471
- "ndcg_at_10": 0.97655,
472
- "ndcg_at_20": 0.97655,
473
- "ndcg_at_50": 0.97655,
474
- "ndcg_at_100": 0.97655,
475
- "map_at_1": 0.94,
476
- "map_at_3": 0.96833,
477
- "map_at_5": 0.96833,
478
- "map_at_10": 0.96833,
479
- "map_at_20": 0.96833,
480
- "map_at_50": 0.96833,
481
- "map_at_100": 0.96833,
482
- "recall_at_1": 0.94,
483
- "recall_at_3": 1.0,
484
- "recall_at_5": 1.0,
485
- "recall_at_10": 1.0,
486
- "recall_at_20": 1.0,
487
- "recall_at_50": 1.0,
488
- "recall_at_100": 1.0,
489
- "precision_at_1": 0.94,
490
- "precision_at_3": 0.33333,
491
- "precision_at_5": 0.2,
492
- "precision_at_10": 0.1,
493
- "precision_at_20": 0.05,
494
- "precision_at_50": 0.02,
495
- "precision_at_100": 0.01,
496
- "mrr_at_1": 0.96,
497
- "mrr_at_3": 0.975,
498
- "mrr_at_5": 0.9775,
499
- "mrr_at_10": 0.9775,
500
- "mrr_at_20": 0.9775,
501
- "mrr_at_50": 0.9775,
502
- "mrr_at_100": 0.9775,
503
- "naucs_at_1_max": 0.7468098350451301,
504
- "naucs_at_1_std": 0.40919701213818827,
505
- "naucs_at_1_diff1": 0.9782135076252712,
506
- "naucs_at_3_max": 1.0,
507
- "naucs_at_3_std": 1.0,
508
- "naucs_at_3_diff1": 1.0,
509
- "naucs_at_5_max": 1.0,
510
- "naucs_at_5_std": 1.0,
511
- "naucs_at_5_diff1": 1.0,
512
- "naucs_at_10_max": 1.0,
513
- "naucs_at_10_std": 1.0,
514
- "naucs_at_10_diff1": 1.0,
515
- "naucs_at_20_max": 1.0,
516
- "naucs_at_20_std": 1.0,
517
- "naucs_at_20_diff1": 1.0,
518
- "naucs_at_50_max": null,
519
- "naucs_at_50_std": null,
520
- "naucs_at_50_diff1": null,
521
- "naucs_at_100_max": null,
522
- "naucs_at_100_std": null,
523
- "naucs_at_100_diff1": null
524
- },
525
- "vidore/syntheticDocQA_healthcare_industry_test": {
526
- "ndcg_at_1": 0.97,
527
- "ndcg_at_3": 0.98893,
528
- "ndcg_at_5": 0.98893,
529
- "ndcg_at_10": 0.98893,
530
- "ndcg_at_20": 0.98893,
531
- "ndcg_at_50": 0.98893,
532
- "ndcg_at_100": 0.98893,
533
- "map_at_1": 0.97,
534
- "map_at_3": 0.985,
535
- "map_at_5": 0.985,
536
- "map_at_10": 0.985,
537
- "map_at_20": 0.985,
538
- "map_at_50": 0.985,
539
- "map_at_100": 0.985,
540
- "recall_at_1": 0.97,
541
- "recall_at_3": 1.0,
542
- "recall_at_5": 1.0,
543
- "recall_at_10": 1.0,
544
- "recall_at_20": 1.0,
545
- "recall_at_50": 1.0,
546
- "recall_at_100": 1.0,
547
- "precision_at_1": 0.97,
548
- "precision_at_3": 0.33333,
549
- "precision_at_5": 0.2,
550
- "precision_at_10": 0.1,
551
- "precision_at_20": 0.05,
552
- "precision_at_50": 0.02,
553
- "precision_at_100": 0.01,
554
- "mrr_at_1": 0.97,
555
- "mrr_at_3": 0.985,
556
- "mrr_at_5": 0.985,
557
- "mrr_at_10": 0.985,
558
- "mrr_at_20": 0.985,
559
- "mrr_at_50": 0.985,
560
- "mrr_at_100": 0.985,
561
- "naucs_at_1_max": 0.5938375350140056,
562
- "naucs_at_1_std": -0.1512605042016779,
563
- "naucs_at_1_diff1": 1.0,
564
- "naucs_at_3_max": 1.0,
565
- "naucs_at_3_std": 1.0,
566
- "naucs_at_3_diff1": 1.0,
567
- "naucs_at_5_max": 1.0,
568
- "naucs_at_5_std": 1.0,
569
- "naucs_at_5_diff1": 1.0,
570
- "naucs_at_10_max": 1.0,
571
- "naucs_at_10_std": 1.0,
572
- "naucs_at_10_diff1": 1.0,
573
- "naucs_at_20_max": 1.0,
574
- "naucs_at_20_std": 1.0,
575
- "naucs_at_20_diff1": 1.0,
576
- "naucs_at_50_max": null,
577
- "naucs_at_50_std": null,
578
- "naucs_at_50_diff1": null,
579
- "naucs_at_100_max": null,
580
- "naucs_at_100_std": null,
581
- "naucs_at_100_diff1": null
582
- },
583
- "vidore/synthetic_mit_biomedical_tissue_interactions_unfiltered": {
584
- "ndcg_at_1": 0.6,
585
- "ndcg_at_3": 0.6151,
586
- "ndcg_at_5": 0.63545,
587
- "ndcg_at_10": 0.67291,
588
- "ndcg_at_20": 0.69552,
589
- "ndcg_at_50": 0.71505,
590
- "ndcg_at_100": 0.72644,
591
- "map_at_1": 0.36564,
592
- "map_at_3": 0.49748,
593
- "map_at_5": 0.53983,
594
- "map_at_10": 0.57966,
595
- "map_at_20": 0.59407,
596
- "map_at_50": 0.60166,
597
- "map_at_100": 0.60419,
598
- "recall_at_1": 0.36564,
599
- "recall_at_3": 0.57915,
600
- "recall_at_5": 0.6723,
601
- "recall_at_10": 0.7796,
602
- "recall_at_20": 0.83839,
603
- "recall_at_50": 0.89828,
604
- "recall_at_100": 0.94039,
605
- "precision_at_1": 0.6,
606
- "precision_at_3": 0.38333,
607
- "precision_at_5": 0.28875,
608
- "precision_at_10": 0.18688,
609
- "precision_at_20": 0.10906,
610
- "precision_at_50": 0.05037,
611
- "precision_at_100": 0.02756,
612
- "mrr_at_1": 0.6125,
613
- "mrr_at_3": 0.7114583333333332,
614
- "mrr_at_5": 0.7258333333333333,
615
- "mrr_at_10": 0.7311706349206349,
616
- "mrr_at_20": 0.7328478057889821,
617
- "mrr_at_50": 0.7335337032248797,
618
- "mrr_at_100": 0.7337362495211759,
619
- "naucs_at_1_max": 0.3196794300979519,
620
- "naucs_at_1_std": -0.06999480558029103,
621
- "naucs_at_1_diff1": 0.46354630454140655,
622
- "naucs_at_3_max": -0.024028225250570488,
623
- "naucs_at_3_std": -0.0772467105431113,
624
- "naucs_at_3_diff1": -0.13384017605040516,
625
- "naucs_at_5_max": -0.1107018755412317,
626
- "naucs_at_5_std": -0.13468600304734307,
627
- "naucs_at_5_diff1": -0.1913870528096573,
628
- "naucs_at_10_max": -0.15104624102495343,
629
- "naucs_at_10_std": -0.11990214904902942,
630
- "naucs_at_10_diff1": -0.27309446189419934,
631
- "naucs_at_20_max": -0.1510467527515919,
632
- "naucs_at_20_std": -0.05158870650850273,
633
- "naucs_at_20_diff1": -0.2855800617041388,
634
- "naucs_at_50_max": -0.189407669514686,
635
- "naucs_at_50_std": 0.011655782821744832,
636
- "naucs_at_50_diff1": -0.29769313630537414,
637
- "naucs_at_100_max": -0.22560114991297742,
638
- "naucs_at_100_std": 0.03455222954387382,
639
- "naucs_at_100_diff1": -0.29629886192096655
640
- },
641
- "vidore/synthetic_economics_macro_economy_2024_filtered_v1.0": {
642
- "ndcg_at_1": 0.62069,
643
- "ndcg_at_3": 0.61762,
644
- "ndcg_at_5": 0.60225,
645
- "ndcg_at_10": 0.58048,
646
- "ndcg_at_20": 0.61347,
647
- "ndcg_at_50": 0.67491,
648
- "ndcg_at_100": 0.71101,
649
- "map_at_1": 0.09096,
650
- "map_at_3": 0.20035,
651
- "map_at_5": 0.26381,
652
- "map_at_10": 0.33202,
653
- "map_at_20": 0.39844,
654
- "map_at_50": 0.45746,
655
- "map_at_100": 0.48541,
656
- "recall_at_1": 0.09096,
657
- "recall_at_3": 0.24139,
658
- "recall_at_5": 0.33438,
659
- "recall_at_10": 0.4587,
660
- "recall_at_20": 0.62591,
661
- "recall_at_50": 0.81242,
662
- "recall_at_100": 0.91777,
663
- "precision_at_1": 0.62069,
664
- "precision_at_3": 0.57471,
665
- "precision_at_5": 0.53448,
666
- "precision_at_10": 0.42414,
667
- "precision_at_20": 0.32672,
668
- "precision_at_50": 0.19759,
669
- "precision_at_100": 0.12862,
670
- "mrr_at_1": 0.603448275862069,
671
- "mrr_at_3": 0.7241379310344828,
672
- "mrr_at_5": 0.7405172413793104,
673
- "mrr_at_10": 0.7462643678160921,
674
- "mrr_at_20": 0.7475906277630417,
675
- "mrr_at_50": 0.7484116458254391,
676
- "mrr_at_100": 0.7484116458254391,
677
- "naucs_at_1_max": 0.18510409805228442,
678
- "naucs_at_1_std": 0.35494696439734424,
679
- "naucs_at_1_diff1": 0.16217400181533045,
680
- "naucs_at_3_max": 0.11476072335324272,
681
- "naucs_at_3_std": 0.14220252935282734,
682
- "naucs_at_3_diff1": 0.20624608835397928,
683
- "naucs_at_5_max": 0.05768772419881633,
684
- "naucs_at_5_std": 0.06310746641396357,
685
- "naucs_at_5_diff1": 0.18987051287290022,
686
- "naucs_at_10_max": 0.0985016982729016,
687
- "naucs_at_10_std": 0.20584586715310207,
688
- "naucs_at_10_diff1": 0.06505841014753395,
689
- "naucs_at_20_max": 0.08004110479748268,
690
- "naucs_at_20_std": 0.287577784204017,
691
- "naucs_at_20_diff1": 0.020551986645709248,
692
- "naucs_at_50_max": 0.014573240638718194,
693
- "naucs_at_50_std": 0.24605332511304584,
694
- "naucs_at_50_diff1": -0.020387827810068312,
695
- "naucs_at_100_max": -0.05010509973449726,
696
- "naucs_at_100_std": 0.1897950634215769,
697
- "naucs_at_100_diff1": -0.014466845102017144
698
- },
699
- "vidore/synthetic_rse_restaurant_filtered_v1.0": {
700
- "ndcg_at_1": 0.52632,
701
- "ndcg_at_3": 0.55585,
702
- "ndcg_at_5": 0.56608,
703
- "ndcg_at_10": 0.60595,
704
- "ndcg_at_20": 0.63951,
705
- "ndcg_at_50": 0.67486,
706
- "ndcg_at_100": 0.68663,
707
- "map_at_1": 0.18937,
708
- "map_at_3": 0.38648,
709
- "map_at_5": 0.42924,
710
- "map_at_10": 0.4756,
711
- "map_at_20": 0.49684,
712
- "map_at_50": 0.51563,
713
- "map_at_100": 0.52215,
714
- "recall_at_1": 0.18937,
715
- "recall_at_3": 0.52147,
716
- "recall_at_5": 0.61387,
717
- "recall_at_10": 0.7448,
718
- "recall_at_20": 0.84958,
719
- "recall_at_50": 0.95384,
720
- "recall_at_100": 0.98246,
721
- "precision_at_1": 0.52632,
722
- "precision_at_3": 0.40351,
723
- "precision_at_5": 0.29825,
724
- "precision_at_10": 0.2,
725
- "precision_at_20": 0.12632,
726
- "precision_at_50": 0.06842,
727
- "precision_at_100": 0.03877,
728
- "mrr_at_1": 0.5263157894736842,
729
- "mrr_at_3": 0.6608187134502922,
730
- "mrr_at_5": 0.6687134502923976,
731
- "mrr_at_10": 0.6770676691729323,
732
- "mrr_at_20": 0.6805936409651578,
733
- "mrr_at_50": 0.6813246351172046,
734
- "mrr_at_100": 0.6813246351172046,
735
- "naucs_at_1_max": -0.3657070379375877,
736
- "naucs_at_1_std": -0.2598454613027199,
737
- "naucs_at_1_diff1": 0.20497205438323887,
738
- "naucs_at_3_max": -0.2760768601040555,
739
- "naucs_at_3_std": -0.19536511254108982,
740
- "naucs_at_3_diff1": 0.12639737194669312,
741
- "naucs_at_5_max": -0.32266979804661855,
742
- "naucs_at_5_std": -0.2321273259469018,
743
- "naucs_at_5_diff1": 0.12201056497848635,
744
- "naucs_at_10_max": -0.31327785677716363,
745
- "naucs_at_10_std": -0.20701857432203374,
746
- "naucs_at_10_diff1": 0.12714449010861775,
747
- "naucs_at_20_max": -0.3057758145014666,
748
- "naucs_at_20_std": -0.19196155860715694,
749
- "naucs_at_20_diff1": 0.004456792889016827,
750
- "naucs_at_50_max": -0.3443751963336487,
751
- "naucs_at_50_std": -0.19916004962508968,
752
- "naucs_at_50_diff1": -0.15313050707770795,
753
- "naucs_at_100_max": -0.33335268769256254,
754
- "naucs_at_100_std": -0.1759902263556841,
755
- "naucs_at_100_diff1": -0.16546750884331984
756
- },
757
- "vidore/synthetic_axa_filtered_v1.0": {
758
- "ndcg_at_1": 0.72222,
759
- "ndcg_at_3": 0.68859,
760
- "ndcg_at_5": 0.6877,
761
- "ndcg_at_10": 0.69829,
762
- "ndcg_at_20": 0.7342,
763
- "ndcg_at_50": 0.77785,
764
- "ndcg_at_100": 0.78996,
765
- "map_at_1": 0.36488,
766
- "map_at_3": 0.46953,
767
- "map_at_5": 0.52392,
768
- "map_at_10": 0.58858,
769
- "map_at_20": 0.62889,
770
- "map_at_50": 0.64917,
771
- "map_at_100": 0.65352,
772
- "recall_at_1": 0.36488,
773
- "recall_at_3": 0.54323,
774
- "recall_at_5": 0.61414,
775
- "recall_at_10": 0.71635,
776
- "recall_at_20": 0.82542,
777
- "recall_at_50": 0.95323,
778
- "recall_at_100": 0.98765,
779
- "precision_at_1": 0.72222,
780
- "precision_at_3": 0.44444,
781
- "precision_at_5": 0.37778,
782
- "precision_at_10": 0.27222,
783
- "precision_at_20": 0.175,
784
- "precision_at_50": 0.08667,
785
- "precision_at_100": 0.04667,
786
- "mrr_at_1": 0.6111111111111112,
787
- "mrr_at_3": 0.7592592592592592,
788
- "mrr_at_5": 0.7592592592592592,
789
- "mrr_at_10": 0.7592592592592592,
790
- "mrr_at_20": 0.7592592592592592,
791
- "mrr_at_50": 0.7611111111111111,
792
- "mrr_at_100": 0.7611111111111111,
793
- "naucs_at_1_max": -0.1072500882788756,
794
- "naucs_at_1_std": -0.07848008527574335,
795
- "naucs_at_1_diff1": 0.3888329697673727,
796
- "naucs_at_3_max": -0.5668751047952342,
797
- "naucs_at_3_std": -0.5329585384567367,
798
- "naucs_at_3_diff1": -0.2021392643633502,
799
- "naucs_at_5_max": -0.5633098595994385,
800
- "naucs_at_5_std": -0.43232123457673266,
801
- "naucs_at_5_diff1": -0.17951311814925686,
802
- "naucs_at_10_max": -0.6374122831555527,
803
- "naucs_at_10_std": -0.43175557593234065,
804
- "naucs_at_10_diff1": -0.31039799211753494,
805
- "naucs_at_20_max": -0.701465591207169,
806
- "naucs_at_20_std": -0.4917500935922029,
807
- "naucs_at_20_diff1": -0.35064529361083185,
808
- "naucs_at_50_max": -0.7021744453459953,
809
- "naucs_at_50_std": -0.4855377059097475,
810
- "naucs_at_50_diff1": -0.36456623920339126,
811
- "naucs_at_100_max": -0.6924863874111336,
812
- "naucs_at_100_std": -0.4863559555556065,
813
- "naucs_at_100_diff1": -0.3608886108131484
814
- },
815
- "vidore/synthetic_rse_restaurant_filtered_v1.0_multilingual": {
816
- "ndcg_at_1": 0.54386,
817
- "ndcg_at_3": 0.53992,
818
- "ndcg_at_5": 0.57161,
819
- "ndcg_at_10": 0.61517,
820
- "ndcg_at_20": 0.64796,
821
- "ndcg_at_50": 0.67915,
822
- "ndcg_at_100": 0.69235,
823
- "map_at_1": 0.22592,
824
- "map_at_3": 0.38229,
825
- "map_at_5": 0.43639,
826
- "map_at_10": 0.48456,
827
- "map_at_20": 0.50644,
828
- "map_at_50": 0.52393,
829
- "map_at_100": 0.53044,
830
- "recall_at_1": 0.22592,
831
- "recall_at_3": 0.48555,
832
- "recall_at_5": 0.61365,
833
- "recall_at_10": 0.75902,
834
- "recall_at_20": 0.86188,
835
- "recall_at_50": 0.94857,
836
- "recall_at_100": 0.98684,
837
- "precision_at_1": 0.54386,
838
- "precision_at_3": 0.3845,
839
- "precision_at_5": 0.30351,
840
- "precision_at_10": 0.20439,
841
- "precision_at_20": 0.12785,
842
- "precision_at_50": 0.06851,
843
- "precision_at_100": 0.03882,
844
- "mrr_at_1": 0.5394736842105263,
845
- "mrr_at_3": 0.6491228070175438,
846
- "mrr_at_5": 0.6675438596491228,
847
- "mrr_at_10": 0.6769945697577275,
848
- "mrr_at_20": 0.6792236734283947,
849
- "mrr_at_50": 0.6797428454113825,
850
- "mrr_at_100": 0.6798197921642295,
851
- "naucs_at_1_max": -0.20674277350895354,
852
- "naucs_at_1_std": -0.12027303922549912,
853
- "naucs_at_1_diff1": 0.23775810754837193,
854
- "naucs_at_3_max": -0.14132383047647284,
855
- "naucs_at_3_std": -0.11240148832069007,
856
- "naucs_at_3_diff1": 0.15033788234126377,
857
- "naucs_at_5_max": -0.17140084599390548,
858
- "naucs_at_5_std": -0.13104605490168167,
859
- "naucs_at_5_diff1": 0.1523799082346645,
860
- "naucs_at_10_max": -0.17604422702000652,
861
- "naucs_at_10_std": -0.1040197021731718,
862
- "naucs_at_10_diff1": 0.141987374687683,
863
- "naucs_at_20_max": -0.18707526779473269,
864
- "naucs_at_20_std": -0.05659957021660996,
865
- "naucs_at_20_diff1": 0.043138658571222205,
866
- "naucs_at_50_max": -0.23552302035441924,
867
- "naucs_at_50_std": -0.05397637299883905,
868
- "naucs_at_50_diff1": -0.09007005759845056,
869
- "naucs_at_100_max": -0.2339022131728518,
870
- "naucs_at_100_std": -0.0193642217972453,
871
- "naucs_at_100_diff1": -0.11400444827044932
872
- },
873
- "vidore/synthetic_axa_filtered_v1.0_multilingual": {
874
- "ndcg_at_1": 0.63889,
875
- "ndcg_at_3": 0.62281,
876
- "ndcg_at_5": 0.60952,
877
- "ndcg_at_10": 0.64318,
878
- "ndcg_at_20": 0.67634,
879
- "ndcg_at_50": 0.71094,
880
- "ndcg_at_100": 0.72844,
881
- "map_at_1": 0.32704,
882
- "map_at_3": 0.41888,
883
- "map_at_5": 0.46563,
884
- "map_at_10": 0.53051,
885
- "map_at_20": 0.56674,
886
- "map_at_50": 0.58314,
887
- "map_at_100": 0.58783,
888
- "recall_at_1": 0.32704,
889
- "recall_at_3": 0.48365,
890
- "recall_at_5": 0.54387,
891
- "recall_at_10": 0.69125,
892
- "recall_at_20": 0.78669,
893
- "recall_at_50": 0.8863,
894
- "recall_at_100": 0.9429,
895
- "precision_at_1": 0.63889,
896
- "precision_at_3": 0.41204,
897
- "precision_at_5": 0.33333,
898
- "precision_at_10": 0.25417,
899
- "precision_at_20": 0.16597,
900
- "precision_at_50": 0.07972,
901
- "precision_at_100": 0.04431,
902
- "mrr_at_1": 0.5972222222222222,
903
- "mrr_at_3": 0.7083333333333333,
904
- "mrr_at_5": 0.7083333333333333,
905
- "mrr_at_10": 0.7178791887125221,
906
- "mrr_at_20": 0.7191418149751484,
907
- "mrr_at_50": 0.7199862392542369,
908
- "mrr_at_100": 0.7201556159480039,
909
- "naucs_at_1_max": 0.11301406077201734,
910
- "naucs_at_1_std": 0.21519921250929616,
911
- "naucs_at_1_diff1": 0.3601399303857268,
912
- "naucs_at_3_max": -0.24927986503179209,
913
- "naucs_at_3_std": -0.09022708366608238,
914
- "naucs_at_3_diff1": 0.04489545233674075,
915
- "naucs_at_5_max": -0.26591050096906066,
916
- "naucs_at_5_std": -0.07265537709306702,
917
- "naucs_at_5_diff1": 0.0014191239058859906,
918
- "naucs_at_10_max": -0.3903220005756808,
919
- "naucs_at_10_std": -0.12521844950880665,
920
- "naucs_at_10_diff1": -0.19712230727571253,
921
- "naucs_at_20_max": -0.45199817313888363,
922
- "naucs_at_20_std": -0.1484667347150115,
923
- "naucs_at_20_diff1": -0.2608757999232997,
924
- "naucs_at_50_max": -0.48614207326501946,
925
- "naucs_at_50_std": -0.15554359778230578,
926
- "naucs_at_50_diff1": -0.27852375257122247,
927
- "naucs_at_100_max": -0.5125082706318165,
928
- "naucs_at_100_std": -0.18550458631758462,
929
- "naucs_at_100_diff1": -0.31194041608707157
930
- },
931
- "vidore/synthetic_mit_biomedical_tissue_interactions_unfiltered_multilingual": {
932
- "ndcg_at_1": 0.58125,
933
- "ndcg_at_3": 0.60975,
934
- "ndcg_at_5": 0.62539,
935
- "ndcg_at_10": 0.65521,
936
- "ndcg_at_20": 0.67922,
937
- "ndcg_at_50": 0.70341,
938
- "ndcg_at_100": 0.71315,
939
- "map_at_1": 0.35357,
940
- "map_at_3": 0.49223,
941
- "map_at_5": 0.5321,
942
- "map_at_10": 0.56549,
943
- "map_at_20": 0.5796,
944
- "map_at_50": 0.58865,
945
- "map_at_100": 0.59103,
946
- "recall_at_1": 0.35357,
947
- "recall_at_3": 0.57487,
948
- "recall_at_5": 0.65905,
949
- "recall_at_10": 0.7508,
950
- "recall_at_20": 0.81705,
951
- "recall_at_50": 0.89072,
952
- "recall_at_100": 0.92568,
953
- "precision_at_1": 0.58125,
954
- "precision_at_3": 0.3849,
955
- "precision_at_5": 0.28719,
956
- "precision_at_10": 0.18125,
957
- "precision_at_20": 0.10578,
958
- "precision_at_50": 0.05062,
959
- "precision_at_100": 0.02748,
960
- "mrr_at_1": 0.5796875,
961
- "mrr_at_3": 0.6901041666666663,
962
- "mrr_at_5": 0.7021354166666661,
963
- "mrr_at_10": 0.7074832589285712,
964
- "mrr_at_20": 0.7102574911812041,
965
- "mrr_at_50": 0.7110110149629919,
966
- "mrr_at_100": 0.7111676465392118,
967
- "naucs_at_1_max": 0.17241551553460638,
968
- "naucs_at_1_std": -0.10458500213424893,
969
- "naucs_at_1_diff1": 0.5014939741528845,
970
- "naucs_at_3_max": 0.04213476105852452,
971
- "naucs_at_3_std": -0.03593819184778826,
972
- "naucs_at_3_diff1": -0.03987788271154801,
973
- "naucs_at_5_max": 0.027250565594662386,
974
- "naucs_at_5_std": -0.037278236776539624,
975
- "naucs_at_5_diff1": -0.1239404049371398,
976
- "naucs_at_10_max": -0.06115387637712348,
977
- "naucs_at_10_std": -0.0718804318785458,
978
- "naucs_at_10_diff1": -0.19295981392132494,
979
- "naucs_at_20_max": -0.09125226002964483,
980
- "naucs_at_20_std": -0.028359299920185887,
981
- "naucs_at_20_diff1": -0.22651248920886707,
982
- "naucs_at_50_max": -0.10766546120682835,
983
- "naucs_at_50_std": 0.03593323121140819,
984
- "naucs_at_50_diff1": -0.25675662871310556,
985
- "naucs_at_100_max": -0.12997916463636278,
986
- "naucs_at_100_std": 0.05375545158818975,
987
- "naucs_at_100_diff1": -0.2582624772102094
988
- },
989
- "vidore/synthetics_economics_macro_economy_2024_filtered_v1.0_multilingual": {
990
- "ndcg_at_1": 0.57759,
991
- "ndcg_at_3": 0.57138,
992
- "ndcg_at_5": 0.55497,
993
- "ndcg_at_10": 0.5473,
994
- "ndcg_at_20": 0.58512,
995
- "ndcg_at_50": 0.65027,
996
- "ndcg_at_100": 0.68902,
997
- "map_at_1": 0.08005,
998
- "map_at_3": 0.17589,
999
- "map_at_5": 0.22976,
1000
- "map_at_10": 0.29906,
1001
- "map_at_20": 0.36451,
1002
- "map_at_50": 0.42404,
1003
- "map_at_100": 0.45273,
1004
- "recall_at_1": 0.08005,
1005
- "recall_at_3": 0.21653,
1006
- "recall_at_5": 0.30793,
1007
- "recall_at_10": 0.43982,
1008
- "recall_at_20": 0.60961,
1009
- "recall_at_50": 0.80111,
1010
- "recall_at_100": 0.91548,
1011
- "precision_at_1": 0.57759,
1012
- "precision_at_3": 0.53592,
1013
- "precision_at_5": 0.49138,
1014
- "precision_at_10": 0.40733,
1015
- "precision_at_20": 0.31832,
1016
- "precision_at_50": 0.19638,
1017
- "precision_at_100": 0.12836,
1018
- "mrr_at_1": 0.5646551724137931,
1019
- "mrr_at_3": 0.694683908045977,
1020
- "mrr_at_5": 0.7136494252873563,
1021
- "mrr_at_10": 0.7207478106185002,
1022
- "mrr_at_20": 0.7223871734108802,
1023
- "mrr_at_50": 0.7225924279264796,
1024
- "mrr_at_100": 0.7225924279264796,
1025
- "naucs_at_1_max": 0.025825981954306243,
1026
- "naucs_at_1_std": 0.06786701290377438,
1027
- "naucs_at_1_diff1": 0.3119241048950317,
1028
- "naucs_at_3_max": 0.0479066957744716,
1029
- "naucs_at_3_std": 0.06557391489213844,
1030
- "naucs_at_3_diff1": 0.23439300856464848,
1031
- "naucs_at_5_max": 0.0517250332191857,
1032
- "naucs_at_5_std": 0.09464648925799282,
1033
- "naucs_at_5_diff1": 0.2254037385021122,
1034
- "naucs_at_10_max": 0.07385165346450225,
1035
- "naucs_at_10_std": 0.14105623461417685,
1036
- "naucs_at_10_diff1": 0.09658147605174039,
1037
- "naucs_at_20_max": 0.04903637832153811,
1038
- "naucs_at_20_std": 0.1590552355815479,
1039
- "naucs_at_20_diff1": 0.028107412938548966,
1040
- "naucs_at_50_max": 0.02938750541507763,
1041
- "naucs_at_50_std": 0.15805354436493257,
1042
- "naucs_at_50_diff1": -0.04958795351145276,
1043
- "naucs_at_100_max": -0.0034893431750791983,
1044
- "naucs_at_100_std": 0.13285693605908278,
1045
- "naucs_at_100_diff1": -0.07289241471567467
1046
- },
1047
- "vidore/restaurant_esg_reports_beir": {
1048
- "ndcg_at_1": 0.66667,
1049
- "ndcg_at_3": 0.62961,
1050
- "ndcg_at_5": 0.65844,
1051
- "ndcg_at_10": 0.70149,
1052
- "ndcg_at_20": 0.72887,
1053
- "ndcg_at_50": 0.75185,
1054
- "ndcg_at_100": 0.75669,
1055
- "map_at_1": 0.47262,
1056
- "map_at_3": 0.55789,
1057
- "map_at_5": 0.59623,
1058
- "map_at_10": 0.62874,
1059
- "map_at_20": 0.64199,
1060
- "map_at_50": 0.64885,
1061
- "map_at_100": 0.65059,
1062
- "recall_at_1": 0.47262,
1063
- "recall_at_3": 0.58302,
1064
- "recall_at_5": 0.68751,
1065
- "recall_at_10": 0.8013,
1066
- "recall_at_20": 0.88308,
1067
- "recall_at_50": 0.9586,
1068
- "recall_at_100": 0.97619,
1069
- "precision_at_1": 0.69231,
1070
- "precision_at_3": 0.33974,
1071
- "precision_at_5": 0.24615,
1072
- "precision_at_10": 0.15577,
1073
- "precision_at_20": 0.09231,
1074
- "precision_at_50": 0.04269,
1075
- "precision_at_100": 0.02288,
1076
- "mrr_at_1": 0.6923076923076923,
1077
- "mrr_at_3": 0.7371794871794872,
1078
- "mrr_at_5": 0.7583333333333333,
1079
- "mrr_at_10": 0.7666666666666665,
1080
- "mrr_at_20": 0.7698942083557468,
1081
- "mrr_at_50": 0.7706954904070289,
1082
- "mrr_at_100": 0.7706954904070289,
1083
- "naucs_at_1_max": 0.21266459227612405,
1084
- "naucs_at_1_std": 0.19096494070335385,
1085
- "naucs_at_1_diff1": 0.49249886565541523,
1086
- "naucs_at_3_max": -0.03430599620876157,
1087
- "naucs_at_3_std": 0.017097041956098673,
1088
- "naucs_at_3_diff1": -0.03264969467214677,
1089
- "naucs_at_5_max": -0.022484350271713836,
1090
- "naucs_at_5_std": -0.0636467385979771,
1091
- "naucs_at_5_diff1": -0.16473803715393007,
1092
- "naucs_at_10_max": -0.07317891510820472,
1093
- "naucs_at_10_std": -0.04140978466752904,
1094
- "naucs_at_10_diff1": -0.26462899584834276,
1095
- "naucs_at_20_max": -0.0627742919035184,
1096
- "naucs_at_20_std": 0.04670746961963372,
1097
- "naucs_at_20_diff1": -0.3704708282580158,
1098
- "naucs_at_50_max": -0.06988684901669139,
1099
- "naucs_at_50_std": 0.005284407101443551,
1100
- "naucs_at_50_diff1": -0.38324540988500305,
1101
- "naucs_at_100_max": -0.11684726414295883,
1102
- "naucs_at_100_std": 0.005824353791349827,
1103
- "naucs_at_100_diff1": -0.3791953702270732
1104
- }
1105
  },
1106
- "metadata": {
1107
- "timestamp": "2025-03-26T12:04:56.582879",
1108
- "vidore_benchmark_version": "5.0.1.dev6+g9e0da63"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1109
  }
1110
  }
 
1
  {
2
+ "vidore/arxivqa_test_subsampled":{
3
+ "ndcg_at_1":0.824,
4
+ "ndcg_at_3":0.86202,
5
+ "ndcg_at_5":0.87442,
6
+ "ndcg_at_10":0.88303,
7
+ "ndcg_at_20":0.88861,
8
+ "ndcg_at_50":0.8927,
9
+ "ndcg_at_100":0.89339,
10
+ "map_at_1":0.824,
11
+ "map_at_3":0.853,
12
+ "map_at_5":0.8599,
13
+ "map_at_10":0.86358,
14
+ "map_at_20":0.86512,
15
+ "map_at_50":0.86583,
16
+ "map_at_100":0.86591,
17
+ "recall_at_1":0.824,
18
+ "recall_at_3":0.888,
19
+ "recall_at_5":0.918,
20
+ "recall_at_10":0.944,
21
+ "recall_at_20":0.966,
22
+ "recall_at_50":0.986,
23
+ "recall_at_100":0.99,
24
+ "precision_at_1":0.824,
25
+ "precision_at_3":0.296,
26
+ "precision_at_5":0.1836,
27
+ "precision_at_10":0.0944,
28
+ "precision_at_20":0.0483,
29
+ "precision_at_50":0.01972,
30
+ "precision_at_100":0.0099,
31
+ "mrr_at_1":0.832,
32
+ "mrr_at_3":0.856,
33
+ "mrr_at_5":0.8632,
34
+ "mrr_at_10":0.86755,
35
+ "mrr_at_20":0.8687646325896324,
36
+ "mrr_at_50":0.8694855987079559,
37
+ "mrr_at_100":0.8695150104726618,
38
+ "naucs_at_1_max":0.8110100305865411,
39
+ "naucs_at_1_std":0.07361011155091818,
40
+ "naucs_at_1_diff1":0.9603893037063689,
41
+ "naucs_at_3_max":0.7977881493506478,
42
+ "naucs_at_3_std":0.013342126623376577,
43
+ "naucs_at_3_diff1":0.9239464962121198,
44
+ "naucs_at_5_max":0.8150463437407489,
45
+ "naucs_at_5_std":0.14904010384641533,
46
+ "naucs_at_5_diff1":0.9183006535947713,
47
+ "naucs_at_10_max":0.8759670534880637,
48
+ "naucs_at_10_std":0.2408463385354136,
49
+ "naucs_at_10_diff1":0.9323062558356668,
50
+ "naucs_at_20_max":0.9013016971494501,
51
+ "naucs_at_20_std":0.4259076179491429,
52
+ "naucs_at_20_diff1":0.9115724721261116,
53
+ "naucs_at_50_max":0.9229691876750605,
54
+ "naucs_at_50_std":0.7222889155662164,
55
+ "naucs_at_50_diff1":0.9019607843137241,
56
+ "naucs_at_100_max":0.8921568627450854,
57
+ "naucs_at_100_std":0.6373482726423866,
58
+ "naucs_at_100_diff1":0.9183006535947666
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
59
  },
60
+ "vidore/docvqa_test_subsampled":{
61
+ "ndcg_at_1":0.52993,
62
+ "ndcg_at_3":0.59967,
63
+ "ndcg_at_5":0.61961,
64
+ "ndcg_at_10":0.63197,
65
+ "ndcg_at_20":0.64596,
66
+ "ndcg_at_50":0.65515,
67
+ "ndcg_at_100":0.66198,
68
+ "map_at_1":0.52993,
69
+ "map_at_3":0.58241,
70
+ "map_at_5":0.59339,
71
+ "map_at_10":0.59817,
72
+ "map_at_20":0.602,
73
+ "map_at_50":0.60345,
74
+ "map_at_100":0.60405,
75
+ "recall_at_1":0.52993,
76
+ "recall_at_3":0.64967,
77
+ "recall_at_5":0.69845,
78
+ "recall_at_10":0.73836,
79
+ "recall_at_20":0.79379,
80
+ "recall_at_50":0.84035,
81
+ "recall_at_100":0.88248,
82
+ "precision_at_1":0.52993,
83
+ "precision_at_3":0.21656,
84
+ "precision_at_5":0.13969,
85
+ "precision_at_10":0.07384,
86
+ "precision_at_20":0.03969,
87
+ "precision_at_50":0.01681,
88
+ "precision_at_100":0.00882,
89
+ "mrr_at_1":0.5277161862527716,
90
+ "mrr_at_3":0.5776053215077607,
91
+ "mrr_at_5":0.5888026607538803,
92
+ "mrr_at_10":0.5944919579065918,
93
+ "mrr_at_20":0.5983219637865657,
94
+ "mrr_at_50":0.5999309966010471,
95
+ "mrr_at_100":0.6005501639541099,
96
+ "naucs_at_1_max":0.37096765728763215,
97
+ "naucs_at_1_std":0.5363118108228696,
98
+ "naucs_at_1_diff1":0.9084586513989499,
99
+ "naucs_at_3_max":0.28536364371043943,
100
+ "naucs_at_3_std":0.656382780997437,
101
+ "naucs_at_3_diff1":0.8754285629546056,
102
+ "naucs_at_5_max":0.26490606879524303,
103
+ "naucs_at_5_std":0.6794242484186521,
104
+ "naucs_at_5_diff1":0.8670235151833391,
105
+ "naucs_at_10_max":0.17906145941266727,
106
+ "naucs_at_10_std":0.71951378124067,
107
+ "naucs_at_10_diff1":0.8623037540857623,
108
+ "naucs_at_20_max":0.039717430802327786,
109
+ "naucs_at_20_std":0.77907518789845,
110
+ "naucs_at_20_diff1":0.8711346514573685,
111
+ "naucs_at_50_max":-0.06591984153859125,
112
+ "naucs_at_50_std":0.8944335077781369,
113
+ "naucs_at_50_diff1":0.872338054901137,
114
+ "naucs_at_100_max":-0.18390488993971363,
115
+ "naucs_at_100_std":0.9432351742842897,
116
+ "naucs_at_100_diff1":0.8529357662557685
117
+ },
118
+ "vidore/infovqa_test_subsampled":{
119
+ "ndcg_at_1":0.89069,
120
+ "ndcg_at_3":0.9279,
121
+ "ndcg_at_5":0.93217,
122
+ "ndcg_at_10":0.93547,
123
+ "ndcg_at_20":0.9379,
124
+ "ndcg_at_50":0.93869,
125
+ "ndcg_at_100":0.93902,
126
+ "map_at_1":0.89069,
127
+ "map_at_3":0.91903,
128
+ "map_at_5":0.92146,
129
+ "map_at_10":0.92284,
130
+ "map_at_20":0.92344,
131
+ "map_at_50":0.92356,
132
+ "map_at_100":0.92359,
133
+ "recall_at_1":0.89069,
134
+ "recall_at_3":0.95344,
135
+ "recall_at_5":0.96356,
136
+ "recall_at_10":0.97368,
137
+ "recall_at_20":0.98381,
138
+ "recall_at_50":0.98785,
139
+ "recall_at_100":0.98988,
140
+ "precision_at_1":0.89069,
141
+ "precision_at_3":0.31781,
142
+ "precision_at_5":0.19271,
143
+ "precision_at_10":0.09737,
144
+ "precision_at_20":0.04919,
145
+ "precision_at_50":0.01976,
146
+ "precision_at_100":0.0099,
147
+ "mrr_at_1":0.8866396761133604,
148
+ "mrr_at_3":0.915991902834008,
149
+ "mrr_at_5":0.9190283400809716,
150
+ "mrr_at_10":0.9202091767881241,
151
+ "mrr_at_20":0.9207680541852368,
152
+ "mrr_at_50":0.9210783259706008,
153
+ "mrr_at_100":0.9211072444205719,
154
+ "naucs_at_1_max":0.6570120332617708,
155
+ "naucs_at_1_std":0.027148367339034946,
156
+ "naucs_at_1_diff1":0.954693725587737,
157
+ "naucs_at_3_max":0.8518572112090398,
158
+ "naucs_at_3_std":0.5033227123520332,
159
+ "naucs_at_3_diff1":0.9410604334985626,
160
+ "naucs_at_5_max":0.9198784015441375,
161
+ "naucs_at_5_std":0.6599441606302139,
162
+ "naucs_at_5_diff1":0.9628033833359825,
163
+ "naucs_at_10_max":0.9585432580086493,
164
+ "naucs_at_10_std":0.7697000086081518,
165
+ "naucs_at_10_diff1":1.0,
166
+ "naucs_at_20_max":0.9673496364838108,
167
+ "naucs_at_20_std":0.8687019487486011,
168
+ "naucs_at_20_diff1":1.0,
169
+ "naucs_at_50_max":0.9564661819783937,
170
+ "naucs_at_50_std":0.9319439680295378,
171
+ "naucs_at_50_diff1":1.0,
172
+ "naucs_at_100_max":0.9477594183740937,
173
+ "naucs_at_100_std":0.9183327616354471,
174
+ "naucs_at_100_diff1":1.0
175
+ },
176
+ "vidore/tabfquad_test_subsampled":{
177
+ "ndcg_at_1":0.89286,
178
+ "ndcg_at_3":0.93962,
179
+ "ndcg_at_5":0.94408,
180
+ "ndcg_at_10":0.94894,
181
+ "ndcg_at_20":0.94977,
182
+ "ndcg_at_50":0.94977,
183
+ "ndcg_at_100":0.94977,
184
+ "map_at_1":0.89286,
185
+ "map_at_3":0.92857,
186
+ "map_at_5":0.93107,
187
+ "map_at_10":0.93322,
188
+ "map_at_20":0.93341,
189
+ "map_at_50":0.93341,
190
+ "map_at_100":0.93341,
191
+ "recall_at_1":0.89286,
192
+ "recall_at_3":0.97143,
193
+ "recall_at_5":0.98214,
194
+ "recall_at_10":0.99643,
195
+ "recall_at_20":1.0,
196
+ "recall_at_50":1.0,
197
+ "recall_at_100":1.0,
198
+ "precision_at_1":0.89286,
199
+ "precision_at_3":0.32381,
200
+ "precision_at_5":0.19643,
201
+ "precision_at_10":0.09964,
202
+ "precision_at_20":0.05,
203
+ "precision_at_50":0.02,
204
+ "precision_at_100":0.01,
205
+ "mrr_at_1":0.8964285714285715,
206
+ "mrr_at_3":0.930952380952381,
207
+ "mrr_at_5":0.9336309523809524,
208
+ "mrr_at_10":0.9357780612244897,
209
+ "mrr_at_20":0.9359660311493018,
210
+ "mrr_at_50":0.9359660311493018,
211
+ "mrr_at_100":0.9359660311493018,
212
+ "naucs_at_1_max":0.589419152276295,
213
+ "naucs_at_1_std":0.25799058084772386,
214
+ "naucs_at_1_diff1":0.9168759811616957,
215
+ "naucs_at_3_max":0.8952497665732961,
216
+ "naucs_at_3_std":0.5145891690009315,
217
+ "naucs_at_3_diff1":0.8978758169934691,
218
+ "naucs_at_5_max":0.8585434173669502,
219
+ "naucs_at_5_std":0.6536881419234349,
220
+ "naucs_at_5_diff1":0.8627450980392123,
221
+ "naucs_at_10_max":1.0,
222
+ "naucs_at_10_std":1.0,
223
+ "naucs_at_10_diff1":0.72222222222224,
224
+ "naucs_at_20_max":1.0,
225
+ "naucs_at_20_std":1.0,
226
+ "naucs_at_20_diff1":1.0,
227
+ "naucs_at_50_max":1.0,
228
+ "naucs_at_50_std":1.0,
229
+ "naucs_at_50_diff1":1.0,
230
+ "naucs_at_100_max":1.0,
231
+ "naucs_at_100_std":1.0,
232
+ "naucs_at_100_diff1":1.0
233
+ },
234
+ "vidore/tatdqa_test":{
235
+ "ndcg_at_1":0.70717,
236
+ "ndcg_at_3":0.79456,
237
+ "ndcg_at_5":0.81297,
238
+ "ndcg_at_10":0.82424,
239
+ "ndcg_at_20":0.82919,
240
+ "ndcg_at_50":0.83284,
241
+ "ndcg_at_100":0.83523,
242
+ "map_at_1":0.70717,
243
+ "map_at_3":0.77329,
244
+ "map_at_5":0.78359,
245
+ "map_at_10":0.7884,
246
+ "map_at_20":0.78977,
247
+ "map_at_50":0.79038,
248
+ "map_at_100":0.79059,
249
+ "recall_at_1":0.70717,
250
+ "recall_at_3":0.85601,
251
+ "recall_at_5":0.90036,
252
+ "recall_at_10":0.93439,
253
+ "recall_at_20":0.95383,
254
+ "recall_at_50":0.97205,
255
+ "recall_at_100":0.98663,
256
+ "precision_at_1":0.70717,
257
+ "precision_at_3":0.28534,
258
+ "precision_at_5":0.18007,
259
+ "precision_at_10":0.09344,
260
+ "precision_at_20":0.04769,
261
+ "precision_at_50":0.01944,
262
+ "precision_at_100":0.00987,
263
+ "mrr_at_1":0.7023086269744836,
264
+ "mrr_at_3":0.7717699473471039,
265
+ "mrr_at_5":0.7816727420008102,
266
+ "mrr_at_10":0.7864732203128313,
267
+ "mrr_at_20":0.787759657888834,
268
+ "mrr_at_50":0.788430475412044,
269
+ "mrr_at_100":0.7886237843491343,
270
+ "naucs_at_1_max":0.1976745629949593,
271
+ "naucs_at_1_std":-0.07020091579321315,
272
+ "naucs_at_1_diff1":0.8341074480907863,
273
+ "naucs_at_3_max":0.2739593664910223,
274
+ "naucs_at_3_std":0.09719421770368855,
275
+ "naucs_at_3_diff1":0.733605301953241,
276
+ "naucs_at_5_max":0.28947443709217946,
277
+ "naucs_at_5_std":0.1533000171315339,
278
+ "naucs_at_5_diff1":0.6900117830352311,
279
+ "naucs_at_10_max":0.3583991399796331,
280
+ "naucs_at_10_std":0.24841173509752057,
281
+ "naucs_at_10_diff1":0.6368724254679143,
282
+ "naucs_at_20_max":0.3998152332693893,
283
+ "naucs_at_20_std":0.40035275451656677,
284
+ "naucs_at_20_diff1":0.5848768162171684,
285
+ "naucs_at_50_max":0.42687513985337017,
286
+ "naucs_at_50_std":0.41022440172224445,
287
+ "naucs_at_50_diff1":0.6184924487522029,
288
+ "naucs_at_100_max":0.48239198753920115,
289
+ "naucs_at_100_std":0.5542709753617254,
290
+ "naucs_at_100_diff1":0.6801547390328168
291
+ },
292
+ "vidore/shiftproject_test":{
293
+ "ndcg_at_1":0.83,
294
+ "ndcg_at_3":0.90309,
295
+ "ndcg_at_5":0.91083,
296
+ "ndcg_at_10":0.91439,
297
+ "ndcg_at_20":0.91718,
298
+ "ndcg_at_50":0.91902,
299
+ "ndcg_at_100":0.91902,
300
+ "map_at_1":0.83,
301
+ "map_at_3":0.88667,
302
+ "map_at_5":0.89067,
303
+ "map_at_10":0.89233,
304
+ "map_at_20":0.89324,
305
+ "map_at_50":0.89348,
306
+ "map_at_100":0.89348,
307
+ "recall_at_1":0.83,
308
+ "recall_at_3":0.95,
309
+ "recall_at_5":0.97,
310
+ "recall_at_10":0.98,
311
+ "recall_at_20":0.99,
312
+ "recall_at_50":1.0,
313
+ "recall_at_100":1.0,
314
+ "precision_at_1":0.83,
315
+ "precision_at_3":0.31667,
316
+ "precision_at_5":0.194,
317
+ "precision_at_10":0.098,
318
+ "precision_at_20":0.0495,
319
+ "precision_at_50":0.02,
320
+ "precision_at_100":0.01,
321
+ "mrr_at_1":0.82,
322
+ "mrr_at_3":0.885,
323
+ "mrr_at_5":0.887,
324
+ "mrr_at_10":0.8886666666666666,
325
+ "mrr_at_20":0.8895757575757576,
326
+ "mrr_at_50":0.8898138528138527,
327
+ "mrr_at_100":0.8898138528138527,
328
+ "naucs_at_1_max":0.06597202066523537,
329
+ "naucs_at_1_std":-0.5197074360016254,
330
+ "naucs_at_1_diff1":0.6896441632321363,
331
+ "naucs_at_3_max":0.2547152194211014,
332
+ "naucs_at_3_std":-0.7438842203548043,
333
+ "naucs_at_3_diff1":0.7722689075630248,
334
+ "naucs_at_5_max":0.3225957049486489,
335
+ "naucs_at_5_std":-0.7791783380018631,
336
+ "naucs_at_5_diff1":0.9128540305010848,
337
+ "naucs_at_10_max":0.42250233426704475,
338
+ "naucs_at_10_std":-0.2987861811391239,
339
+ "naucs_at_10_diff1":0.8692810457516353,
340
+ "naucs_at_20_max":0.7222222222222276,
341
+ "naucs_at_20_std":0.5541549953314738,
342
+ "naucs_at_20_diff1":0.8692810457516413,
343
+ "naucs_at_50_max":null,
344
+ "naucs_at_50_std":null,
345
+ "naucs_at_50_diff1":null,
346
+ "naucs_at_100_max":null,
347
+ "naucs_at_100_std":null,
348
+ "naucs_at_100_diff1":null
349
+ },
350
+ "vidore/syntheticDocQA_artificial_intelligence_test":{
351
+ "ndcg_at_1":0.96,
352
+ "ndcg_at_3":0.97893,
353
+ "ndcg_at_5":0.97893,
354
+ "ndcg_at_10":0.98249,
355
+ "ndcg_at_20":0.98249,
356
+ "ndcg_at_50":0.98249,
357
+ "ndcg_at_100":0.98249,
358
+ "map_at_1":0.96,
359
+ "map_at_3":0.975,
360
+ "map_at_5":0.975,
361
+ "map_at_10":0.97667,
362
+ "map_at_20":0.97667,
363
+ "map_at_50":0.97667,
364
+ "map_at_100":0.97667,
365
+ "recall_at_1":0.96,
366
+ "recall_at_3":0.99,
367
+ "recall_at_5":0.99,
368
+ "recall_at_10":1.0,
369
+ "recall_at_20":1.0,
370
+ "recall_at_50":1.0,
371
+ "recall_at_100":1.0,
372
+ "precision_at_1":0.96,
373
+ "precision_at_3":0.33,
374
+ "precision_at_5":0.198,
375
+ "precision_at_10":0.1,
376
+ "precision_at_20":0.05,
377
+ "precision_at_50":0.02,
378
+ "precision_at_100":0.01,
379
+ "mrr_at_1":0.98,
380
+ "mrr_at_3":0.985,
381
+ "mrr_at_5":0.985,
382
+ "mrr_at_10":0.9866666666666667,
383
+ "mrr_at_20":0.9866666666666667,
384
+ "mrr_at_50":0.9866666666666667,
385
+ "mrr_at_100":0.9866666666666667,
386
+ "naucs_at_1_max":0.3437208216620012,
387
+ "naucs_at_1_std":-0.1860410830999054,
388
+ "naucs_at_1_diff1":1.0,
389
+ "naucs_at_3_max":0.8692810457516356,
390
+ "naucs_at_3_std":-0.5634920634921204,
391
+ "naucs_at_3_diff1":1.0,
392
+ "naucs_at_5_max":0.8692810457516413,
393
+ "naucs_at_5_std":-0.5634920634920767,
394
+ "naucs_at_5_diff1":1.0,
395
+ "naucs_at_10_max":1.0,
396
+ "naucs_at_10_std":1.0,
397
+ "naucs_at_10_diff1":1.0,
398
+ "naucs_at_20_max":1.0,
399
+ "naucs_at_20_std":1.0,
400
+ "naucs_at_20_diff1":1.0,
401
+ "naucs_at_50_max":null,
402
+ "naucs_at_50_std":null,
403
+ "naucs_at_50_diff1":null,
404
+ "naucs_at_100_max":null,
405
+ "naucs_at_100_std":null,
406
+ "naucs_at_100_diff1":null
407
+ },
408
+ "vidore/syntheticDocQA_energy_test":{
409
+ "ndcg_at_1":0.93,
410
+ "ndcg_at_3":0.96024,
411
+ "ndcg_at_5":0.96024,
412
+ "ndcg_at_10":0.96339,
413
+ "ndcg_at_20":0.96618,
414
+ "ndcg_at_50":0.96618,
415
+ "ndcg_at_100":0.96618,
416
+ "map_at_1":0.93,
417
+ "map_at_3":0.95333,
418
+ "map_at_5":0.95333,
419
+ "map_at_10":0.95458,
420
+ "map_at_20":0.95549,
421
+ "map_at_50":0.95549,
422
+ "map_at_100":0.95549,
423
+ "recall_at_1":0.93,
424
+ "recall_at_3":0.98,
425
+ "recall_at_5":0.98,
426
+ "recall_at_10":0.99,
427
+ "recall_at_20":1.0,
428
+ "recall_at_50":1.0,
429
+ "recall_at_100":1.0,
430
+ "precision_at_1":0.93,
431
+ "precision_at_3":0.32667,
432
+ "precision_at_5":0.196,
433
+ "precision_at_10":0.099,
434
+ "precision_at_20":0.05,
435
+ "precision_at_50":0.02,
436
+ "precision_at_100":0.01,
437
+ "mrr_at_1":0.94,
438
+ "mrr_at_3":0.9583333333333333,
439
+ "mrr_at_5":0.9583333333333333,
440
+ "mrr_at_10":0.960873015873016,
441
+ "mrr_at_20":0.960873015873016,
442
+ "mrr_at_50":0.960873015873016,
443
+ "mrr_at_100":0.960873015873016,
444
+ "naucs_at_1_max":0.6919434440442851,
445
+ "naucs_at_1_std":-0.4906629318394028,
446
+ "naucs_at_1_diff1":0.9813258636788056,
447
+ "naucs_at_3_max":0.7117180205415458,
448
+ "naucs_at_3_std":-1.4458450046685478,
449
+ "naucs_at_3_diff1":1.0,
450
+ "naucs_at_5_max":0.7117180205415541,
451
+ "naucs_at_5_std":-1.445845004668519,
452
+ "naucs_at_5_diff1":1.0,
453
+ "naucs_at_10_max":0.8692810457516413,
454
+ "naucs_at_10_std":-1.1517273576097316,
455
+ "naucs_at_10_diff1":1.0,
456
+ "naucs_at_20_max":1.0,
457
+ "naucs_at_20_std":1.0,
458
+ "naucs_at_20_diff1":1.0,
459
+ "naucs_at_50_max":null,
460
+ "naucs_at_50_std":null,
461
+ "naucs_at_50_diff1":null,
462
+ "naucs_at_100_max":null,
463
+ "naucs_at_100_std":null,
464
+ "naucs_at_100_diff1":null
465
+ },
466
+ "vidore/syntheticDocQA_government_reports_test":{
467
+ "ndcg_at_1":0.94,
468
+ "ndcg_at_3":0.97655,
469
+ "ndcg_at_5":0.97655,
470
+ "ndcg_at_10":0.97655,
471
+ "ndcg_at_20":0.97655,
472
+ "ndcg_at_50":0.97655,
473
+ "ndcg_at_100":0.97655,
474
+ "map_at_1":0.94,
475
+ "map_at_3":0.96833,
476
+ "map_at_5":0.96833,
477
+ "map_at_10":0.96833,
478
+ "map_at_20":0.96833,
479
+ "map_at_50":0.96833,
480
+ "map_at_100":0.96833,
481
+ "recall_at_1":0.94,
482
+ "recall_at_3":1.0,
483
+ "recall_at_5":1.0,
484
+ "recall_at_10":1.0,
485
+ "recall_at_20":1.0,
486
+ "recall_at_50":1.0,
487
+ "recall_at_100":1.0,
488
+ "precision_at_1":0.94,
489
+ "precision_at_3":0.33333,
490
+ "precision_at_5":0.2,
491
+ "precision_at_10":0.1,
492
+ "precision_at_20":0.05,
493
+ "precision_at_50":0.02,
494
+ "precision_at_100":0.01,
495
+ "mrr_at_1":0.96,
496
+ "mrr_at_3":0.975,
497
+ "mrr_at_5":0.9775,
498
+ "mrr_at_10":0.9775,
499
+ "mrr_at_20":0.9775,
500
+ "mrr_at_50":0.9775,
501
+ "mrr_at_100":0.9775,
502
+ "naucs_at_1_max":0.7468098350451301,
503
+ "naucs_at_1_std":0.40919701213818827,
504
+ "naucs_at_1_diff1":0.9782135076252712,
505
+ "naucs_at_3_max":1.0,
506
+ "naucs_at_3_std":1.0,
507
+ "naucs_at_3_diff1":1.0,
508
+ "naucs_at_5_max":1.0,
509
+ "naucs_at_5_std":1.0,
510
+ "naucs_at_5_diff1":1.0,
511
+ "naucs_at_10_max":1.0,
512
+ "naucs_at_10_std":1.0,
513
+ "naucs_at_10_diff1":1.0,
514
+ "naucs_at_20_max":1.0,
515
+ "naucs_at_20_std":1.0,
516
+ "naucs_at_20_diff1":1.0,
517
+ "naucs_at_50_max":null,
518
+ "naucs_at_50_std":null,
519
+ "naucs_at_50_diff1":null,
520
+ "naucs_at_100_max":null,
521
+ "naucs_at_100_std":null,
522
+ "naucs_at_100_diff1":null
523
+ },
524
+ "vidore/syntheticDocQA_healthcare_industry_test":{
525
+ "ndcg_at_1":0.97,
526
+ "ndcg_at_3":0.98893,
527
+ "ndcg_at_5":0.98893,
528
+ "ndcg_at_10":0.98893,
529
+ "ndcg_at_20":0.98893,
530
+ "ndcg_at_50":0.98893,
531
+ "ndcg_at_100":0.98893,
532
+ "map_at_1":0.97,
533
+ "map_at_3":0.985,
534
+ "map_at_5":0.985,
535
+ "map_at_10":0.985,
536
+ "map_at_20":0.985,
537
+ "map_at_50":0.985,
538
+ "map_at_100":0.985,
539
+ "recall_at_1":0.97,
540
+ "recall_at_3":1.0,
541
+ "recall_at_5":1.0,
542
+ "recall_at_10":1.0,
543
+ "recall_at_20":1.0,
544
+ "recall_at_50":1.0,
545
+ "recall_at_100":1.0,
546
+ "precision_at_1":0.97,
547
+ "precision_at_3":0.33333,
548
+ "precision_at_5":0.2,
549
+ "precision_at_10":0.1,
550
+ "precision_at_20":0.05,
551
+ "precision_at_50":0.02,
552
+ "precision_at_100":0.01,
553
+ "mrr_at_1":0.97,
554
+ "mrr_at_3":0.985,
555
+ "mrr_at_5":0.985,
556
+ "mrr_at_10":0.985,
557
+ "mrr_at_20":0.985,
558
+ "mrr_at_50":0.985,
559
+ "mrr_at_100":0.985,
560
+ "naucs_at_1_max":0.5938375350140056,
561
+ "naucs_at_1_std":-0.1512605042016779,
562
+ "naucs_at_1_diff1":1.0,
563
+ "naucs_at_3_max":1.0,
564
+ "naucs_at_3_std":1.0,
565
+ "naucs_at_3_diff1":1.0,
566
+ "naucs_at_5_max":1.0,
567
+ "naucs_at_5_std":1.0,
568
+ "naucs_at_5_diff1":1.0,
569
+ "naucs_at_10_max":1.0,
570
+ "naucs_at_10_std":1.0,
571
+ "naucs_at_10_diff1":1.0,
572
+ "naucs_at_20_max":1.0,
573
+ "naucs_at_20_std":1.0,
574
+ "naucs_at_20_diff1":1.0,
575
+ "naucs_at_50_max":null,
576
+ "naucs_at_50_std":null,
577
+ "naucs_at_50_diff1":null,
578
+ "naucs_at_100_max":null,
579
+ "naucs_at_100_std":null,
580
+ "naucs_at_100_diff1":null
581
+ },
582
+ "vidore/synthetic_mit_biomedical_tissue_interactions_unfiltered":{
583
+ "ndcg_at_1":0.6,
584
+ "ndcg_at_3":0.6151,
585
+ "ndcg_at_5":0.63545,
586
+ "ndcg_at_10":0.67291,
587
+ "ndcg_at_20":0.69552,
588
+ "ndcg_at_50":0.71505,
589
+ "ndcg_at_100":0.72644,
590
+ "map_at_1":0.36564,
591
+ "map_at_3":0.49748,
592
+ "map_at_5":0.53983,
593
+ "map_at_10":0.57966,
594
+ "map_at_20":0.59407,
595
+ "map_at_50":0.60166,
596
+ "map_at_100":0.60419,
597
+ "recall_at_1":0.36564,
598
+ "recall_at_3":0.57915,
599
+ "recall_at_5":0.6723,
600
+ "recall_at_10":0.7796,
601
+ "recall_at_20":0.83839,
602
+ "recall_at_50":0.89828,
603
+ "recall_at_100":0.94039,
604
+ "precision_at_1":0.6,
605
+ "precision_at_3":0.38333,
606
+ "precision_at_5":0.28875,
607
+ "precision_at_10":0.18688,
608
+ "precision_at_20":0.10906,
609
+ "precision_at_50":0.05037,
610
+ "precision_at_100":0.02756,
611
+ "mrr_at_1":0.6125,
612
+ "mrr_at_3":0.7114583333333332,
613
+ "mrr_at_5":0.7258333333333333,
614
+ "mrr_at_10":0.7311706349206349,
615
+ "mrr_at_20":0.7328478057889821,
616
+ "mrr_at_50":0.7335337032248797,
617
+ "mrr_at_100":0.7337362495211759,
618
+ "naucs_at_1_max":0.3196794300979519,
619
+ "naucs_at_1_std":-0.06999480558029103,
620
+ "naucs_at_1_diff1":0.46354630454140655,
621
+ "naucs_at_3_max":-0.024028225250570488,
622
+ "naucs_at_3_std":-0.0772467105431113,
623
+ "naucs_at_3_diff1":-0.13384017605040516,
624
+ "naucs_at_5_max":-0.1107018755412317,
625
+ "naucs_at_5_std":-0.13468600304734307,
626
+ "naucs_at_5_diff1":-0.1913870528096573,
627
+ "naucs_at_10_max":-0.15104624102495343,
628
+ "naucs_at_10_std":-0.11990214904902942,
629
+ "naucs_at_10_diff1":-0.27309446189419934,
630
+ "naucs_at_20_max":-0.1510467527515919,
631
+ "naucs_at_20_std":-0.05158870650850273,
632
+ "naucs_at_20_diff1":-0.2855800617041388,
633
+ "naucs_at_50_max":-0.189407669514686,
634
+ "naucs_at_50_std":0.011655782821744832,
635
+ "naucs_at_50_diff1":-0.29769313630537414,
636
+ "naucs_at_100_max":-0.22560114991297742,
637
+ "naucs_at_100_std":0.03455222954387382,
638
+ "naucs_at_100_diff1":-0.29629886192096655
639
+ },
640
+ "vidore/synthetic_economics_macro_economy_2024_filtered_v1.0":{
641
+ "ndcg_at_1":0.62069,
642
+ "ndcg_at_3":0.61762,
643
+ "ndcg_at_5":0.60225,
644
+ "ndcg_at_10":0.58048,
645
+ "ndcg_at_20":0.61347,
646
+ "ndcg_at_50":0.67491,
647
+ "ndcg_at_100":0.71101,
648
+ "map_at_1":0.09096,
649
+ "map_at_3":0.20035,
650
+ "map_at_5":0.26381,
651
+ "map_at_10":0.33202,
652
+ "map_at_20":0.39844,
653
+ "map_at_50":0.45746,
654
+ "map_at_100":0.48541,
655
+ "recall_at_1":0.09096,
656
+ "recall_at_3":0.24139,
657
+ "recall_at_5":0.33438,
658
+ "recall_at_10":0.4587,
659
+ "recall_at_20":0.62591,
660
+ "recall_at_50":0.81242,
661
+ "recall_at_100":0.91777,
662
+ "precision_at_1":0.62069,
663
+ "precision_at_3":0.57471,
664
+ "precision_at_5":0.53448,
665
+ "precision_at_10":0.42414,
666
+ "precision_at_20":0.32672,
667
+ "precision_at_50":0.19759,
668
+ "precision_at_100":0.12862,
669
+ "mrr_at_1":0.603448275862069,
670
+ "mrr_at_3":0.7241379310344828,
671
+ "mrr_at_5":0.7405172413793104,
672
+ "mrr_at_10":0.7462643678160921,
673
+ "mrr_at_20":0.7475906277630417,
674
+ "mrr_at_50":0.7484116458254391,
675
+ "mrr_at_100":0.7484116458254391,
676
+ "naucs_at_1_max":0.18510409805228442,
677
+ "naucs_at_1_std":0.35494696439734424,
678
+ "naucs_at_1_diff1":0.16217400181533045,
679
+ "naucs_at_3_max":0.11476072335324272,
680
+ "naucs_at_3_std":0.14220252935282734,
681
+ "naucs_at_3_diff1":0.20624608835397928,
682
+ "naucs_at_5_max":0.05768772419881633,
683
+ "naucs_at_5_std":0.06310746641396357,
684
+ "naucs_at_5_diff1":0.18987051287290022,
685
+ "naucs_at_10_max":0.0985016982729016,
686
+ "naucs_at_10_std":0.20584586715310207,
687
+ "naucs_at_10_diff1":0.06505841014753395,
688
+ "naucs_at_20_max":0.08004110479748268,
689
+ "naucs_at_20_std":0.287577784204017,
690
+ "naucs_at_20_diff1":0.020551986645709248,
691
+ "naucs_at_50_max":0.014573240638718194,
692
+ "naucs_at_50_std":0.24605332511304584,
693
+ "naucs_at_50_diff1":-0.020387827810068312,
694
+ "naucs_at_100_max":-0.05010509973449726,
695
+ "naucs_at_100_std":0.1897950634215769,
696
+ "naucs_at_100_diff1":-0.014466845102017144
697
+ },
698
+ "vidore/synthetic_rse_restaurant_filtered_v1.0":{
699
+ "ndcg_at_1":0.52632,
700
+ "ndcg_at_3":0.55585,
701
+ "ndcg_at_5":0.56608,
702
+ "ndcg_at_10":0.60595,
703
+ "ndcg_at_20":0.63951,
704
+ "ndcg_at_50":0.67486,
705
+ "ndcg_at_100":0.68663,
706
+ "map_at_1":0.18937,
707
+ "map_at_3":0.38648,
708
+ "map_at_5":0.42924,
709
+ "map_at_10":0.4756,
710
+ "map_at_20":0.49684,
711
+ "map_at_50":0.51563,
712
+ "map_at_100":0.52215,
713
+ "recall_at_1":0.18937,
714
+ "recall_at_3":0.52147,
715
+ "recall_at_5":0.61387,
716
+ "recall_at_10":0.7448,
717
+ "recall_at_20":0.84958,
718
+ "recall_at_50":0.95384,
719
+ "recall_at_100":0.98246,
720
+ "precision_at_1":0.52632,
721
+ "precision_at_3":0.40351,
722
+ "precision_at_5":0.29825,
723
+ "precision_at_10":0.2,
724
+ "precision_at_20":0.12632,
725
+ "precision_at_50":0.06842,
726
+ "precision_at_100":0.03877,
727
+ "mrr_at_1":0.5263157894736842,
728
+ "mrr_at_3":0.6608187134502922,
729
+ "mrr_at_5":0.6687134502923976,
730
+ "mrr_at_10":0.6770676691729323,
731
+ "mrr_at_20":0.6805936409651578,
732
+ "mrr_at_50":0.6813246351172046,
733
+ "mrr_at_100":0.6813246351172046,
734
+ "naucs_at_1_max":-0.3657070379375877,
735
+ "naucs_at_1_std":-0.2598454613027199,
736
+ "naucs_at_1_diff1":0.20497205438323887,
737
+ "naucs_at_3_max":-0.2760768601040555,
738
+ "naucs_at_3_std":-0.19536511254108982,
739
+ "naucs_at_3_diff1":0.12639737194669312,
740
+ "naucs_at_5_max":-0.32266979804661855,
741
+ "naucs_at_5_std":-0.2321273259469018,
742
+ "naucs_at_5_diff1":0.12201056497848635,
743
+ "naucs_at_10_max":-0.31327785677716363,
744
+ "naucs_at_10_std":-0.20701857432203374,
745
+ "naucs_at_10_diff1":0.12714449010861775,
746
+ "naucs_at_20_max":-0.3057758145014666,
747
+ "naucs_at_20_std":-0.19196155860715694,
748
+ "naucs_at_20_diff1":0.004456792889016827,
749
+ "naucs_at_50_max":-0.3443751963336487,
750
+ "naucs_at_50_std":-0.19916004962508968,
751
+ "naucs_at_50_diff1":-0.15313050707770795,
752
+ "naucs_at_100_max":-0.33335268769256254,
753
+ "naucs_at_100_std":-0.1759902263556841,
754
+ "naucs_at_100_diff1":-0.16546750884331984
755
+ },
756
+ "vidore/synthetic_axa_filtered_v1.0":{
757
+ "ndcg_at_1":0.72222,
758
+ "ndcg_at_3":0.68859,
759
+ "ndcg_at_5":0.6877,
760
+ "ndcg_at_10":0.69829,
761
+ "ndcg_at_20":0.7342,
762
+ "ndcg_at_50":0.77785,
763
+ "ndcg_at_100":0.78996,
764
+ "map_at_1":0.36488,
765
+ "map_at_3":0.46953,
766
+ "map_at_5":0.52392,
767
+ "map_at_10":0.58858,
768
+ "map_at_20":0.62889,
769
+ "map_at_50":0.64917,
770
+ "map_at_100":0.65352,
771
+ "recall_at_1":0.36488,
772
+ "recall_at_3":0.54323,
773
+ "recall_at_5":0.61414,
774
+ "recall_at_10":0.71635,
775
+ "recall_at_20":0.82542,
776
+ "recall_at_50":0.95323,
777
+ "recall_at_100":0.98765,
778
+ "precision_at_1":0.72222,
779
+ "precision_at_3":0.44444,
780
+ "precision_at_5":0.37778,
781
+ "precision_at_10":0.27222,
782
+ "precision_at_20":0.175,
783
+ "precision_at_50":0.08667,
784
+ "precision_at_100":0.04667,
785
+ "mrr_at_1":0.6111111111111112,
786
+ "mrr_at_3":0.7592592592592592,
787
+ "mrr_at_5":0.7592592592592592,
788
+ "mrr_at_10":0.7592592592592592,
789
+ "mrr_at_20":0.7592592592592592,
790
+ "mrr_at_50":0.7611111111111111,
791
+ "mrr_at_100":0.7611111111111111,
792
+ "naucs_at_1_max":-0.1072500882788756,
793
+ "naucs_at_1_std":-0.07848008527574335,
794
+ "naucs_at_1_diff1":0.3888329697673727,
795
+ "naucs_at_3_max":-0.5668751047952342,
796
+ "naucs_at_3_std":-0.5329585384567367,
797
+ "naucs_at_3_diff1":-0.2021392643633502,
798
+ "naucs_at_5_max":-0.5633098595994385,
799
+ "naucs_at_5_std":-0.43232123457673266,
800
+ "naucs_at_5_diff1":-0.17951311814925686,
801
+ "naucs_at_10_max":-0.6374122831555527,
802
+ "naucs_at_10_std":-0.43175557593234065,
803
+ "naucs_at_10_diff1":-0.31039799211753494,
804
+ "naucs_at_20_max":-0.701465591207169,
805
+ "naucs_at_20_std":-0.4917500935922029,
806
+ "naucs_at_20_diff1":-0.35064529361083185,
807
+ "naucs_at_50_max":-0.7021744453459953,
808
+ "naucs_at_50_std":-0.4855377059097475,
809
+ "naucs_at_50_diff1":-0.36456623920339126,
810
+ "naucs_at_100_max":-0.6924863874111336,
811
+ "naucs_at_100_std":-0.4863559555556065,
812
+ "naucs_at_100_diff1":-0.3608886108131484
813
+ },
814
+ "vidore/synthetic_rse_restaurant_filtered_v1.0_multilingual":{
815
+ "ndcg_at_1":0.54386,
816
+ "ndcg_at_3":0.53992,
817
+ "ndcg_at_5":0.57161,
818
+ "ndcg_at_10":0.61517,
819
+ "ndcg_at_20":0.64796,
820
+ "ndcg_at_50":0.67915,
821
+ "ndcg_at_100":0.69235,
822
+ "map_at_1":0.22592,
823
+ "map_at_3":0.38229,
824
+ "map_at_5":0.43639,
825
+ "map_at_10":0.48456,
826
+ "map_at_20":0.50644,
827
+ "map_at_50":0.52393,
828
+ "map_at_100":0.53044,
829
+ "recall_at_1":0.22592,
830
+ "recall_at_3":0.48555,
831
+ "recall_at_5":0.61365,
832
+ "recall_at_10":0.75902,
833
+ "recall_at_20":0.86188,
834
+ "recall_at_50":0.94857,
835
+ "recall_at_100":0.98684,
836
+ "precision_at_1":0.54386,
837
+ "precision_at_3":0.3845,
838
+ "precision_at_5":0.30351,
839
+ "precision_at_10":0.20439,
840
+ "precision_at_20":0.12785,
841
+ "precision_at_50":0.06851,
842
+ "precision_at_100":0.03882,
843
+ "mrr_at_1":0.5394736842105263,
844
+ "mrr_at_3":0.6491228070175438,
845
+ "mrr_at_5":0.6675438596491228,
846
+ "mrr_at_10":0.6769945697577275,
847
+ "mrr_at_20":0.6792236734283947,
848
+ "mrr_at_50":0.6797428454113825,
849
+ "mrr_at_100":0.6798197921642295,
850
+ "naucs_at_1_max":-0.20674277350895354,
851
+ "naucs_at_1_std":-0.12027303922549912,
852
+ "naucs_at_1_diff1":0.23775810754837193,
853
+ "naucs_at_3_max":-0.14132383047647284,
854
+ "naucs_at_3_std":-0.11240148832069007,
855
+ "naucs_at_3_diff1":0.15033788234126377,
856
+ "naucs_at_5_max":-0.17140084599390548,
857
+ "naucs_at_5_std":-0.13104605490168167,
858
+ "naucs_at_5_diff1":0.1523799082346645,
859
+ "naucs_at_10_max":-0.17604422702000652,
860
+ "naucs_at_10_std":-0.1040197021731718,
861
+ "naucs_at_10_diff1":0.141987374687683,
862
+ "naucs_at_20_max":-0.18707526779473269,
863
+ "naucs_at_20_std":-0.05659957021660996,
864
+ "naucs_at_20_diff1":0.043138658571222205,
865
+ "naucs_at_50_max":-0.23552302035441924,
866
+ "naucs_at_50_std":-0.05397637299883905,
867
+ "naucs_at_50_diff1":-0.09007005759845056,
868
+ "naucs_at_100_max":-0.2339022131728518,
869
+ "naucs_at_100_std":-0.0193642217972453,
870
+ "naucs_at_100_diff1":-0.11400444827044932
871
+ },
872
+ "vidore/synthetic_axa_filtered_v1.0_multilingual":{
873
+ "ndcg_at_1":0.63889,
874
+ "ndcg_at_3":0.62281,
875
+ "ndcg_at_5":0.60952,
876
+ "ndcg_at_10":0.64318,
877
+ "ndcg_at_20":0.67634,
878
+ "ndcg_at_50":0.71094,
879
+ "ndcg_at_100":0.72844,
880
+ "map_at_1":0.32704,
881
+ "map_at_3":0.41888,
882
+ "map_at_5":0.46563,
883
+ "map_at_10":0.53051,
884
+ "map_at_20":0.56674,
885
+ "map_at_50":0.58314,
886
+ "map_at_100":0.58783,
887
+ "recall_at_1":0.32704,
888
+ "recall_at_3":0.48365,
889
+ "recall_at_5":0.54387,
890
+ "recall_at_10":0.69125,
891
+ "recall_at_20":0.78669,
892
+ "recall_at_50":0.8863,
893
+ "recall_at_100":0.9429,
894
+ "precision_at_1":0.63889,
895
+ "precision_at_3":0.41204,
896
+ "precision_at_5":0.33333,
897
+ "precision_at_10":0.25417,
898
+ "precision_at_20":0.16597,
899
+ "precision_at_50":0.07972,
900
+ "precision_at_100":0.04431,
901
+ "mrr_at_1":0.5972222222222222,
902
+ "mrr_at_3":0.7083333333333333,
903
+ "mrr_at_5":0.7083333333333333,
904
+ "mrr_at_10":0.7178791887125221,
905
+ "mrr_at_20":0.7191418149751484,
906
+ "mrr_at_50":0.7199862392542369,
907
+ "mrr_at_100":0.7201556159480039,
908
+ "naucs_at_1_max":0.11301406077201734,
909
+ "naucs_at_1_std":0.21519921250929616,
910
+ "naucs_at_1_diff1":0.3601399303857268,
911
+ "naucs_at_3_max":-0.24927986503179209,
912
+ "naucs_at_3_std":-0.09022708366608238,
913
+ "naucs_at_3_diff1":0.04489545233674075,
914
+ "naucs_at_5_max":-0.26591050096906066,
915
+ "naucs_at_5_std":-0.07265537709306702,
916
+ "naucs_at_5_diff1":0.0014191239058859906,
917
+ "naucs_at_10_max":-0.3903220005756808,
918
+ "naucs_at_10_std":-0.12521844950880665,
919
+ "naucs_at_10_diff1":-0.19712230727571253,
920
+ "naucs_at_20_max":-0.45199817313888363,
921
+ "naucs_at_20_std":-0.1484667347150115,
922
+ "naucs_at_20_diff1":-0.2608757999232997,
923
+ "naucs_at_50_max":-0.48614207326501946,
924
+ "naucs_at_50_std":-0.15554359778230578,
925
+ "naucs_at_50_diff1":-0.27852375257122247,
926
+ "naucs_at_100_max":-0.5125082706318165,
927
+ "naucs_at_100_std":-0.18550458631758462,
928
+ "naucs_at_100_diff1":-0.31194041608707157
929
+ },
930
+ "vidore/synthetic_mit_biomedical_tissue_interactions_unfiltered_multilingual":{
931
+ "ndcg_at_1":0.58125,
932
+ "ndcg_at_3":0.60975,
933
+ "ndcg_at_5":0.62539,
934
+ "ndcg_at_10":0.65521,
935
+ "ndcg_at_20":0.67922,
936
+ "ndcg_at_50":0.70341,
937
+ "ndcg_at_100":0.71315,
938
+ "map_at_1":0.35357,
939
+ "map_at_3":0.49223,
940
+ "map_at_5":0.5321,
941
+ "map_at_10":0.56549,
942
+ "map_at_20":0.5796,
943
+ "map_at_50":0.58865,
944
+ "map_at_100":0.59103,
945
+ "recall_at_1":0.35357,
946
+ "recall_at_3":0.57487,
947
+ "recall_at_5":0.65905,
948
+ "recall_at_10":0.7508,
949
+ "recall_at_20":0.81705,
950
+ "recall_at_50":0.89072,
951
+ "recall_at_100":0.92568,
952
+ "precision_at_1":0.58125,
953
+ "precision_at_3":0.3849,
954
+ "precision_at_5":0.28719,
955
+ "precision_at_10":0.18125,
956
+ "precision_at_20":0.10578,
957
+ "precision_at_50":0.05062,
958
+ "precision_at_100":0.02748,
959
+ "mrr_at_1":0.5796875,
960
+ "mrr_at_3":0.6901041666666663,
961
+ "mrr_at_5":0.7021354166666661,
962
+ "mrr_at_10":0.7074832589285712,
963
+ "mrr_at_20":0.7102574911812041,
964
+ "mrr_at_50":0.7110110149629919,
965
+ "mrr_at_100":0.7111676465392118,
966
+ "naucs_at_1_max":0.17241551553460638,
967
+ "naucs_at_1_std":-0.10458500213424893,
968
+ "naucs_at_1_diff1":0.5014939741528845,
969
+ "naucs_at_3_max":0.04213476105852452,
970
+ "naucs_at_3_std":-0.03593819184778826,
971
+ "naucs_at_3_diff1":-0.03987788271154801,
972
+ "naucs_at_5_max":0.027250565594662386,
973
+ "naucs_at_5_std":-0.037278236776539624,
974
+ "naucs_at_5_diff1":-0.1239404049371398,
975
+ "naucs_at_10_max":-0.06115387637712348,
976
+ "naucs_at_10_std":-0.0718804318785458,
977
+ "naucs_at_10_diff1":-0.19295981392132494,
978
+ "naucs_at_20_max":-0.09125226002964483,
979
+ "naucs_at_20_std":-0.028359299920185887,
980
+ "naucs_at_20_diff1":-0.22651248920886707,
981
+ "naucs_at_50_max":-0.10766546120682835,
982
+ "naucs_at_50_std":0.03593323121140819,
983
+ "naucs_at_50_diff1":-0.25675662871310556,
984
+ "naucs_at_100_max":-0.12997916463636278,
985
+ "naucs_at_100_std":0.05375545158818975,
986
+ "naucs_at_100_diff1":-0.2582624772102094
987
+ },
988
+ "vidore/synthetics_economics_macro_economy_2024_filtered_v1.0_multilingual":{
989
+ "ndcg_at_1":0.57759,
990
+ "ndcg_at_3":0.57138,
991
+ "ndcg_at_5":0.55497,
992
+ "ndcg_at_10":0.5473,
993
+ "ndcg_at_20":0.58512,
994
+ "ndcg_at_50":0.65027,
995
+ "ndcg_at_100":0.68902,
996
+ "map_at_1":0.08005,
997
+ "map_at_3":0.17589,
998
+ "map_at_5":0.22976,
999
+ "map_at_10":0.29906,
1000
+ "map_at_20":0.36451,
1001
+ "map_at_50":0.42404,
1002
+ "map_at_100":0.45273,
1003
+ "recall_at_1":0.08005,
1004
+ "recall_at_3":0.21653,
1005
+ "recall_at_5":0.30793,
1006
+ "recall_at_10":0.43982,
1007
+ "recall_at_20":0.60961,
1008
+ "recall_at_50":0.80111,
1009
+ "recall_at_100":0.91548,
1010
+ "precision_at_1":0.57759,
1011
+ "precision_at_3":0.53592,
1012
+ "precision_at_5":0.49138,
1013
+ "precision_at_10":0.40733,
1014
+ "precision_at_20":0.31832,
1015
+ "precision_at_50":0.19638,
1016
+ "precision_at_100":0.12836,
1017
+ "mrr_at_1":0.5646551724137931,
1018
+ "mrr_at_3":0.694683908045977,
1019
+ "mrr_at_5":0.7136494252873563,
1020
+ "mrr_at_10":0.7207478106185002,
1021
+ "mrr_at_20":0.7223871734108802,
1022
+ "mrr_at_50":0.7225924279264796,
1023
+ "mrr_at_100":0.7225924279264796,
1024
+ "naucs_at_1_max":0.025825981954306243,
1025
+ "naucs_at_1_std":0.06786701290377438,
1026
+ "naucs_at_1_diff1":0.3119241048950317,
1027
+ "naucs_at_3_max":0.0479066957744716,
1028
+ "naucs_at_3_std":0.06557391489213844,
1029
+ "naucs_at_3_diff1":0.23439300856464848,
1030
+ "naucs_at_5_max":0.0517250332191857,
1031
+ "naucs_at_5_std":0.09464648925799282,
1032
+ "naucs_at_5_diff1":0.2254037385021122,
1033
+ "naucs_at_10_max":0.07385165346450225,
1034
+ "naucs_at_10_std":0.14105623461417685,
1035
+ "naucs_at_10_diff1":0.09658147605174039,
1036
+ "naucs_at_20_max":0.04903637832153811,
1037
+ "naucs_at_20_std":0.1590552355815479,
1038
+ "naucs_at_20_diff1":0.028107412938548966,
1039
+ "naucs_at_50_max":0.02938750541507763,
1040
+ "naucs_at_50_std":0.15805354436493257,
1041
+ "naucs_at_50_diff1":-0.04958795351145276,
1042
+ "naucs_at_100_max":-0.0034893431750791983,
1043
+ "naucs_at_100_std":0.13285693605908278,
1044
+ "naucs_at_100_diff1":-0.07289241471567467
1045
+ },
1046
+ "vidore/restaurant_esg_reports_beir":{
1047
+ "ndcg_at_1":0.66667,
1048
+ "ndcg_at_3":0.62961,
1049
+ "ndcg_at_5":0.65844,
1050
+ "ndcg_at_10":0.70149,
1051
+ "ndcg_at_20":0.72887,
1052
+ "ndcg_at_50":0.75185,
1053
+ "ndcg_at_100":0.75669,
1054
+ "map_at_1":0.47262,
1055
+ "map_at_3":0.55789,
1056
+ "map_at_5":0.59623,
1057
+ "map_at_10":0.62874,
1058
+ "map_at_20":0.64199,
1059
+ "map_at_50":0.64885,
1060
+ "map_at_100":0.65059,
1061
+ "recall_at_1":0.47262,
1062
+ "recall_at_3":0.58302,
1063
+ "recall_at_5":0.68751,
1064
+ "recall_at_10":0.8013,
1065
+ "recall_at_20":0.88308,
1066
+ "recall_at_50":0.9586,
1067
+ "recall_at_100":0.97619,
1068
+ "precision_at_1":0.69231,
1069
+ "precision_at_3":0.33974,
1070
+ "precision_at_5":0.24615,
1071
+ "precision_at_10":0.15577,
1072
+ "precision_at_20":0.09231,
1073
+ "precision_at_50":0.04269,
1074
+ "precision_at_100":0.02288,
1075
+ "mrr_at_1":0.6923076923076923,
1076
+ "mrr_at_3":0.7371794871794872,
1077
+ "mrr_at_5":0.7583333333333333,
1078
+ "mrr_at_10":0.7666666666666665,
1079
+ "mrr_at_20":0.7698942083557468,
1080
+ "mrr_at_50":0.7706954904070289,
1081
+ "mrr_at_100":0.7706954904070289,
1082
+ "naucs_at_1_max":0.21266459227612405,
1083
+ "naucs_at_1_std":0.19096494070335385,
1084
+ "naucs_at_1_diff1":0.49249886565541523,
1085
+ "naucs_at_3_max":-0.03430599620876157,
1086
+ "naucs_at_3_std":0.017097041956098673,
1087
+ "naucs_at_3_diff1":-0.03264969467214677,
1088
+ "naucs_at_5_max":-0.022484350271713836,
1089
+ "naucs_at_5_std":-0.0636467385979771,
1090
+ "naucs_at_5_diff1":-0.16473803715393007,
1091
+ "naucs_at_10_max":-0.07317891510820472,
1092
+ "naucs_at_10_std":-0.04140978466752904,
1093
+ "naucs_at_10_diff1":-0.26462899584834276,
1094
+ "naucs_at_20_max":-0.0627742919035184,
1095
+ "naucs_at_20_std":0.04670746961963372,
1096
+ "naucs_at_20_diff1":-0.3704708282580158,
1097
+ "naucs_at_50_max":-0.06988684901669139,
1098
+ "naucs_at_50_std":0.005284407101443551,
1099
+ "naucs_at_50_diff1":-0.38324540988500305,
1100
+ "naucs_at_100_max":-0.11684726414295883,
1101
+ "naucs_at_100_std":0.005824353791349827,
1102
+ "naucs_at_100_diff1":-0.3791953702270732
1103
  }
1104
  }