nv-bschifferer's picture
modify README
16cdad8
{
"metadata": {
"timestamp": "2025-06-26T06:21:27.128658",
"vidore_benchmark_version": "5.0.1.dev12+ge0eb903"
},
"metrics": {
"vidore/arxivqa_test_subsampled": {
"ndcg_at_1": 0.834,
"ndcg_at_3": 0.87602,
"ndcg_at_5": 0.88351,
"ndcg_at_10": 0.89382,
"ndcg_at_20": 0.89856,
"ndcg_at_50": 0.9021,
"ndcg_at_100": 0.90271,
"map_at_1": 0.834,
"map_at_3": 0.86567,
"map_at_5": 0.86987,
"map_at_10": 0.87409,
"map_at_20": 0.87549,
"map_at_50": 0.87605,
"map_at_100": 0.87609,
"recall_at_1": 0.834,
"recall_at_3": 0.906,
"recall_at_5": 0.924,
"recall_at_10": 0.956,
"recall_at_20": 0.974,
"recall_at_50": 0.992,
"recall_at_100": 0.996,
"precision_at_1": 0.834,
"precision_at_3": 0.302,
"precision_at_5": 0.1848,
"precision_at_10": 0.0956,
"precision_at_20": 0.0487,
"precision_at_50": 0.01984,
"precision_at_100": 0.00996,
"mrr_at_1": 0.834,
"mrr_at_3": 0.8656666666666666,
"mrr_at_5": 0.8698666666666666,
"mrr_at_10": 0.8740904761904763,
"mrr_at_20": 0.8754917376740906,
"mrr_at_50": 0.8760454757022237,
"mrr_at_100": 0.8760882870575352,
"naucs_at_1_max": 0.6703392545655197,
"naucs_at_1_std": 0.4132759009409903,
"naucs_at_1_diff1": 0.9520605650682898,
"naucs_at_3_max": 0.6840495063273536,
"naucs_at_3_std": 0.45158630828217644,
"naucs_at_3_diff1": 0.9315116117368949,
"naucs_at_5_max": 0.7034989434370238,
"naucs_at_5_std": 0.46818025455796014,
"naucs_at_5_diff1": 0.9329205366357055,
"naucs_at_10_max": 0.6890968508615603,
"naucs_at_10_std": 0.474195738901625,
"naucs_at_10_diff1": 0.9457813428401673,
"naucs_at_20_max": 0.7880126409538182,
"naucs_at_20_std": 0.5496301084536358,
"naucs_at_20_diff1": 0.9283559577677175,
"naucs_at_50_max": 0.7480158730158629,
"naucs_at_50_std": 0.8190943043884249,
"naucs_at_50_diff1": 0.8978758169934562,
"naucs_at_100_max": 1.0,
"naucs_at_100_std": 1.0,
"naucs_at_100_diff1": 1.0
},
"vidore/docvqa_test_subsampled": {
"ndcg_at_1": 0.58537,
"ndcg_at_3": 0.64531,
"ndcg_at_5": 0.65942,
"ndcg_at_10": 0.67939,
"ndcg_at_20": 0.69023,
"ndcg_at_50": 0.70398,
"ndcg_at_100": 0.71126,
"map_at_1": 0.58537,
"map_at_3": 0.63008,
"map_at_5": 0.63762,
"map_at_10": 0.64581,
"map_at_20": 0.64889,
"map_at_50": 0.65114,
"map_at_100": 0.65181,
"recall_at_1": 0.58537,
"recall_at_3": 0.68958,
"recall_at_5": 0.72506,
"recall_at_10": 0.78714,
"recall_at_20": 0.82927,
"recall_at_50": 0.898,
"recall_at_100": 0.94235,
"precision_at_1": 0.58537,
"precision_at_3": 0.22986,
"precision_at_5": 0.14501,
"precision_at_10": 0.07871,
"precision_at_20": 0.04146,
"precision_at_50": 0.01796,
"precision_at_100": 0.00942,
"mrr_at_1": 0.5853658536585366,
"mrr_at_3": 0.6300813008130081,
"mrr_at_5": 0.6376201034737617,
"mrr_at_10": 0.6458064970260089,
"mrr_at_20": 0.6488879496173225,
"mrr_at_50": 0.6511443628922823,
"mrr_at_100": 0.6518089180219389,
"naucs_at_1_max": 0.2585563149452475,
"naucs_at_1_std": 0.3159595366492725,
"naucs_at_1_diff1": 0.8678053985855875,
"naucs_at_3_max": 0.22128557788133152,
"naucs_at_3_std": 0.258482179935891,
"naucs_at_3_diff1": 0.8393573283409745,
"naucs_at_5_max": 0.21064270306895383,
"naucs_at_5_std": 0.23472397866953829,
"naucs_at_5_diff1": 0.8274386494106453,
"naucs_at_10_max": 0.15097771381217617,
"naucs_at_10_std": 0.2839241224708214,
"naucs_at_10_diff1": 0.7893641996302178,
"naucs_at_20_max": 0.15466073118900037,
"naucs_at_20_std": 0.33553862379172555,
"naucs_at_20_diff1": 0.7724781458006538,
"naucs_at_50_max": 0.10906657289614331,
"naucs_at_50_std": 0.5786081651360842,
"naucs_at_50_diff1": 0.7426293121947367,
"naucs_at_100_max": 0.072673798370254,
"naucs_at_100_std": 0.8933863552254951,
"naucs_at_100_diff1": 0.7602442332060952
},
"vidore/infovqa_test_subsampled": {
"ndcg_at_1": 0.91498,
"ndcg_at_3": 0.94325,
"ndcg_at_5": 0.94908,
"ndcg_at_10": 0.95095,
"ndcg_at_20": 0.95363,
"ndcg_at_50": 0.95442,
"ndcg_at_100": 0.95476,
"map_at_1": 0.91498,
"map_at_3": 0.93623,
"map_at_5": 0.93947,
"map_at_10": 0.94019,
"map_at_20": 0.94099,
"map_at_50": 0.94111,
"map_at_100": 0.94114,
"recall_at_1": 0.91498,
"recall_at_3": 0.96356,
"recall_at_5": 0.97773,
"recall_at_10": 0.98381,
"recall_at_20": 0.99393,
"recall_at_50": 0.99798,
"recall_at_100": 1.0,
"precision_at_1": 0.91498,
"precision_at_3": 0.32119,
"precision_at_5": 0.19555,
"precision_at_10": 0.09838,
"precision_at_20": 0.0497,
"precision_at_50": 0.01996,
"precision_at_100": 0.01,
"mrr_at_1": 0.9149797570850202,
"mrr_at_3": 0.936234817813765,
"mrr_at_5": 0.9394736842105261,
"mrr_at_10": 0.9401902191375874,
"mrr_at_20": 0.9409887775689154,
"mrr_at_50": 0.9411103076140448,
"mrr_at_100": 0.9411405209199847,
"naucs_at_1_max": 0.6703820792124877,
"naucs_at_1_std": 0.16833937392893533,
"naucs_at_1_diff1": 0.9498534501270284,
"naucs_at_3_max": 0.5822492726969997,
"naucs_at_3_std": 0.06259669593622658,
"naucs_at_3_diff1": 0.9492105456414766,
"naucs_at_5_max": 0.739556315880861,
"naucs_at_5_std": 0.5078895506993929,
"naucs_at_5_diff1": 0.9643814216187027,
"naucs_at_10_max": 0.6766067765559199,
"naucs_at_10_std": 0.3559984957278538,
"naucs_at_10_diff1": 0.9836748182418953,
"naucs_at_20_max": 0.9564661819784134,
"naucs_at_20_std": 0.8638879360590604,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": 0.8693985459351681,
"naucs_at_50_std": 0.8693985459351681,
"naucs_at_50_diff1": 1.0,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"vidore/tabfquad_test_subsampled": {
"ndcg_at_1": 0.91786,
"ndcg_at_3": 0.95383,
"ndcg_at_5": 0.95935,
"ndcg_at_10": 0.95935,
"ndcg_at_20": 0.96032,
"ndcg_at_50": 0.96109,
"ndcg_at_100": 0.96109,
"map_at_1": 0.91786,
"map_at_3": 0.94524,
"map_at_5": 0.9481,
"map_at_10": 0.9481,
"map_at_20": 0.94839,
"map_at_50": 0.94854,
"map_at_100": 0.94854,
"recall_at_1": 0.91786,
"recall_at_3": 0.97857,
"recall_at_5": 0.99286,
"recall_at_10": 0.99286,
"recall_at_20": 0.99643,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.91786,
"precision_at_3": 0.32619,
"precision_at_5": 0.19857,
"precision_at_10": 0.09929,
"precision_at_20": 0.04982,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.9178571428571428,
"mrr_at_3": 0.9452380952380953,
"mrr_at_5": 0.948095238095238,
"mrr_at_10": 0.948095238095238,
"mrr_at_20": 0.9483928571428571,
"mrr_at_50": 0.9485416666666666,
"mrr_at_100": 0.9485416666666666,
"naucs_at_1_max": 0.04487882109365634,
"naucs_at_1_std": 0.15499533146591998,
"naucs_at_1_diff1": 0.928754110339789,
"naucs_at_3_max": 0.8358232181761669,
"naucs_at_3_std": 0.9101307189542569,
"naucs_at_3_diff1": 1.0,
"naucs_at_5_max": 0.9346405228758269,
"naucs_at_5_std": 0.9346405228758269,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 0.9346405228758269,
"naucs_at_10_std": 0.9346405228758269,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": 1.0,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": 1.0,
"naucs_at_50_std": 1.0,
"naucs_at_50_diff1": 1.0,
"naucs_at_100_max": 1.0,
"naucs_at_100_std": 1.0,
"naucs_at_100_diff1": 1.0
},
"vidore/tatdqa_test": {
"ndcg_at_1": 0.70535,
"ndcg_at_3": 0.7868,
"ndcg_at_5": 0.80621,
"ndcg_at_10": 0.82194,
"ndcg_at_20": 0.82672,
"ndcg_at_50": 0.83053,
"ndcg_at_100": 0.83277,
"map_at_1": 0.70535,
"map_at_3": 0.76742,
"map_at_5": 0.77826,
"map_at_10": 0.78488,
"map_at_20": 0.78628,
"map_at_50": 0.78693,
"map_at_100": 0.78712,
"recall_at_1": 0.70535,
"recall_at_3": 0.84265,
"recall_at_5": 0.88943,
"recall_at_10": 0.93742,
"recall_at_20": 0.95565,
"recall_at_50": 0.97448,
"recall_at_100": 0.98846,
"precision_at_1": 0.70535,
"precision_at_3": 0.28088,
"precision_at_5": 0.17789,
"precision_at_10": 0.09374,
"precision_at_20": 0.04778,
"precision_at_50": 0.01949,
"precision_at_100": 0.00988,
"mrr_at_1": 0.7035236938031592,
"mrr_at_3": 0.767010935601458,
"mrr_at_5": 0.7775212636695018,
"mrr_at_10": 0.7841125190456905,
"mrr_at_20": 0.7855296898659594,
"mrr_at_50": 0.7861619428321974,
"mrr_at_100": 0.7863629532691659,
"naucs_at_1_max": 0.22208704220171518,
"naucs_at_1_std": 0.15415493193166072,
"naucs_at_1_diff1": 0.85100407554343,
"naucs_at_3_max": 0.21518686518713465,
"naucs_at_3_std": 0.23043576383644288,
"naucs_at_3_diff1": 0.8025394364016292,
"naucs_at_5_max": 0.2641753480647899,
"naucs_at_5_std": 0.2706978631234192,
"naucs_at_5_diff1": 0.7806280461098983,
"naucs_at_10_max": 0.2523834187563826,
"naucs_at_10_std": 0.32315905277258156,
"naucs_at_10_diff1": 0.7532415640618384,
"naucs_at_20_max": 0.26510647248798225,
"naucs_at_20_std": 0.3525755808522635,
"naucs_at_20_diff1": 0.7348455395997588,
"naucs_at_50_max": 0.242804665789723,
"naucs_at_50_std": 0.44822875988285776,
"naucs_at_50_diff1": 0.7286029440909012,
"naucs_at_100_max": 0.05932622574605986,
"naucs_at_100_std": 0.28624024988935604,
"naucs_at_100_diff1": 0.7502131245549767
},
"vidore/shiftproject_test": {
"ndcg_at_1": 0.81,
"ndcg_at_3": 0.88678,
"ndcg_at_5": 0.907,
"ndcg_at_10": 0.907,
"ndcg_at_20": 0.907,
"ndcg_at_50": 0.90904,
"ndcg_at_100": 0.90904,
"map_at_1": 0.81,
"map_at_3": 0.86833,
"map_at_5": 0.87933,
"map_at_10": 0.87933,
"map_at_20": 0.87933,
"map_at_50": 0.87968,
"map_at_100": 0.87968,
"recall_at_1": 0.81,
"recall_at_3": 0.94,
"recall_at_5": 0.99,
"recall_at_10": 0.99,
"recall_at_20": 0.99,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.81,
"precision_at_3": 0.31333,
"precision_at_5": 0.198,
"precision_at_10": 0.099,
"precision_at_20": 0.0495,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.81,
"mrr_at_3": 0.8683333333333334,
"mrr_at_5": 0.8793333333333334,
"mrr_at_10": 0.8793333333333334,
"mrr_at_20": 0.8793333333333334,
"mrr_at_50": 0.8796781609195403,
"mrr_at_100": 0.8796781609195403,
"naucs_at_1_max": -0.18730682592068792,
"naucs_at_1_std": -0.7260202210697273,
"naucs_at_1_diff1": 0.8433652889098441,
"naucs_at_3_max": 0.3544195455960126,
"naucs_at_3_std": -0.26914098972922335,
"naucs_at_3_diff1": 0.9319172113289744,
"naucs_at_5_max": 0.12278244631185926,
"naucs_at_5_std": 0.35807656395891135,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 0.12278244631185926,
"naucs_at_10_std": 0.35807656395891135,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 0.12278244631185926,
"naucs_at_20_std": 0.35807656395891135,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"vidore/syntheticDocQA_artificial_intelligence_test": {
"ndcg_at_1": 0.99,
"ndcg_at_3": 0.99631,
"ndcg_at_5": 0.99631,
"ndcg_at_10": 0.99631,
"ndcg_at_20": 0.99631,
"ndcg_at_50": 0.99631,
"ndcg_at_100": 0.99631,
"map_at_1": 0.99,
"map_at_3": 0.995,
"map_at_5": 0.995,
"map_at_10": 0.995,
"map_at_20": 0.995,
"map_at_50": 0.995,
"map_at_100": 0.995,
"recall_at_1": 0.99,
"recall_at_3": 1.0,
"recall_at_5": 1.0,
"recall_at_10": 1.0,
"recall_at_20": 1.0,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.99,
"precision_at_3": 0.33333,
"precision_at_5": 0.2,
"precision_at_10": 0.1,
"precision_at_20": 0.05,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.99,
"mrr_at_3": 0.995,
"mrr_at_5": 0.995,
"mrr_at_10": 0.995,
"mrr_at_20": 0.995,
"mrr_at_50": 0.995,
"mrr_at_100": 0.995,
"naucs_at_1_max": 0.12278244631185359,
"naucs_at_1_std": 0.12278244631185359,
"naucs_at_1_diff1": 1.0,
"naucs_at_3_max": 1.0,
"naucs_at_3_std": 1.0,
"naucs_at_3_diff1": 1.0,
"naucs_at_5_max": 1.0,
"naucs_at_5_std": 1.0,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 1.0,
"naucs_at_10_std": 1.0,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": 1.0,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"vidore/syntheticDocQA_energy_test": {
"ndcg_at_1": 0.96,
"ndcg_at_3": 0.96631,
"ndcg_at_5": 0.96631,
"ndcg_at_10": 0.96946,
"ndcg_at_20": 0.97209,
"ndcg_at_50": 0.97406,
"ndcg_at_100": 0.97406,
"map_at_1": 0.96,
"map_at_3": 0.965,
"map_at_5": 0.965,
"map_at_10": 0.96625,
"map_at_20": 0.96702,
"map_at_50": 0.96732,
"map_at_100": 0.96732,
"recall_at_1": 0.96,
"recall_at_3": 0.97,
"recall_at_5": 0.97,
"recall_at_10": 0.98,
"recall_at_20": 0.99,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.96,
"precision_at_3": 0.32333,
"precision_at_5": 0.194,
"precision_at_10": 0.098,
"precision_at_20": 0.0495,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.96,
"mrr_at_3": 0.965,
"mrr_at_5": 0.965,
"mrr_at_10": 0.96625,
"mrr_at_20": 0.9670192307692308,
"mrr_at_50": 0.9673222610722612,
"mrr_at_100": 0.9673222610722612,
"naucs_at_1_max": 0.7169701213818873,
"naucs_at_1_std": -0.03863211951446941,
"naucs_at_1_diff1": 1.0,
"naucs_at_3_max": 0.7152194211017727,
"naucs_at_3_std": -0.34126984126984133,
"naucs_at_3_diff1": 1.0,
"naucs_at_5_max": 0.7152194211017693,
"naucs_at_5_std": -0.3412698412698435,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 0.7957516339869297,
"naucs_at_10_std": 0.35807656395892185,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 0.7222222222222276,
"naucs_at_20_std": 0.35807656395891135,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"vidore/syntheticDocQA_government_reports_test": {
"ndcg_at_1": 0.95,
"ndcg_at_3": 0.97393,
"ndcg_at_5": 0.97823,
"ndcg_at_10": 0.97823,
"ndcg_at_20": 0.97823,
"ndcg_at_50": 0.97823,
"ndcg_at_100": 0.97823,
"map_at_1": 0.95,
"map_at_3": 0.96833,
"map_at_5": 0.97083,
"map_at_10": 0.97083,
"map_at_20": 0.97083,
"map_at_50": 0.97083,
"map_at_100": 0.97083,
"recall_at_1": 0.95,
"recall_at_3": 0.99,
"recall_at_5": 1.0,
"recall_at_10": 1.0,
"recall_at_20": 1.0,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.95,
"precision_at_3": 0.33,
"precision_at_5": 0.2,
"precision_at_10": 0.1,
"precision_at_20": 0.05,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.95,
"mrr_at_3": 0.9683333333333333,
"mrr_at_5": 0.9708333333333333,
"mrr_at_10": 0.9708333333333333,
"mrr_at_20": 0.9708333333333333,
"mrr_at_50": 0.9708333333333333,
"mrr_at_100": 0.9708333333333333,
"naucs_at_1_max": 0.6765639589168986,
"naucs_at_1_std": 0.5556489262371623,
"naucs_at_1_diff1": 0.9738562091503253,
"naucs_at_3_max": 1.0,
"naucs_at_3_std": 0.8692810457516356,
"naucs_at_3_diff1": 0.8692810457516356,
"naucs_at_5_max": 1.0,
"naucs_at_5_std": 1.0,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 1.0,
"naucs_at_10_std": 1.0,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": 1.0,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"vidore/syntheticDocQA_healthcare_industry_test": {
"ndcg_at_1": 0.98,
"ndcg_at_3": 0.99262,
"ndcg_at_5": 0.99262,
"ndcg_at_10": 0.99262,
"ndcg_at_20": 0.99262,
"ndcg_at_50": 0.99262,
"ndcg_at_100": 0.99262,
"map_at_1": 0.98,
"map_at_3": 0.99,
"map_at_5": 0.99,
"map_at_10": 0.99,
"map_at_20": 0.99,
"map_at_50": 0.99,
"map_at_100": 0.99,
"recall_at_1": 0.98,
"recall_at_3": 1.0,
"recall_at_5": 1.0,
"recall_at_10": 1.0,
"recall_at_20": 1.0,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.98,
"precision_at_3": 0.33333,
"precision_at_5": 0.2,
"precision_at_10": 0.1,
"precision_at_20": 0.05,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.98,
"mrr_at_3": 0.99,
"mrr_at_5": 0.99,
"mrr_at_10": 0.99,
"mrr_at_20": 0.99,
"mrr_at_50": 0.99,
"mrr_at_100": 0.99,
"naucs_at_1_max": 0.6381886087768457,
"naucs_at_1_std": -0.14122315592903503,
"naucs_at_1_diff1": 1.0,
"naucs_at_3_max": 1.0,
"naucs_at_3_std": 1.0,
"naucs_at_3_diff1": 1.0,
"naucs_at_5_max": 1.0,
"naucs_at_5_std": 1.0,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 1.0,
"naucs_at_10_std": 1.0,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": 1.0,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"vidore/synthetic_rse_restaurant_filtered_v1.0_multilingual": {
"ndcg_at_1": 0.49561,
"ndcg_at_3": 0.53551,
"ndcg_at_5": 0.57573,
"ndcg_at_10": 0.62797,
"ndcg_at_20": 0.66435,
"ndcg_at_50": 0.68753,
"ndcg_at_100": 0.69778,
"map_at_1": 0.24991,
"map_at_3": 0.39804,
"map_at_5": 0.45596,
"map_at_10": 0.50329,
"map_at_20": 0.52856,
"map_at_50": 0.54302,
"map_at_100": 0.54853,
"recall_at_1": 0.24991,
"recall_at_3": 0.49812,
"recall_at_5": 0.62081,
"recall_at_10": 0.78505,
"recall_at_20": 0.89032,
"recall_at_50": 0.94781,
"recall_at_100": 0.97423,
"precision_at_1": 0.49561,
"precision_at_3": 0.37865,
"precision_at_5": 0.30965,
"precision_at_10": 0.20921,
"precision_at_20": 0.13246,
"precision_at_50": 0.06912,
"precision_at_100": 0.03846,
"mrr_at_1": 0.4956140350877193,
"mrr_at_3": 0.6271929824561403,
"mrr_at_5": 0.642982456140351,
"mrr_at_10": 0.6540744221665276,
"mrr_at_20": 0.6558978051818611,
"mrr_at_50": 0.6561780443192584,
"mrr_at_100": 0.6561780443192584,
"naucs_at_1_max": -0.07400167664801681,
"naucs_at_1_std": 0.03458415022230023,
"naucs_at_1_diff1": 0.36837819306504144,
"naucs_at_3_max": -0.12444851869211698,
"naucs_at_3_std": -0.03350495496687875,
"naucs_at_3_diff1": 0.14678568781036586,
"naucs_at_5_max": -0.18380991972520577,
"naucs_at_5_std": -0.04485546676356389,
"naucs_at_5_diff1": 0.09319332805741351,
"naucs_at_10_max": -0.2287733254906937,
"naucs_at_10_std": -0.11817355407871401,
"naucs_at_10_diff1": 0.039989126851164826,
"naucs_at_20_max": -0.26978462701811906,
"naucs_at_20_std": -0.17072707397422024,
"naucs_at_20_diff1": -0.043988113501541394,
"naucs_at_50_max": -0.2775075319567234,
"naucs_at_50_std": -0.20957246437121108,
"naucs_at_50_diff1": -0.1133061107255248,
"naucs_at_100_max": -0.27585910810842096,
"naucs_at_100_std": -0.2097908968784823,
"naucs_at_100_diff1": -0.14037054801741544
},
"vidore/synthetic_mit_biomedical_tissue_interactions_unfiltered_multilingual": {
"ndcg_at_1": 0.60469,
"ndcg_at_3": 0.61057,
"ndcg_at_5": 0.63196,
"ndcg_at_10": 0.66415,
"ndcg_at_20": 0.68919,
"ndcg_at_50": 0.71209,
"ndcg_at_100": 0.72404,
"map_at_1": 0.3749,
"map_at_3": 0.50426,
"map_at_5": 0.54282,
"map_at_10": 0.57771,
"map_at_20": 0.59195,
"map_at_50": 0.60066,
"map_at_100": 0.60317,
"recall_at_1": 0.3749,
"recall_at_3": 0.56825,
"recall_at_5": 0.65837,
"recall_at_10": 0.75073,
"recall_at_20": 0.81942,
"recall_at_50": 0.8876,
"recall_at_100": 0.93527,
"precision_at_1": 0.60469,
"precision_at_3": 0.37448,
"precision_at_5": 0.28031,
"precision_at_10": 0.17922,
"precision_at_20": 0.10523,
"precision_at_50": 0.05022,
"precision_at_100": 0.02742,
"mrr_at_1": 0.6046875,
"mrr_at_3": 0.693489583333333,
"mrr_at_5": 0.7104427083333327,
"mrr_at_10": 0.7158568948412692,
"mrr_at_20": 0.7190933507966805,
"mrr_at_50": 0.7196874906299467,
"mrr_at_100": 0.7198739903840827,
"naucs_at_1_max": 0.21052397754348515,
"naucs_at_1_std": 0.09375197289505234,
"naucs_at_1_diff1": 0.5111101758127156,
"naucs_at_3_max": 0.06090465086494804,
"naucs_at_3_std": -0.001418024019873419,
"naucs_at_3_diff1": -0.03565597745007234,
"naucs_at_5_max": 0.004465748594415919,
"naucs_at_5_std": -0.0484521722756207,
"naucs_at_5_diff1": -0.1245720478106472,
"naucs_at_10_max": -0.059499017411910264,
"naucs_at_10_std": -0.07086245514678893,
"naucs_at_10_diff1": -0.22255807507622197,
"naucs_at_20_max": -0.08861071305293747,
"naucs_at_20_std": -0.04972647301862899,
"naucs_at_20_diff1": -0.28111304038576185,
"naucs_at_50_max": -0.0772093711850375,
"naucs_at_50_std": -0.03833832084634795,
"naucs_at_50_diff1": -0.3229404564565436,
"naucs_at_100_max": -0.09326229510606512,
"naucs_at_100_std": -0.05851062266000862,
"naucs_at_100_diff1": -0.33725273449156307
},
"vidore/synthetics_economics_macro_economy_2024_filtered_v1.0_multilingual": {
"ndcg_at_1": 0.65086,
"ndcg_at_3": 0.60789,
"ndcg_at_5": 0.57982,
"ndcg_at_10": 0.56497,
"ndcg_at_20": 0.5906,
"ndcg_at_50": 0.66142,
"ndcg_at_100": 0.6981,
"map_at_1": 0.09835,
"map_at_3": 0.19265,
"map_at_5": 0.2438,
"map_at_10": 0.31201,
"map_at_20": 0.37105,
"map_at_50": 0.43282,
"map_at_100": 0.45993,
"recall_at_1": 0.09835,
"recall_at_3": 0.2383,
"recall_at_5": 0.31559,
"recall_at_10": 0.44357,
"recall_at_20": 0.59021,
"recall_at_50": 0.79179,
"recall_at_100": 0.90968,
"precision_at_1": 0.65086,
"precision_at_3": 0.55316,
"precision_at_5": 0.49828,
"precision_at_10": 0.40603,
"precision_at_20": 0.30948,
"precision_at_50": 0.1981,
"precision_at_100": 0.12724,
"mrr_at_1": 0.6508620689655172,
"mrr_at_3": 0.7586206896551727,
"mrr_at_5": 0.7706896551724141,
"mrr_at_10": 0.7741362205801864,
"mrr_at_20": 0.7757055120898937,
"mrr_at_50": 0.7760672193481526,
"mrr_at_100": 0.7760672193481526,
"naucs_at_1_max": -0.1577982313304122,
"naucs_at_1_std": 0.07083760025943213,
"naucs_at_1_diff1": 0.1180440061698451,
"naucs_at_3_max": -0.03551684594794198,
"naucs_at_3_std": 0.18649544217765762,
"naucs_at_3_diff1": 0.006931180468183028,
"naucs_at_5_max": -0.042439023438686566,
"naucs_at_5_std": 0.1463028288463992,
"naucs_at_5_diff1": 0.0052961279206988725,
"naucs_at_10_max": -0.014346231321749392,
"naucs_at_10_std": 0.13820096240926596,
"naucs_at_10_diff1": 0.060959204965535974,
"naucs_at_20_max": -0.04036150486209418,
"naucs_at_20_std": 0.10161400684234778,
"naucs_at_20_diff1": 0.058238772027959955,
"naucs_at_50_max": -0.027805254364547293,
"naucs_at_50_std": 0.06305093612338106,
"naucs_at_50_diff1": 0.014479645829478357,
"naucs_at_100_max": -0.04967371405554246,
"naucs_at_100_std": -0.0014108802561097272,
"naucs_at_100_diff1": 0.004463197803405348
},
"vidore/restaurant_esg_reports_beir": {
"ndcg_at_1": 0.66026,
"ndcg_at_3": 0.71844,
"ndcg_at_5": 0.74746,
"ndcg_at_10": 0.78463,
"ndcg_at_20": 0.79647,
"ndcg_at_50": 0.80898,
"ndcg_at_100": 0.81195,
"map_at_1": 0.46731,
"map_at_3": 0.6321,
"map_at_5": 0.67856,
"map_at_10": 0.71154,
"map_at_20": 0.71984,
"map_at_50": 0.72621,
"map_at_100": 0.72685,
"recall_at_1": 0.46731,
"recall_at_3": 0.71218,
"recall_at_5": 0.7989,
"recall_at_10": 0.89575,
"recall_at_20": 0.92767,
"recall_at_50": 0.97191,
"recall_at_100": 0.981,
"precision_at_1": 0.67308,
"precision_at_3": 0.41026,
"precision_at_5": 0.30769,
"precision_at_10": 0.18654,
"precision_at_20": 0.10096,
"precision_at_50": 0.04462,
"precision_at_100": 0.02308,
"mrr_at_1": 0.6730769230769231,
"mrr_at_3": 0.7756410256410257,
"mrr_at_5": 0.7852564102564104,
"mrr_at_10": 0.7940705128205129,
"mrr_at_20": 0.7940705128205129,
"mrr_at_50": 0.7949862637362638,
"mrr_at_100": 0.7949862637362638,
"naucs_at_1_max": 0.2155210634937776,
"naucs_at_1_std": 0.20643949634517547,
"naucs_at_1_diff1": 0.5572918449312647,
"naucs_at_3_max": -0.22870270992303324,
"naucs_at_3_std": -0.16008064610097344,
"naucs_at_3_diff1": -0.1052498381156227,
"naucs_at_5_max": -0.20249887866652966,
"naucs_at_5_std": -0.10577079083523987,
"naucs_at_5_diff1": -0.21560021268353965,
"naucs_at_10_max": -0.13190257359821772,
"naucs_at_10_std": -0.02595056097795122,
"naucs_at_10_diff1": -0.25059078573348686,
"naucs_at_20_max": -0.10804998986280905,
"naucs_at_20_std": 0.009844091874970871,
"naucs_at_20_diff1": -0.3106578658424983,
"naucs_at_50_max": -0.14217724030501422,
"naucs_at_50_std": -0.0010783625765841411,
"naucs_at_50_diff1": -0.2900029814490325,
"naucs_at_100_max": -0.15203872114868228,
"naucs_at_100_std": -0.01643757244869887,
"naucs_at_100_diff1": -0.2814362025783248
},
"vidore/synthetic_rse_restaurant_filtered_v1.0": {
"ndcg_at_1": 0.52632,
"ndcg_at_3": 0.55122,
"ndcg_at_5": 0.58777,
"ndcg_at_10": 0.63895,
"ndcg_at_20": 0.66853,
"ndcg_at_50": 0.69944,
"ndcg_at_100": 0.7087,
"map_at_1": 0.28596,
"map_at_3": 0.42149,
"map_at_5": 0.48239,
"map_at_10": 0.52458,
"map_at_20": 0.54701,
"map_at_50": 0.56361,
"map_at_100": 0.56876,
"recall_at_1": 0.28596,
"recall_at_3": 0.5136,
"recall_at_5": 0.6131,
"recall_at_10": 0.77097,
"recall_at_20": 0.8575,
"recall_at_50": 0.93975,
"recall_at_100": 0.96272,
"precision_at_1": 0.52632,
"precision_at_3": 0.37427,
"precision_at_5": 0.31228,
"precision_at_10": 0.21053,
"precision_at_20": 0.12807,
"precision_at_50": 0.06947,
"precision_at_100": 0.03842,
"mrr_at_1": 0.5263157894736842,
"mrr_at_3": 0.6461988304093568,
"mrr_at_5": 0.6549707602339182,
"mrr_at_10": 0.6659844054580898,
"mrr_at_20": 0.6673339331234068,
"mrr_at_50": 0.6679388938009629,
"mrr_at_100": 0.6679388938009629,
"naucs_at_1_max": -0.018448353550608226,
"naucs_at_1_std": 0.0821493132969922,
"naucs_at_1_diff1": 0.30290509894323814,
"naucs_at_3_max": -0.16441638665467292,
"naucs_at_3_std": 0.05181451792946125,
"naucs_at_3_diff1": 0.17081667434507056,
"naucs_at_5_max": -0.2223104695809391,
"naucs_at_5_std": -0.0034901998225501346,
"naucs_at_5_diff1": 0.11827209266301716,
"naucs_at_10_max": -0.3490810408001137,
"naucs_at_10_std": -0.10137127012539782,
"naucs_at_10_diff1": 0.024290790916341346,
"naucs_at_20_max": -0.41179472120133376,
"naucs_at_20_std": -0.18184189514711724,
"naucs_at_20_diff1": -0.026948094739752244,
"naucs_at_50_max": -0.4169831140986695,
"naucs_at_50_std": -0.2419827968566681,
"naucs_at_50_diff1": -0.14707184113572777,
"naucs_at_100_max": -0.41046730276590754,
"naucs_at_100_std": -0.2436064377498405,
"naucs_at_100_diff1": -0.16240322922206768
},
"vidore/synthetic_economics_macro_economy_2024_filtered_v1.0": {
"ndcg_at_1": 0.7931,
"ndcg_at_3": 0.69066,
"ndcg_at_5": 0.65993,
"ndcg_at_10": 0.62291,
"ndcg_at_20": 0.64258,
"ndcg_at_50": 0.70498,
"ndcg_at_100": 0.73984,
"map_at_1": 0.11768,
"map_at_3": 0.22479,
"map_at_5": 0.28825,
"map_at_10": 0.35934,
"map_at_20": 0.42423,
"map_at_50": 0.48412,
"map_at_100": 0.51142,
"recall_at_1": 0.11768,
"recall_at_3": 0.26124,
"recall_at_5": 0.34909,
"recall_at_10": 0.46824,
"recall_at_20": 0.62417,
"recall_at_50": 0.80904,
"recall_at_100": 0.92098,
"precision_at_1": 0.7931,
"precision_at_3": 0.62069,
"precision_at_5": 0.56552,
"precision_at_10": 0.43966,
"precision_at_20": 0.325,
"precision_at_50": 0.20172,
"precision_at_100": 0.12914,
"mrr_at_1": 0.7931034482758621,
"mrr_at_3": 0.8534482758620691,
"mrr_at_5": 0.8568965517241378,
"mrr_at_10": 0.8597701149425288,
"mrr_at_20": 0.8620158408190863,
"mrr_at_50": 0.8620158408190863,
"mrr_at_100": 0.8620158408190863,
"naucs_at_1_max": 0.271935938073248,
"naucs_at_1_std": 0.43674674991288676,
"naucs_at_1_diff1": 0.3617820074090711,
"naucs_at_3_max": 0.045282507585294354,
"naucs_at_3_std": 0.14844039042832088,
"naucs_at_3_diff1": 0.11059599624516278,
"naucs_at_5_max": 0.06086984174322351,
"naucs_at_5_std": 0.15073825039690825,
"naucs_at_5_diff1": 0.07597281303252662,
"naucs_at_10_max": 0.030803253605626704,
"naucs_at_10_std": 0.12023189876899391,
"naucs_at_10_diff1": 0.09409994930103974,
"naucs_at_20_max": 0.06111477495291343,
"naucs_at_20_std": 0.1377686346379398,
"naucs_at_20_diff1": 0.08342034215323584,
"naucs_at_50_max": -0.0214422324455313,
"naucs_at_50_std": 0.0629645228435432,
"naucs_at_50_diff1": 0.03433912496739525,
"naucs_at_100_max": -0.07270216260742496,
"naucs_at_100_std": -0.009713954266926159,
"naucs_at_100_diff1": -0.00289458364944889
},
"vidore/synthetic_mit_biomedical_tissue_interactions_unfiltered": {
"ndcg_at_1": 0.63125,
"ndcg_at_3": 0.63272,
"ndcg_at_5": 0.65663,
"ndcg_at_10": 0.68997,
"ndcg_at_20": 0.71467,
"ndcg_at_50": 0.73633,
"ndcg_at_100": 0.74718,
"map_at_1": 0.39991,
"map_at_3": 0.5245,
"map_at_5": 0.57059,
"map_at_10": 0.6074,
"map_at_20": 0.62094,
"map_at_50": 0.62966,
"map_at_100": 0.63202,
"recall_at_1": 0.39991,
"recall_at_3": 0.57796,
"recall_at_5": 0.67437,
"recall_at_10": 0.77096,
"recall_at_20": 0.84121,
"recall_at_50": 0.90687,
"recall_at_100": 0.94874,
"precision_at_1": 0.63125,
"precision_at_3": 0.38958,
"precision_at_5": 0.29375,
"precision_at_10": 0.18688,
"precision_at_20": 0.10844,
"precision_at_50": 0.05075,
"precision_at_100": 0.02756,
"mrr_at_1": 0.63125,
"mrr_at_3": 0.715625,
"mrr_at_5": 0.7274999999999998,
"mrr_at_10": 0.7328447420634919,
"mrr_at_20": 0.7370251189782439,
"mrr_at_50": 0.7376058481449105,
"mrr_at_100": 0.737786021875342,
"naucs_at_1_max": 0.40116615786322174,
"naucs_at_1_std": 0.12804177750728857,
"naucs_at_1_diff1": 0.5318484780069298,
"naucs_at_3_max": 0.031070174638639564,
"naucs_at_3_std": -0.03258401349687653,
"naucs_at_3_diff1": -0.08211207879257611,
"naucs_at_5_max": -0.03804589294380602,
"naucs_at_5_std": -0.0638529839983047,
"naucs_at_5_diff1": -0.1625118765251509,
"naucs_at_10_max": -0.08589738686452425,
"naucs_at_10_std": -0.0652662376777225,
"naucs_at_10_diff1": -0.27588514824978205,
"naucs_at_20_max": -0.14280800843691288,
"naucs_at_20_std": -0.050772727555263505,
"naucs_at_20_diff1": -0.33260125020460346,
"naucs_at_50_max": -0.18794085961226306,
"naucs_at_50_std": -0.09315309781822757,
"naucs_at_50_diff1": -0.3809855756340824,
"naucs_at_100_max": -0.20443798069201818,
"naucs_at_100_std": -0.09564469982214785,
"naucs_at_100_diff1": -0.416619080759233
}
}
}