Visual Document Retrieval
ColPali
Safetensors
English
vidore
vidore-experimental
colqwen2.5-v0.2 / results.json
QuentinJG's picture
Update results.json
80b8299 verified
{
"metadata": {
"timestamp": "2025-01-31T14:00:16.349261",
"vidore_benchmark_version": "4.0.3.dev20+g2d72668"
},
"metrics": {
"vidore/restaurant_esg_reports_beir": {"ndcg_at_1": 0.64103, "ndcg_at_3": 0.67538, "ndcg_at_5": 0.68397, "ndcg_at_10": 0.71199, "ndcg_at_20": 0.73099, "ndcg_at_50": 0.75581, "ndcg_at_100": 0.76163, "map_at_1": 0.43942, "map_at_3": 0.58034, "map_at_5": 0.6105, "map_at_10": 0.63715, "map_at_20": 0.64674, "map_at_50": 0.65463, "map_at_100": 0.65653, "recall_at_1": 0.43942, "recall_at_3": 0.6766, "recall_at_5": 0.73558, "recall_at_10": 0.81426, "recall_at_20": 0.87567, "recall_at_50": 0.95485, "recall_at_100": 0.981, "precision_at_1": 0.65385, "precision_at_3": 0.39744, "precision_at_5": 0.27692, "precision_at_10": 0.16538, "precision_at_20": 0.09423, "precision_at_50": 0.04346, "precision_at_100": 0.02308, "mrr_at_1": 0.6730769230769231, "mrr_at_3": 0.7467948717948718, "mrr_at_5": 0.7592948717948718, "mrr_at_10": 0.7647893772893772, "mrr_at_20": 0.7647893772893772, "mrr_at_50": 0.76724122651542, "mrr_at_100": 0.76724122651542, "naucs_at_1_max": 0.10629249714250551, "naucs_at_1_std": 0.03656703481974433, "naucs_at_1_diff1": 0.6471348946136236, "naucs_at_3_max": -0.04531273341377843, "naucs_at_3_std": 0.00041838369923711004, "naucs_at_3_diff1": -0.10904002079315368, "naucs_at_5_max": -0.11437346877355879, "naucs_at_5_std": -0.03247506128676773, "naucs_at_5_diff1": -0.23163739837531055, "naucs_at_10_max": -0.17966299098993738, "naucs_at_10_std": -0.08845607083585832, "naucs_at_10_diff1": -0.3668906677620788, "naucs_at_20_max": -0.1623997659302278, "naucs_at_20_std": -0.05328921373458377, "naucs_at_20_diff1": -0.4139154609733948, "naucs_at_50_max": -0.15835976853630981, "naucs_at_50_std": -0.042923187520787366, "naucs_at_50_diff1": -0.45626822378009313, "naucs_at_100_max": -0.14433851613678755, "naucs_at_100_std": -0.03148299510892002, "naucs_at_100_diff1": -0.44576138476398025},
"vidore/synthetics_economics_macro_economy_2024_filtered_v1.0_multilingual": {
"ndcg_at_1": 0.60345,
"ndcg_at_3": 0.59658,
"ndcg_at_5": 0.56521,
"ndcg_at_10": 0.55055,
"ndcg_at_20": 0.57899,
"ndcg_at_50": 0.65246,
"ndcg_at_100": 0.68858,
"map_at_1": 0.08192,
"map_at_3": 0.18869,
"map_at_5": 0.23861,
"map_at_10": 0.30685,
"map_at_20": 0.36485,
"map_at_50": 0.42784,
"map_at_100": 0.45362,
"recall_at_1": 0.08192,
"recall_at_3": 0.23525,
"recall_at_5": 0.31079,
"recall_at_10": 0.43833,
"recall_at_20": 0.58306,
"recall_at_50": 0.78859,
"recall_at_100": 0.90965,
"precision_at_1": 0.60345,
"precision_at_3": 0.5546,
"precision_at_5": 0.49138,
"precision_at_10": 0.39914,
"precision_at_20": 0.30539,
"precision_at_50": 0.1981,
"precision_at_100": 0.12647,
"mrr_at_1": 0.5948275862068966,
"mrr_at_3": 0.7140804597701149,
"mrr_at_5": 0.7311063218390805,
"mrr_at_10": 0.7372383004926109,
"mrr_at_20": 0.7380691285134744,
"mrr_at_50": 0.738889335917265,
"mrr_at_100": 0.738889335917265,
"naucs_at_1_max": 0.009301400086149124,
"naucs_at_1_std": -0.018176205759631064,
"naucs_at_1_diff1": 0.06589141538556753,
"naucs_at_3_max": 0.03608007053002765,
"naucs_at_3_std": 0.045332981794521165,
"naucs_at_3_diff1": 0.0027274204838523214,
"naucs_at_5_max": 0.06351874275538175,
"naucs_at_5_std": 0.09161670694703962,
"naucs_at_5_diff1": 0.030104357247264922,
"naucs_at_10_max": 0.09045732284339944,
"naucs_at_10_std": 0.11937912992266166,
"naucs_at_10_diff1": -0.007723827231040398,
"naucs_at_20_max": 0.04097490582062997,
"naucs_at_20_std": 0.11121740670187244,
"naucs_at_20_diff1": -0.04080919911505186,
"naucs_at_50_max": -0.04431654376754045,
"naucs_at_50_std": 0.1075378398002067,
"naucs_at_50_diff1": -0.0408768243788732,
"naucs_at_100_max": -0.08194156783211,
"naucs_at_100_std": 0.08152221906964778,
"naucs_at_100_diff1": -0.002462405639259035
},
"vidore/synthetic_axa_filtered_v1.0_multilingual": {
"ndcg_at_1": 0.44444,
"ndcg_at_3": 0.52927,
"ndcg_at_5": 0.53193,
"ndcg_at_10": 0.55273,
"ndcg_at_20": 0.57791,
"ndcg_at_50": 0.62959,
"ndcg_at_100": 0.64947,
"map_at_1": 0.19923,
"map_at_3": 0.31897,
"map_at_5": 0.3681,
"map_at_10": 0.4284,
"map_at_20": 0.45565,
"map_at_50": 0.47849,
"map_at_100": 0.48445,
"recall_at_1": 0.19923,
"recall_at_3": 0.43016,
"recall_at_5": 0.51283,
"recall_at_10": 0.63101,
"recall_at_20": 0.7193,
"recall_at_50": 0.86749,
"recall_at_100": 0.93786,
"precision_at_1": 0.44444,
"precision_at_3": 0.39815,
"precision_at_5": 0.33611,
"precision_at_10": 0.25,
"precision_at_20": 0.15347,
"precision_at_50": 0.08167,
"precision_at_100": 0.04556,
"mrr_at_1": 0.4444444444444444,
"mrr_at_3": 0.6041666666666666,
"mrr_at_5": 0.6111111111111112,
"mrr_at_10": 0.6134259259259259,
"mrr_at_20": 0.6134259259259259,
"mrr_at_50": 0.6156871267846877,
"mrr_at_100": 0.6160388005738615,
"naucs_at_1_max": -0.007676494689249098,
"naucs_at_1_std": 0.15632886231764911,
"naucs_at_1_diff1": 0.3454147669831923,
"naucs_at_3_max": -0.21520431732796824,
"naucs_at_3_std": -0.039307896873910286,
"naucs_at_3_diff1": 0.07075823324379214,
"naucs_at_5_max": -0.23427920743418434,
"naucs_at_5_std": -0.04955213973003769,
"naucs_at_5_diff1": 0.03587555672187707,
"naucs_at_10_max": -0.32076687527735803,
"naucs_at_10_std": -0.08584531062590048,
"naucs_at_10_diff1": -0.13920437910700148,
"naucs_at_20_max": -0.3500838034005256,
"naucs_at_20_std": -0.11679539412969686,
"naucs_at_20_diff1": -0.2051894549829469,
"naucs_at_50_max": -0.4102497000902005,
"naucs_at_50_std": -0.1409315271751862,
"naucs_at_50_diff1": -0.16443764913412845,
"naucs_at_100_max": -0.43730180953377223,
"naucs_at_100_std": -0.17380745870110292,
"naucs_at_100_diff1": -0.19442949153976513
},
"vidore/synthetic_mit_biomedical_tissue_interactions_unfiltered": {
"ndcg_at_1": 0.61875,
"ndcg_at_3": 0.61406,
"ndcg_at_5": 0.63644,
"ndcg_at_10": 0.67591,
"ndcg_at_20": 0.70178,
"ndcg_at_50": 0.72212,
"ndcg_at_100": 0.7297,
"map_at_1": 0.38142,
"map_at_3": 0.50057,
"map_at_5": 0.54282,
"map_at_10": 0.58278,
"map_at_20": 0.59965,
"map_at_50": 0.60789,
"map_at_100": 0.60942,
"recall_at_1": 0.38142,
"recall_at_3": 0.55686,
"recall_at_5": 0.65567,
"recall_at_10": 0.77349,
"recall_at_20": 0.84542,
"recall_at_50": 0.902,
"recall_at_100": 0.93314,
"precision_at_1": 0.61875,
"precision_at_3": 0.38333,
"precision_at_5": 0.28875,
"precision_at_10": 0.18875,
"precision_at_20": 0.11063,
"precision_at_50": 0.052,
"precision_at_100": 0.02756,
"mrr_at_1": 0.6,
"mrr_at_3": 0.6947916666666667,
"mrr_at_5": 0.7104166666666667,
"mrr_at_10": 0.7197544642857143,
"mrr_at_20": 0.7207690746753247,
"mrr_at_50": 0.7216319385110503,
"mrr_at_100": 0.7218020773999393,
"naucs_at_1_max": 0.23570942089460648,
"naucs_at_1_std": -0.0331808109585888,
"naucs_at_1_diff1": 0.38829894385449926,
"naucs_at_3_max": -0.02996939892755872,
"naucs_at_3_std": -0.06455703309969216,
"naucs_at_3_diff1": -0.10409043693090879,
"naucs_at_5_max": -0.10452188626653831,
"naucs_at_5_std": -0.052524231286355125,
"naucs_at_5_diff1": -0.26201383842532566,
"naucs_at_10_max": -0.18753439904110775,
"naucs_at_10_std": -0.07594574430351896,
"naucs_at_10_diff1": -0.3404263646481817,
"naucs_at_20_max": -0.20945097879456231,
"naucs_at_20_std": -0.04291331785264603,
"naucs_at_20_diff1": -0.35991045256760157,
"naucs_at_50_max": -0.25078519595626036,
"naucs_at_50_std": -0.021452523948669356,
"naucs_at_50_diff1": -0.3863780246795678,
"naucs_at_100_max": -0.2723431611743009,
"naucs_at_100_std": -0.031237471793638266,
"naucs_at_100_diff1": -0.38639136112161093
},
"vidore/synthetic_rse_restaurant_filtered_v1.0": {
"ndcg_at_1": 0.57895,
"ndcg_at_3": 0.57099,
"ndcg_at_5": 0.57396,
"ndcg_at_10": 0.6394,
"ndcg_at_20": 0.67256,
"ndcg_at_50": 0.70473,
"ndcg_at_100": 0.71518,
"map_at_1": 0.26466,
"map_at_3": 0.41771,
"map_at_5": 0.45328,
"map_at_10": 0.515,
"map_at_20": 0.53681,
"map_at_50": 0.55475,
"map_at_100": 0.55975,
"recall_at_1": 0.26466,
"recall_at_3": 0.50881,
"recall_at_5": 0.57932,
"recall_at_10": 0.77663,
"recall_at_20": 0.8768,
"recall_at_50": 0.96898,
"recall_at_100": 1.0,
"precision_at_1": 0.57895,
"precision_at_3": 0.39766,
"precision_at_5": 0.29123,
"precision_at_10": 0.21053,
"precision_at_20": 0.13246,
"precision_at_50": 0.07123,
"precision_at_100": 0.03895,
"mrr_at_1": 0.5614035087719298,
"mrr_at_3": 0.6637426900584795,
"mrr_at_5": 0.6751461988304094,
"mrr_at_10": 0.6886173767752715,
"mrr_at_20": 0.6913087643350802,
"mrr_at_50": 0.6925429103060682,
"mrr_at_100": 0.6925429103060682,
"naucs_at_1_max": -0.32399679124866293,
"naucs_at_1_std": -0.3157496852536844,
"naucs_at_1_diff1": 0.059217413521438306,
"naucs_at_3_max": -0.16317940152105928,
"naucs_at_3_std": -0.036766880845353206,
"naucs_at_3_diff1": 0.13451653330920363,
"naucs_at_5_max": -0.18872080560435078,
"naucs_at_5_std": -0.08965899629213353,
"naucs_at_5_diff1": 0.09733357617902798,
"naucs_at_10_max": -0.21096127425243222,
"naucs_at_10_std": -0.0492682492736064,
"naucs_at_10_diff1": 0.06579043413332678,
"naucs_at_20_max": -0.3151765999140926,
"naucs_at_20_std": -0.11272929289257284,
"naucs_at_20_diff1": -0.030784322032566636,
"naucs_at_50_max": -0.29489025135650376,
"naucs_at_50_std": -0.008523958191869246,
"naucs_at_50_diff1": -0.11796822928434904,
"naucs_at_100_max": -0.2661970083875134,
"naucs_at_100_std": 0.05555820249689567,
"naucs_at_100_diff1": -0.1271611921091859
},
"vidore/synthetic_rse_restaurant_filtered_v1.0_multilingual": {
"ndcg_at_1": 0.55702,
"ndcg_at_3": 0.5542,
"ndcg_at_5": 0.5738,
"ndcg_at_10": 0.62953,
"ndcg_at_20": 0.67065,
"ndcg_at_50": 0.6964,
"ndcg_at_100": 0.70872,
"map_at_1": 0.25589,
"map_at_3": 0.40701,
"map_at_5": 0.45304,
"map_at_10": 0.5087,
"map_at_20": 0.53389,
"map_at_50": 0.5501,
"map_at_100": 0.55542,
"recall_at_1": 0.25589,
"recall_at_3": 0.49373,
"recall_at_5": 0.59174,
"recall_at_10": 0.76938,
"recall_at_20": 0.89178,
"recall_at_50": 0.9594,
"recall_at_100": 1.0,
"precision_at_1": 0.55702,
"precision_at_3": 0.3845,
"precision_at_5": 0.29649,
"precision_at_10": 0.20746,
"precision_at_20": 0.13487,
"precision_at_50": 0.0707,
"precision_at_100": 0.03895,
"mrr_at_1": 0.5570175438596491,
"mrr_at_3": 0.6571637426900585,
"mrr_at_5": 0.6698830409356724,
"mrr_at_10": 0.683766708437761,
"mrr_at_20": 0.687599964534949,
"mrr_at_50": 0.6879085010276961,
"mrr_at_100": 0.6880572205275953,
"naucs_at_1_max": -0.17166276074798967,
"naucs_at_1_std": -0.20325235499471186,
"naucs_at_1_diff1": 0.33001833715444423,
"naucs_at_3_max": -0.04474887443402487,
"naucs_at_3_std": -0.008560331928141176,
"naucs_at_3_diff1": 0.1746255699902219,
"naucs_at_5_max": -0.08458531884834858,
"naucs_at_5_std": -0.06118868392476525,
"naucs_at_5_diff1": 0.13235525060593817,
"naucs_at_10_max": -0.12880215182381638,
"naucs_at_10_std": -0.08311726109553826,
"naucs_at_10_diff1": 0.11900519462159719,
"naucs_at_20_max": -0.18439650375622735,
"naucs_at_20_std": -0.051821500134533655,
"naucs_at_20_diff1": -0.015123572562768748,
"naucs_at_50_max": -0.20702547660326365,
"naucs_at_50_std": 0.02211997502899773,
"naucs_at_50_diff1": -0.1539679823951051,
"naucs_at_100_max": -0.1731060459048004,
"naucs_at_100_std": 0.1019715434458989,
"naucs_at_100_diff1": -0.1841288831466728
},
"vidore/synthetic_mit_biomedical_tissue_interactions_unfiltered_multilingual": {
"ndcg_at_1": 0.57812,
"ndcg_at_3": 0.58744,
"ndcg_at_5": 0.61127,
"ndcg_at_10": 0.64614,
"ndcg_at_20": 0.67298,
"ndcg_at_50": 0.6947,
"ndcg_at_100": 0.70357,
"map_at_1": 0.35834,
"map_at_3": 0.47597,
"map_at_5": 0.51819,
"map_at_10": 0.55455,
"map_at_20": 0.57016,
"map_at_50": 0.5782,
"map_at_100": 0.58034,
"recall_at_1": 0.35834,
"recall_at_3": 0.54214,
"recall_at_5": 0.63727,
"recall_at_10": 0.74383,
"recall_at_20": 0.82133,
"recall_at_50": 0.88659,
"recall_at_100": 0.91866,
"precision_at_1": 0.57812,
"precision_at_3": 0.3651,
"precision_at_5": 0.28,
"precision_at_10": 0.18,
"precision_at_20": 0.10617,
"precision_at_50": 0.05,
"precision_at_100": 0.02695,
"mrr_at_1": 0.5671875,
"mrr_at_3": 0.6708333333333333,
"mrr_at_5": 0.6866145833333334,
"mrr_at_10": 0.6939360119047618,
"mrr_at_20": 0.6963204666729361,
"mrr_at_50": 0.6971792252566347,
"mrr_at_100": 0.6973040137004454,
"naucs_at_1_max": 0.22350385772789982,
"naucs_at_1_std": -0.014236260379664127,
"naucs_at_1_diff1": 0.415396972645202,
"naucs_at_3_max": 0.05168321374193644,
"naucs_at_3_std": -0.05262932689279111,
"naucs_at_3_diff1": -0.046426105116023936,
"naucs_at_5_max": -0.019935793098795593,
"naucs_at_5_std": -0.07180552504536146,
"naucs_at_5_diff1": -0.15736139387093928,
"naucs_at_10_max": -0.1020058048777736,
"naucs_at_10_std": -0.09370704449884888,
"naucs_at_10_diff1": -0.23614803376814614,
"naucs_at_20_max": -0.13810591303119216,
"naucs_at_20_std": -0.0692107572861515,
"naucs_at_20_diff1": -0.28493482904408224,
"naucs_at_50_max": -0.17286447176352046,
"naucs_at_50_std": -0.04984221651971845,
"naucs_at_50_diff1": -0.317010129235068,
"naucs_at_100_max": -0.18980306870058375,
"naucs_at_100_std": -0.048954124365436114,
"naucs_at_100_diff1": -0.3281886367637723
},
"vidore/synthetic_axa_filtered_v1.0": {
"ndcg_at_1": 0.44444,
"ndcg_at_3": 0.55779,
"ndcg_at_5": 0.60297,
"ndcg_at_10": 0.63112,
"ndcg_at_20": 0.65055,
"ndcg_at_50": 0.69129,
"ndcg_at_100": 0.70318,
"map_at_1": 0.22361,
"map_at_3": 0.34019,
"map_at_5": 0.42558,
"map_at_10": 0.50246,
"map_at_20": 0.53023,
"map_at_50": 0.54858,
"map_at_100": 0.55304,
"recall_at_1": 0.22361,
"recall_at_3": 0.43907,
"recall_at_5": 0.59758,
"recall_at_10": 0.75267,
"recall_at_20": 0.82791,
"recall_at_50": 0.94587,
"recall_at_100": 0.9784,
"precision_at_1": 0.44444,
"precision_at_3": 0.42593,
"precision_at_5": 0.4,
"precision_at_10": 0.29444,
"precision_at_20": 0.175,
"precision_at_50": 0.08556,
"precision_at_100": 0.04611,
"mrr_at_1": 0.4444444444444444,
"mrr_at_3": 0.6111111111111112,
"mrr_at_5": 0.625,
"mrr_at_10": 0.6342592592592592,
"mrr_at_20": 0.6342592592592592,
"mrr_at_50": 0.6367845117845118,
"mrr_at_100": 0.6367845117845118,
"naucs_at_1_max": 0.27180734937990775,
"naucs_at_1_std": 0.1460001284215161,
"naucs_at_1_diff1": 0.52680845013576,
"naucs_at_3_max": -0.4472601618035251,
"naucs_at_3_std": -0.35334842300017605,
"naucs_at_3_diff1": -0.022038941836526545,
"naucs_at_5_max": -0.5746685319786979,
"naucs_at_5_std": -0.45581287349947885,
"naucs_at_5_diff1": -0.02909625842935311,
"naucs_at_10_max": -0.6670105211539744,
"naucs_at_10_std": -0.4579454710599414,
"naucs_at_10_diff1": -0.291350928264914,
"naucs_at_20_max": -0.7088454526103415,
"naucs_at_20_std": -0.45884776633256535,
"naucs_at_20_diff1": -0.39562206735708155,
"naucs_at_50_max": -0.7078100142972502,
"naucs_at_50_std": -0.4315828703198929,
"naucs_at_50_diff1": -0.37094602463897214,
"naucs_at_100_max": -0.7059796119743438,
"naucs_at_100_std": -0.400631653419931,
"naucs_at_100_diff1": -0.33114628268848284
},
"vidore/synthetic_economics_macro_economy_2024_filtered_v1.0": {
"ndcg_at_1": 0.67241,
"ndcg_at_3": 0.64169,
"ndcg_at_5": 0.5978,
"ndcg_at_10": 0.58577,
"ndcg_at_20": 0.61496,
"ndcg_at_50": 0.6772,
"ndcg_at_100": 0.71432,
"map_at_1": 0.08152,
"map_at_3": 0.20404,
"map_at_5": 0.2537,
"map_at_10": 0.32889,
"map_at_20": 0.39447,
"map_at_50": 0.4536,
"map_at_100": 0.48141,
"recall_at_1": 0.08152,
"recall_at_3": 0.2494,
"recall_at_5": 0.32267,
"recall_at_10": 0.45814,
"recall_at_20": 0.61677,
"recall_at_50": 0.80189,
"recall_at_100": 0.92313,
"precision_at_1": 0.67241,
"precision_at_3": 0.59195,
"precision_at_5": 0.51379,
"precision_at_10": 0.42586,
"precision_at_20": 0.325,
"precision_at_50": 0.20138,
"precision_at_100": 0.12983,
"mrr_at_1": 0.6724137931034483,
"mrr_at_3": 0.7729885057471265,
"mrr_at_5": 0.7807471264367816,
"mrr_at_10": 0.7857758620689655,
"mrr_at_20": 0.7868534482758621,
"mrr_at_50": 0.7876030734632684,
"mrr_at_100": 0.7876030734632684,
"naucs_at_1_max": 0.34454681161877004,
"naucs_at_1_std": 0.5235431895381841,
"naucs_at_1_diff1": -0.08387631081097016,
"naucs_at_3_max": 0.08884531420395679,
"naucs_at_3_std": 0.2382734233882671,
"naucs_at_3_diff1": -0.1871866677817215,
"naucs_at_5_max": 0.01311909348957855,
"naucs_at_5_std": 0.2167381673457986,
"naucs_at_5_diff1": -0.14497179289018872,
"naucs_at_10_max": 0.14293369671235354,
"naucs_at_10_std": 0.22265260242487017,
"naucs_at_10_diff1": -0.09048933555139305,
"naucs_at_20_max": 0.08115085333286959,
"naucs_at_20_std": 0.20688202040577058,
"naucs_at_20_diff1": -0.15069532949644948,
"naucs_at_50_max": -0.010126566692404412,
"naucs_at_50_std": 0.24164336672801914,
"naucs_at_50_diff1": -0.10468292902065172,
"naucs_at_100_max": -0.04114659355878923,
"naucs_at_100_std": 0.2129831852026439,
"naucs_at_100_diff1": -0.03795755522744344
},
"data_dir/eval_vidore/arxivqa_test_subsampled": {
"ndcg_at_1": 0.856,
"ndcg_at_3": 0.88745,
"ndcg_at_5": 0.89227,
"ndcg_at_10": 0.90332,
"ndcg_at_20": 0.90941,
"ndcg_at_50": 0.91153,
"ndcg_at_100": 0.91252,
"map_at_1": 0.856,
"map_at_3": 0.87967,
"map_at_5": 0.88227,
"map_at_10": 0.88687,
"map_at_20": 0.88854,
"map_at_50": 0.88895,
"map_at_100": 0.88904,
"recall_at_1": 0.856,
"recall_at_3": 0.91,
"recall_at_5": 0.922,
"recall_at_10": 0.956,
"recall_at_20": 0.98,
"recall_at_50": 0.99,
"recall_at_100": 0.996,
"precision_at_1": 0.856,
"precision_at_3": 0.30333,
"precision_at_5": 0.1844,
"precision_at_10": 0.0956,
"precision_at_20": 0.049,
"precision_at_50": 0.0198,
"precision_at_100": 0.00996,
"mrr_at_1": 0.854,
"mrr_at_3": 0.8773333333333334,
"mrr_at_5": 0.8809333333333332,
"mrr_at_10": 0.8855674603174604,
"mrr_at_20": 0.8873665921453847,
"mrr_at_50": 0.8876643128304966,
"mrr_at_100": 0.887751797810069,
"naucs_at_1_max": 0.8146679814134421,
"naucs_at_1_std": 0.07396801383185674,
"naucs_at_1_diff1": 0.9423560082126644,
"naucs_at_3_max": 0.8066396929142029,
"naucs_at_3_std": 0.07559912854030806,
"naucs_at_3_diff1": 0.9181969083929873,
"naucs_at_5_max": 0.8034068328185975,
"naucs_at_5_std": 0.02020637314754663,
"naucs_at_5_diff1": 0.9160860925566815,
"naucs_at_10_max": 0.825566590272474,
"naucs_at_10_std": -0.15187590187589842,
"naucs_at_10_diff1": 0.9390968508615584,
"naucs_at_20_max": 0.8921568627450932,
"naucs_at_20_std": 0.0641923436041116,
"naucs_at_20_diff1": 0.9738562091503187,
"naucs_at_50_max": 0.947712418300658,
"naucs_at_50_std": 0.37030812324930756,
"naucs_at_50_diff1": 0.9738562091503188,
"naucs_at_100_max": 1.0,
"naucs_at_100_std": 1.0,
"naucs_at_100_diff1": 1.0
},
"data_dir/eval_vidore/docvqa_test_subsampled": {
"ndcg_at_1": 0.55876,
"ndcg_at_3": 0.61485,
"ndcg_at_5": 0.63222,
"ndcg_at_10": 0.65493,
"ndcg_at_20": 0.66746,
"ndcg_at_50": 0.67657,
"ndcg_at_100": 0.68329,
"map_at_1": 0.55876,
"map_at_3": 0.60126,
"map_at_5": 0.6109,
"map_at_10": 0.62013,
"map_at_20": 0.62368,
"map_at_50": 0.62509,
"map_at_100": 0.62564,
"recall_at_1": 0.55876,
"recall_at_3": 0.6541,
"recall_at_5": 0.69623,
"recall_at_10": 0.76718,
"recall_at_20": 0.81596,
"recall_at_50": 0.86253,
"recall_at_100": 0.90466,
"precision_at_1": 0.55876,
"precision_at_3": 0.21803,
"precision_at_5": 0.13925,
"precision_at_10": 0.07672,
"precision_at_20": 0.0408,
"precision_at_50": 0.01725,
"precision_at_100": 0.00905,
"mrr_at_1": 0.5543237250554324,
"mrr_at_3": 0.599039172209904,
"mrr_at_5": 0.609349593495935,
"mrr_at_10": 0.6183401963889769,
"mrr_at_20": 0.6209344044461912,
"mrr_at_50": 0.6227106859869997,
"mrr_at_100": 0.6232889837626537,
"naucs_at_1_max": 0.29569387287927856,
"naucs_at_1_std": 0.6842470452244832,
"naucs_at_1_diff1": 0.9092758189268736,
"naucs_at_3_max": 0.21005633503267365,
"naucs_at_3_std": 0.805068083051039,
"naucs_at_3_diff1": 0.8754563618133548,
"naucs_at_5_max": 0.19259019824979384,
"naucs_at_5_std": 0.8409490067520664,
"naucs_at_5_diff1": 0.8726101181684977,
"naucs_at_10_max": 0.048646855770537796,
"naucs_at_10_std": 0.8833213018935924,
"naucs_at_10_diff1": 0.8643899050698751,
"naucs_at_20_max": -0.06225799483664109,
"naucs_at_20_std": 0.9127300541361831,
"naucs_at_20_diff1": 0.8597071895030789,
"naucs_at_50_max": -0.24442668101014947,
"naucs_at_50_std": 0.930294669379938,
"naucs_at_50_diff1": 0.8714057920484658,
"naucs_at_100_max": -0.3617257884810223,
"naucs_at_100_std": 0.9386292283530702,
"naucs_at_100_diff1": 0.8597379463433718
},
"data_dir/eval_vidore/syntheticDocQA_energy_test": {
"ndcg_at_1": 0.93,
"ndcg_at_3": 0.95893,
"ndcg_at_5": 0.95893,
"ndcg_at_10": 0.95893,
"ndcg_at_20": 0.96163,
"ndcg_at_50": 0.96365,
"ndcg_at_100": 0.96365,
"map_at_1": 0.93,
"map_at_3": 0.95167,
"map_at_5": 0.95167,
"map_at_10": 0.95167,
"map_at_20": 0.9525,
"map_at_50": 0.95283,
"map_at_100": 0.95283,
"recall_at_1": 0.93,
"recall_at_3": 0.98,
"recall_at_5": 0.98,
"recall_at_10": 0.98,
"recall_at_20": 0.99,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.93,
"precision_at_3": 0.32667,
"precision_at_5": 0.196,
"precision_at_10": 0.098,
"precision_at_20": 0.0495,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.93,
"mrr_at_3": 0.9516666666666667,
"mrr_at_5": 0.9516666666666667,
"mrr_at_10": 0.9516666666666667,
"mrr_at_20": 0.9525757575757575,
"mrr_at_50": 0.9529205851619644,
"mrr_at_100": 0.9529205851619644,
"naucs_at_1_max": 0.39482459650526885,
"naucs_at_1_std": -0.31419234360410914,
"naucs_at_1_diff1": 1.0,
"naucs_at_3_max": 0.6790382819794457,
"naucs_at_3_std": -0.9556489262371661,
"naucs_at_3_diff1": 1.0,
"naucs_at_5_max": 0.6790382819794609,
"naucs_at_5_std": -0.9556489262371534,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 0.6790382819794609,
"naucs_at_10_std": -0.9556489262371534,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": -0.1713352007469681,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"data_dir/eval_vidore/tatdqa_test": {
"ndcg_at_1": 0.69927,
"ndcg_at_3": 0.79372,
"ndcg_at_5": 0.81105,
"ndcg_at_10": 0.82459,
"ndcg_at_20": 0.82878,
"ndcg_at_50": 0.83303,
"ndcg_at_100": 0.83442,
"map_at_1": 0.69927,
"map_at_3": 0.77106,
"map_at_5": 0.78072,
"map_at_10": 0.78653,
"map_at_20": 0.7877,
"map_at_50": 0.78839,
"map_at_100": 0.78852,
"recall_at_1": 0.69927,
"recall_at_3": 0.85905,
"recall_at_5": 0.90097,
"recall_at_10": 0.94168,
"recall_at_20": 0.95808,
"recall_at_50": 0.97934,
"recall_at_100": 0.98785,
"precision_at_1": 0.69927,
"precision_at_3": 0.28635,
"precision_at_5": 0.18019,
"precision_at_10": 0.09417,
"precision_at_20": 0.0479,
"precision_at_50": 0.01959,
"precision_at_100": 0.00988,
"mrr_at_1": 0.7004860267314702,
"mrr_at_3": 0.7722762251923856,
"mrr_at_5": 0.7813284730660186,
"mrr_at_10": 0.7874199598835079,
"mrr_at_20": 0.7885261582425689,
"mrr_at_50": 0.7892193634018624,
"mrr_at_100": 0.7893291443742743,
"naucs_at_1_max": 0.2682416909968819,
"naucs_at_1_std": -0.1346098281401034,
"naucs_at_1_diff1": 0.8296403667835969,
"naucs_at_3_max": 0.36050493227494845,
"naucs_at_3_std": -0.01834048113954263,
"naucs_at_3_diff1": 0.7445505884597561,
"naucs_at_5_max": 0.36523716935916267,
"naucs_at_5_std": 0.06489405058952001,
"naucs_at_5_diff1": 0.7142046612217674,
"naucs_at_10_max": 0.4293315802144752,
"naucs_at_10_std": 0.2564808038730297,
"naucs_at_10_diff1": 0.6873136665710184,
"naucs_at_20_max": 0.4688188620078513,
"naucs_at_20_std": 0.26917226500908054,
"naucs_at_20_diff1": 0.6720615167289586,
"naucs_at_50_max": 0.5671944664000176,
"naucs_at_50_std": 0.4964253483275758,
"naucs_at_50_diff1": 0.722603370462453,
"naucs_at_100_max": 0.6585255212623138,
"naucs_at_100_std": 0.5978336814194427,
"naucs_at_100_diff1": 0.8138609714332596
},
"data_dir/eval_vidore/infovqa_test_subsampled": {
"ndcg_at_1": 0.88462,
"ndcg_at_3": 0.91698,
"ndcg_at_5": 0.92378,
"ndcg_at_10": 0.92838,
"ndcg_at_20": 0.93146,
"ndcg_at_50": 0.93263,
"ndcg_at_100": 0.93362,
"map_at_1": 0.88462,
"map_at_3": 0.90924,
"map_at_5": 0.91309,
"map_at_10": 0.91501,
"map_at_20": 0.91585,
"map_at_50": 0.91603,
"map_at_100": 0.91612,
"recall_at_1": 0.88462,
"recall_at_3": 0.93927,
"recall_at_5": 0.95547,
"recall_at_10": 0.96964,
"recall_at_20": 0.98178,
"recall_at_50": 0.98785,
"recall_at_100": 0.99393,
"precision_at_1": 0.88462,
"precision_at_3": 0.31309,
"precision_at_5": 0.19109,
"precision_at_10": 0.09696,
"precision_at_20": 0.04909,
"precision_at_50": 0.01976,
"precision_at_100": 0.00994,
"mrr_at_1": 0.8846153846153846,
"mrr_at_3": 0.9092442645074225,
"mrr_at_5": 0.9129892037786774,
"mrr_at_10": 0.9147717049032839,
"mrr_at_20": 0.9154333931688503,
"mrr_at_50": 0.9156112743493511,
"mrr_at_100": 0.915698522470477,
"naucs_at_1_max": 0.6002033777762705,
"naucs_at_1_std": -0.07102965572007143,
"naucs_at_1_diff1": 0.9544715151522033,
"naucs_at_3_max": 0.8025453360230541,
"naucs_at_3_std": 0.19885112605813188,
"naucs_at_3_diff1": 0.960819563780572,
"naucs_at_5_max": 0.9121856227472513,
"naucs_at_5_std": 0.3583912666662475,
"naucs_at_5_diff1": 0.9584449918884831,
"naucs_at_10_max": 0.9368484108193146,
"naucs_at_10_std": 0.44097650713388975,
"naucs_at_10_diff1": 0.9651729455827266,
"naucs_at_20_max": 0.9709774546522766,
"naucs_at_20_std": 0.6007213904253922,
"naucs_at_20_diff1": 0.9854887273261383,
"naucs_at_50_max": 0.9782330909892136,
"naucs_at_50_std": 0.7577252323561762,
"naucs_at_50_diff1": 0.9782330909892136,
"naucs_at_100_max": 1.0,
"naucs_at_100_std": 0.7075525547215259,
"naucs_at_100_diff1": 0.9564661819784259
},
"data_dir/eval_vidore/syntheticDocQA_healthcare_industry_test": {
"ndcg_at_1": 0.95,
"ndcg_at_3": 0.97893,
"ndcg_at_5": 0.97893,
"ndcg_at_10": 0.97893,
"ndcg_at_20": 0.97893,
"ndcg_at_50": 0.97893,
"ndcg_at_100": 0.97893,
"map_at_1": 0.95,
"map_at_3": 0.97167,
"map_at_5": 0.97167,
"map_at_10": 0.97167,
"map_at_20": 0.97167,
"map_at_50": 0.97167,
"map_at_100": 0.97167,
"recall_at_1": 0.95,
"recall_at_3": 1.0,
"recall_at_5": 1.0,
"recall_at_10": 1.0,
"recall_at_20": 1.0,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.95,
"precision_at_3": 0.33333,
"precision_at_5": 0.2,
"precision_at_10": 0.1,
"precision_at_20": 0.05,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.96,
"mrr_at_3": 0.9783333333333333,
"mrr_at_5": 0.9783333333333333,
"mrr_at_10": 0.9783333333333333,
"mrr_at_20": 0.9783333333333333,
"mrr_at_50": 0.9783333333333333,
"mrr_at_100": 0.9783333333333333,
"naucs_at_1_max": 0.7605042016806716,
"naucs_at_1_std": -0.35732959850606716,
"naucs_at_1_diff1": 0.9738562091503253,
"naucs_at_3_max": 1.0,
"naucs_at_3_std": 1.0,
"naucs_at_3_diff1": 1.0,
"naucs_at_5_max": 1.0,
"naucs_at_5_std": 1.0,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 1.0,
"naucs_at_10_std": 1.0,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": 1.0,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"data_dir/eval_vidore/tabfquad_test_subsampled": {
"ndcg_at_1": 0.85714,
"ndcg_at_3": 0.90523,
"ndcg_at_5": 0.91122,
"ndcg_at_10": 0.91807,
"ndcg_at_20": 0.92163,
"ndcg_at_50": 0.92385,
"ndcg_at_100": 0.92385,
"map_at_1": 0.85714,
"map_at_3": 0.89345,
"map_at_5": 0.89685,
"map_at_10": 0.89962,
"map_at_20": 0.90057,
"map_at_50": 0.90097,
"map_at_100": 0.90097,
"recall_at_1": 0.85714,
"recall_at_3": 0.93929,
"recall_at_5": 0.95357,
"recall_at_10": 0.975,
"recall_at_20": 0.98929,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.85714,
"precision_at_3": 0.3131,
"precision_at_5": 0.19071,
"precision_at_10": 0.0975,
"precision_at_20": 0.04946,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.8571428571428571,
"mrr_at_3": 0.8928571428571429,
"mrr_at_5": 0.8955357142857143,
"mrr_at_10": 0.8989866780045351,
"mrr_at_20": 0.8999608080411652,
"mrr_at_50": 0.9003545809349381,
"mrr_at_100": 0.9003545809349381,
"naucs_at_1_max": 0.44880952380952394,
"naucs_at_1_std": 0.06635082604470473,
"naucs_at_1_diff1": 0.9110301263362479,
"naucs_at_3_max": 0.7531443950129105,
"naucs_at_3_std": 0.4460647003899606,
"naucs_at_3_diff1": 0.9288735101883916,
"naucs_at_5_max": 0.8075127486892179,
"naucs_at_5_std": 0.529124470300943,
"naucs_at_5_diff1": 0.917043740573152,
"naucs_at_10_max": 0.7902494331065706,
"naucs_at_10_std": 0.6329198346005056,
"naucs_at_10_diff1": 0.9626517273576021,
"naucs_at_20_max": 0.9564270152505505,
"naucs_at_20_std": 0.8638344226579515,
"naucs_at_20_diff1": 0.9564270152505505,
"naucs_at_50_max": 1.0,
"naucs_at_50_std": 1.0,
"naucs_at_50_diff1": 1.0,
"naucs_at_100_max": 1.0,
"naucs_at_100_std": 1.0,
"naucs_at_100_diff1": 1.0
},
"data_dir/eval_vidore/syntheticDocQA_government_reports_test": {
"ndcg_at_1": 0.92,
"ndcg_at_3": 0.96417,
"ndcg_at_5": 0.96417,
"ndcg_at_10": 0.9675,
"ndcg_at_20": 0.9675,
"ndcg_at_50": 0.9675,
"ndcg_at_100": 0.9675,
"map_at_1": 0.92,
"map_at_3": 0.955,
"map_at_5": 0.955,
"map_at_10": 0.95643,
"map_at_20": 0.95643,
"map_at_50": 0.95643,
"map_at_100": 0.95643,
"recall_at_1": 0.92,
"recall_at_3": 0.99,
"recall_at_5": 0.99,
"recall_at_10": 1.0,
"recall_at_20": 1.0,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.92,
"precision_at_3": 0.33,
"precision_at_5": 0.198,
"precision_at_10": 0.1,
"precision_at_20": 0.05,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.92,
"mrr_at_3": 0.955,
"mrr_at_5": 0.955,
"mrr_at_10": 0.9564285714285714,
"mrr_at_20": 0.9564285714285714,
"mrr_at_50": 0.9564285714285714,
"mrr_at_100": 0.9564285714285714,
"naucs_at_1_max": 0.8768674136321195,
"naucs_at_1_std": 0.41940943043884304,
"naucs_at_1_diff1": 0.9673202614379083,
"naucs_at_3_max": 1.0,
"naucs_at_3_std": 0.8692810457516356,
"naucs_at_3_diff1": 1.0,
"naucs_at_5_max": 1.0,
"naucs_at_5_std": 0.8692810457516413,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 1.0,
"naucs_at_10_std": 1.0,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": 1.0,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"data_dir/eval_vidore/shiftproject_test": {
"ndcg_at_1": 0.78,
"ndcg_at_3": 0.8644,
"ndcg_at_5": 0.87302,
"ndcg_at_10": 0.8828,
"ndcg_at_20": 0.88795,
"ndcg_at_50": 0.88997,
"ndcg_at_100": 0.88997,
"map_at_1": 0.78,
"map_at_3": 0.845,
"map_at_5": 0.85,
"map_at_10": 0.8541,
"map_at_20": 0.85555,
"map_at_50": 0.85589,
"map_at_100": 0.85589,
"recall_at_1": 0.78,
"recall_at_3": 0.92,
"recall_at_5": 0.94,
"recall_at_10": 0.97,
"recall_at_20": 0.99,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.78,
"precision_at_3": 0.30667,
"precision_at_5": 0.188,
"precision_at_10": 0.097,
"precision_at_20": 0.0495,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.81,
"mrr_at_3": 0.8633333333333333,
"mrr_at_5": 0.8658333333333332,
"mrr_at_10": 0.8699285714285715,
"mrr_at_20": 0.871412087912088,
"mrr_at_50": 0.8717454212454213,
"mrr_at_100": 0.8717454212454213,
"naucs_at_1_max": -0.24755413363008374,
"naucs_at_1_std": -0.6164510594890337,
"naucs_at_1_diff1": 0.8162006769601703,
"naucs_at_3_max": 0.2243814192343627,
"naucs_at_3_std": -0.23225957049486393,
"naucs_at_3_diff1": 0.8544000933706815,
"naucs_at_5_max": -0.012371615312794324,
"naucs_at_5_std": -0.5504201680672273,
"naucs_at_5_diff1": 0.9128540305010897,
"naucs_at_10_max": -0.049486461251166146,
"naucs_at_10_std": -0.27591036414565706,
"naucs_at_10_diff1": 0.9128540305010848,
"naucs_at_20_max": 0.7222222222222276,
"naucs_at_20_std": 0.5541549953314738,
"naucs_at_20_diff1": 0.8692810457516413,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"data_dir/eval_vidore/syntheticDocQA_artificial_intelligence_test": {
"ndcg_at_1": 0.99,
"ndcg_at_3": 0.99631,
"ndcg_at_5": 0.99631,
"ndcg_at_10": 0.99631,
"ndcg_at_20": 0.99631,
"ndcg_at_50": 0.99631,
"ndcg_at_100": 0.99631,
"map_at_1": 0.99,
"map_at_3": 0.995,
"map_at_5": 0.995,
"map_at_10": 0.995,
"map_at_20": 0.995,
"map_at_50": 0.995,
"map_at_100": 0.995,
"recall_at_1": 0.99,
"recall_at_3": 1.0,
"recall_at_5": 1.0,
"recall_at_10": 1.0,
"recall_at_20": 1.0,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.99,
"precision_at_3": 0.33333,
"precision_at_5": 0.2,
"precision_at_10": 0.1,
"precision_at_20": 0.05,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.99,
"mrr_at_3": 0.995,
"mrr_at_5": 0.995,
"mrr_at_10": 0.995,
"mrr_at_20": 0.995,
"mrr_at_50": 0.995,
"mrr_at_100": 0.995,
"naucs_at_1_max": 0.8692810457516276,
"naucs_at_1_std": -0.5634920634920657,
"naucs_at_1_diff1": 1.0,
"naucs_at_3_max": 1.0,
"naucs_at_3_std": 1.0,
"naucs_at_3_diff1": 1.0,
"naucs_at_5_max": 1.0,
"naucs_at_5_std": 1.0,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 1.0,
"naucs_at_10_std": 1.0,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": 1.0,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
}
}
}