|
{ |
|
"metadata": { |
|
"timestamp": "2025-03-09T16:34:55.435464", |
|
"vidore_benchmark_version": "0.1.dev293+g9358cf6" |
|
}, |
|
"metrics": { |
|
"vidore/arxivqa_test_subsampled": { |
|
"ndcg_at_1": 0.896, |
|
"ndcg_at_3": 0.9285, |
|
"ndcg_at_5": 0.93409, |
|
"ndcg_at_10": 0.93887, |
|
"ndcg_at_20": 0.94191, |
|
"ndcg_at_50": 0.94277, |
|
"ndcg_at_100": 0.94346, |
|
"map_at_1": 0.896, |
|
"map_at_3": 0.921, |
|
"map_at_5": 0.924, |
|
"map_at_10": 0.92612, |
|
"map_at_20": 0.92696, |
|
"map_at_50": 0.92712, |
|
"map_at_100": 0.92719, |
|
"recall_at_1": 0.896, |
|
"recall_at_3": 0.95, |
|
"recall_at_5": 0.964, |
|
"recall_at_10": 0.978, |
|
"recall_at_20": 0.99, |
|
"recall_at_50": 0.994, |
|
"recall_at_100": 0.998, |
|
"precision_at_1": 0.896, |
|
"precision_at_3": 0.31667, |
|
"precision_at_5": 0.1928, |
|
"precision_at_10": 0.0978, |
|
"precision_at_20": 0.0495, |
|
"precision_at_50": 0.01988, |
|
"precision_at_100": 0.00998, |
|
"mrr_at_1": 0.896, |
|
"mrr_at_3": 0.9213333333333332, |
|
"mrr_at_5": 0.9240333333333333, |
|
"mrr_at_10": 0.9264857142857141, |
|
"mrr_at_20": 0.9274158230658229, |
|
"mrr_at_50": 0.9274847885830643, |
|
"mrr_at_100": 0.9275602871585629, |
|
"naucs_at_1_max": 0.8456651988738907, |
|
"naucs_at_1_std": -0.12317729011766297, |
|
"naucs_at_1_diff1": 0.9409423951490659, |
|
"naucs_at_3_max": 0.8706816059757188, |
|
"naucs_at_3_std": 0.006965452847808854, |
|
"naucs_at_3_diff1": 0.9522875816993475, |
|
"naucs_at_5_max": 0.9080558149185568, |
|
"naucs_at_5_std": -0.04549227098247105, |
|
"naucs_at_5_diff1": 0.9555192447349298, |
|
"naucs_at_10_max": 0.8866819455054739, |
|
"naucs_at_10_std": -0.08407605466429298, |
|
"naucs_at_10_diff1": 0.9762329174093952, |
|
"naucs_at_20_max": 0.9477124183006524, |
|
"naucs_at_20_std": 0.25144724556488873, |
|
"naucs_at_20_diff1": 1.0, |
|
"naucs_at_50_max": 0.9564270152505304, |
|
"naucs_at_50_std": 0.4352629940865033, |
|
"naucs_at_50_diff1": 1.0, |
|
"naucs_at_100_max": 1.0, |
|
"naucs_at_100_std": 1.0, |
|
"naucs_at_100_diff1": 1.0 |
|
}, |
|
"vidore/docvqa_test_subsampled": { |
|
"ndcg_at_1": 0.54324, |
|
"ndcg_at_3": 0.60994, |
|
"ndcg_at_5": 0.6398, |
|
"ndcg_at_10": 0.66199, |
|
"ndcg_at_20": 0.67267, |
|
"ndcg_at_50": 0.68225, |
|
"ndcg_at_100": 0.68945, |
|
"map_at_1": 0.54324, |
|
"map_at_3": 0.59387, |
|
"map_at_5": 0.61027, |
|
"map_at_10": 0.61899, |
|
"map_at_20": 0.62193, |
|
"map_at_50": 0.62343, |
|
"map_at_100": 0.62407, |
|
"recall_at_1": 0.54324, |
|
"recall_at_3": 0.65632, |
|
"recall_at_5": 0.72949, |
|
"recall_at_10": 0.80044, |
|
"recall_at_20": 0.84257, |
|
"recall_at_50": 0.89135, |
|
"recall_at_100": 0.9357, |
|
"precision_at_1": 0.54324, |
|
"precision_at_3": 0.21877, |
|
"precision_at_5": 0.1459, |
|
"precision_at_10": 0.08004, |
|
"precision_at_20": 0.04213, |
|
"precision_at_50": 0.01783, |
|
"precision_at_100": 0.00936, |
|
"mrr_at_1": 0.5432372505543237, |
|
"mrr_at_3": 0.5946045824094608, |
|
"mrr_at_5": 0.6103473762010347, |
|
"mrr_at_10": 0.6190493788054763, |
|
"mrr_at_20": 0.6220782499013536, |
|
"mrr_at_50": 0.623690385474884, |
|
"mrr_at_100": 0.624317545713404, |
|
"naucs_at_1_max": 0.5195120835206619, |
|
"naucs_at_1_std": -0.31481029514111575, |
|
"naucs_at_1_diff1": 0.8886195631998732, |
|
"naucs_at_3_max": 0.4894265436758743, |
|
"naucs_at_3_std": -0.35348286092835673, |
|
"naucs_at_3_diff1": 0.825360351363726, |
|
"naucs_at_5_max": 0.49365870598559275, |
|
"naucs_at_5_std": -0.3667256163548182, |
|
"naucs_at_5_diff1": 0.8190874936930554, |
|
"naucs_at_10_max": 0.49415281281253026, |
|
"naucs_at_10_std": -0.1787227124233066, |
|
"naucs_at_10_diff1": 0.760124698410118, |
|
"naucs_at_20_max": 0.4624420442016527, |
|
"naucs_at_20_std": -0.14955421166412503, |
|
"naucs_at_20_diff1": 0.7582711922759812, |
|
"naucs_at_50_max": 0.46372165402671495, |
|
"naucs_at_50_std": -0.009043079292315782, |
|
"naucs_at_50_diff1": 0.7459081960812681, |
|
"naucs_at_100_max": 0.41099442703800165, |
|
"naucs_at_100_std": 0.4785954026968201, |
|
"naucs_at_100_diff1": 0.7044383203056372 |
|
}, |
|
"vidore/infovqa_test_subsampled": { |
|
"ndcg_at_1": 0.89676, |
|
"ndcg_at_3": 0.92534, |
|
"ndcg_at_5": 0.93031, |
|
"ndcg_at_10": 0.935, |
|
"ndcg_at_20": 0.93663, |
|
"ndcg_at_50": 0.93904, |
|
"ndcg_at_100": 0.94001, |
|
"map_at_1": 0.89676, |
|
"map_at_3": 0.91903, |
|
"map_at_5": 0.92176, |
|
"map_at_10": 0.92376, |
|
"map_at_20": 0.92426, |
|
"map_at_50": 0.92465, |
|
"map_at_100": 0.92473, |
|
"recall_at_1": 0.89676, |
|
"recall_at_3": 0.94332, |
|
"recall_at_5": 0.95547, |
|
"recall_at_10": 0.96964, |
|
"recall_at_20": 0.97571, |
|
"recall_at_50": 0.98785, |
|
"recall_at_100": 0.99393, |
|
"precision_at_1": 0.89676, |
|
"precision_at_3": 0.31444, |
|
"precision_at_5": 0.19109, |
|
"precision_at_10": 0.09696, |
|
"precision_at_20": 0.04879, |
|
"precision_at_50": 0.01976, |
|
"precision_at_100": 0.00994, |
|
"mrr_at_1": 0.8967611336032388, |
|
"mrr_at_3": 0.9183535762483129, |
|
"mrr_at_5": 0.9206815114709849, |
|
"mrr_at_10": 0.9232191054559475, |
|
"mrr_at_20": 0.9235380847222951, |
|
"mrr_at_50": 0.9239302146072342, |
|
"mrr_at_100": 0.9240125185515768, |
|
"naucs_at_1_max": 0.7062394427119798, |
|
"naucs_at_1_std": -0.2812879238976883, |
|
"naucs_at_1_diff1": 0.9410064894465787, |
|
"naucs_at_3_max": 0.7564908149226892, |
|
"naucs_at_3_std": -0.3059756682732854, |
|
"naucs_at_3_diff1": 0.9422566807977654, |
|
"naucs_at_5_max": 0.84758972902799, |
|
"naucs_at_5_std": -0.0929285302133143, |
|
"naucs_at_5_diff1": 0.9450692388254637, |
|
"naucs_at_10_max": 0.8860131032188592, |
|
"naucs_at_10_std": 0.24420167069765694, |
|
"naucs_at_10_diff1": 0.9368484108193146, |
|
"naucs_at_20_max": 0.8806609405034168, |
|
"naucs_at_20_std": 0.28312028971462133, |
|
"naucs_at_20_diff1": 0.9428274225349419, |
|
"naucs_at_50_max": 0.78308879001761, |
|
"naucs_at_50_std": 0.08727770914673263, |
|
"naucs_at_50_diff1": 0.9537108770403242, |
|
"naucs_at_100_max": 0.6097113980568468, |
|
"naucs_at_100_std": -0.06311386037266957, |
|
"naucs_at_100_diff1": 0.9074217540806789 |
|
}, |
|
"vidore/tabfquad_test_subsampled": { |
|
"ndcg_at_1": 0.90714, |
|
"ndcg_at_3": 0.94809, |
|
"ndcg_at_5": 0.95085, |
|
"ndcg_at_10": 0.95556, |
|
"ndcg_at_20": 0.95556, |
|
"ndcg_at_50": 0.95633, |
|
"ndcg_at_100": 0.95633, |
|
"map_at_1": 0.90714, |
|
"map_at_3": 0.93869, |
|
"map_at_5": 0.94012, |
|
"map_at_10": 0.94212, |
|
"map_at_20": 0.94212, |
|
"map_at_50": 0.94227, |
|
"map_at_100": 0.94227, |
|
"recall_at_1": 0.90714, |
|
"recall_at_3": 0.975, |
|
"recall_at_5": 0.98214, |
|
"recall_at_10": 0.99643, |
|
"recall_at_20": 0.99643, |
|
"recall_at_50": 1.0, |
|
"recall_at_100": 1.0, |
|
"precision_at_1": 0.90714, |
|
"precision_at_3": 0.325, |
|
"precision_at_5": 0.19643, |
|
"precision_at_10": 0.09964, |
|
"precision_at_20": 0.04982, |
|
"precision_at_50": 0.02, |
|
"precision_at_100": 0.01, |
|
"mrr_at_1": 0.9071428571428571, |
|
"mrr_at_3": 0.9386904761904761, |
|
"mrr_at_5": 0.9401190476190476, |
|
"mrr_at_10": 0.9421173469387754, |
|
"mrr_at_20": 0.9421173469387754, |
|
"mrr_at_50": 0.9422602040816326, |
|
"mrr_at_100": 0.9422602040816326, |
|
"naucs_at_1_max": 0.47509516627163817, |
|
"naucs_at_1_std": 0.09654887596064192, |
|
"naucs_at_1_diff1": 0.9256625727213957, |
|
"naucs_at_3_max": 0.7953181272509063, |
|
"naucs_at_3_std": 0.6569294384420459, |
|
"naucs_at_3_diff1": 0.9626517273576122, |
|
"naucs_at_5_max": 0.9477124183006519, |
|
"naucs_at_5_std": 0.8585434173669502, |
|
"naucs_at_5_diff1": 0.9477124183006519, |
|
"naucs_at_10_max": 1.0, |
|
"naucs_at_10_std": 1.0, |
|
"naucs_at_10_diff1": 0.8692810457516478, |
|
"naucs_at_20_max": 1.0, |
|
"naucs_at_20_std": 1.0, |
|
"naucs_at_20_diff1": 0.8692810457516478, |
|
"naucs_at_50_max": 1.0, |
|
"naucs_at_50_std": 1.0, |
|
"naucs_at_50_diff1": 1.0, |
|
"naucs_at_100_max": 1.0, |
|
"naucs_at_100_std": 1.0, |
|
"naucs_at_100_diff1": 1.0 |
|
}, |
|
"vidore/tatdqa_test": { |
|
"ndcg_at_1": 0.68165, |
|
"ndcg_at_3": 0.78589, |
|
"ndcg_at_5": 0.80738, |
|
"ndcg_at_10": 0.81887, |
|
"ndcg_at_20": 0.82338, |
|
"ndcg_at_50": 0.82868, |
|
"ndcg_at_100": 0.82966, |
|
"map_at_1": 0.68165, |
|
"map_at_3": 0.76094, |
|
"map_at_5": 0.77284, |
|
"map_at_10": 0.77775, |
|
"map_at_20": 0.77902, |
|
"map_at_50": 0.77992, |
|
"map_at_100": 0.78, |
|
"recall_at_1": 0.68165, |
|
"recall_at_3": 0.85784, |
|
"recall_at_5": 0.91009, |
|
"recall_at_10": 0.94471, |
|
"recall_at_20": 0.96233, |
|
"recall_at_50": 0.98846, |
|
"recall_at_100": 0.99453, |
|
"precision_at_1": 0.68165, |
|
"precision_at_3": 0.28595, |
|
"precision_at_5": 0.18202, |
|
"precision_at_10": 0.09447, |
|
"precision_at_20": 0.04812, |
|
"precision_at_50": 0.01977, |
|
"precision_at_100": 0.00995, |
|
"mrr_at_1": 0.6822600243013366, |
|
"mrr_at_3": 0.7609356014580796, |
|
"mrr_at_5": 0.7725394896719318, |
|
"mrr_at_10": 0.7775212636695014, |
|
"mrr_at_20": 0.7787535437042965, |
|
"mrr_at_50": 0.7796543784238207, |
|
"mrr_at_100": 0.7797401545799822, |
|
"naucs_at_1_max": 0.16062026715795888, |
|
"naucs_at_1_std": -0.3264360293606425, |
|
"naucs_at_1_diff1": 0.8234210928574244, |
|
"naucs_at_3_max": 0.2735402374223285, |
|
"naucs_at_3_std": -0.2518265754222236, |
|
"naucs_at_3_diff1": 0.7126512468213168, |
|
"naucs_at_5_max": 0.3207976518601587, |
|
"naucs_at_5_std": -0.09980902320534159, |
|
"naucs_at_5_diff1": 0.654620096904173, |
|
"naucs_at_10_max": 0.4248907897527349, |
|
"naucs_at_10_std": 0.05751189029665147, |
|
"naucs_at_10_diff1": 0.6072701680557849, |
|
"naucs_at_20_max": 0.5189102534669143, |
|
"naucs_at_20_std": 0.17852289719761627, |
|
"naucs_at_20_diff1": 0.5826792796971454, |
|
"naucs_at_50_max": 0.6766878761446519, |
|
"naucs_at_50_std": 0.4444418209829138, |
|
"naucs_at_50_diff1": 0.5707904926948768, |
|
"naucs_at_100_max": 0.5171029913955458, |
|
"naucs_at_100_std": 0.4414823767216705, |
|
"naucs_at_100_diff1": 0.48651595702377487 |
|
}, |
|
"vidore/shiftproject_test": { |
|
"ndcg_at_1": 0.79, |
|
"ndcg_at_3": 0.88309, |
|
"ndcg_at_5": 0.88309, |
|
"ndcg_at_10": 0.88666, |
|
"ndcg_at_20": 0.89172, |
|
"ndcg_at_50": 0.89372, |
|
"ndcg_at_100": 0.89546, |
|
"map_at_1": 0.79, |
|
"map_at_3": 0.86, |
|
"map_at_5": 0.86, |
|
"map_at_10": 0.86167, |
|
"map_at_20": 0.86308, |
|
"map_at_50": 0.8634, |
|
"map_at_100": 0.86359, |
|
"recall_at_1": 0.79, |
|
"recall_at_3": 0.95, |
|
"recall_at_5": 0.95, |
|
"recall_at_10": 0.96, |
|
"recall_at_20": 0.98, |
|
"recall_at_50": 0.99, |
|
"recall_at_100": 1.0, |
|
"precision_at_1": 0.79, |
|
"precision_at_3": 0.31667, |
|
"precision_at_5": 0.19, |
|
"precision_at_10": 0.096, |
|
"precision_at_20": 0.049, |
|
"precision_at_50": 0.0198, |
|
"precision_at_100": 0.01, |
|
"mrr_at_1": 0.79, |
|
"mrr_at_3": 0.8633333333333333, |
|
"mrr_at_5": 0.8633333333333333, |
|
"mrr_at_10": 0.865, |
|
"mrr_at_20": 0.8664354066985647, |
|
"mrr_at_50": 0.8667579873437259, |
|
"mrr_at_100": 0.8669466665890089, |
|
"naucs_at_1_max": 0.039218986702575266, |
|
"naucs_at_1_std": -0.30031019308918766, |
|
"naucs_at_1_diff1": 0.8456248346839152, |
|
"naucs_at_3_max": 0.5220354808590087, |
|
"naucs_at_3_std": -0.057609710550887504, |
|
"naucs_at_3_diff1": 0.8160597572362241, |
|
"naucs_at_5_max": 0.5220354808590145, |
|
"naucs_at_5_std": -0.05760971055088009, |
|
"naucs_at_5_diff1": 0.8160597572362281, |
|
"naucs_at_10_max": 0.4352240896358576, |
|
"naucs_at_10_std": -0.10270774976656832, |
|
"naucs_at_10_diff1": 0.9305555555555542, |
|
"naucs_at_20_max": 0.1914098972922579, |
|
"naucs_at_20_std": -0.3968253968253954, |
|
"naucs_at_20_diff1": 0.861111111111116, |
|
"naucs_at_50_max": 0.554154995331464, |
|
"naucs_at_50_std": 0.35807656395892007, |
|
"naucs_at_50_diff1": 1.0, |
|
"naucs_at_100_max": null, |
|
"naucs_at_100_std": null, |
|
"naucs_at_100_diff1": null |
|
}, |
|
"vidore/syntheticDocQA_artificial_intelligence_test": { |
|
"ndcg_at_1": 1.0, |
|
"ndcg_at_3": 1.0, |
|
"ndcg_at_5": 1.0, |
|
"ndcg_at_10": 1.0, |
|
"ndcg_at_20": 1.0, |
|
"ndcg_at_50": 1.0, |
|
"ndcg_at_100": 1.0, |
|
"map_at_1": 1.0, |
|
"map_at_3": 1.0, |
|
"map_at_5": 1.0, |
|
"map_at_10": 1.0, |
|
"map_at_20": 1.0, |
|
"map_at_50": 1.0, |
|
"map_at_100": 1.0, |
|
"recall_at_1": 1.0, |
|
"recall_at_3": 1.0, |
|
"recall_at_5": 1.0, |
|
"recall_at_10": 1.0, |
|
"recall_at_20": 1.0, |
|
"recall_at_50": 1.0, |
|
"recall_at_100": 1.0, |
|
"precision_at_1": 1.0, |
|
"precision_at_3": 0.33333, |
|
"precision_at_5": 0.2, |
|
"precision_at_10": 0.1, |
|
"precision_at_20": 0.05, |
|
"precision_at_50": 0.02, |
|
"precision_at_100": 0.01, |
|
"mrr_at_1": 1.0, |
|
"mrr_at_3": 1.0, |
|
"mrr_at_5": 1.0, |
|
"mrr_at_10": 1.0, |
|
"mrr_at_20": 1.0, |
|
"mrr_at_50": 1.0, |
|
"mrr_at_100": 1.0, |
|
"naucs_at_1_max": null, |
|
"naucs_at_1_std": null, |
|
"naucs_at_1_diff1": null, |
|
"naucs_at_3_max": 1.0, |
|
"naucs_at_3_std": 1.0, |
|
"naucs_at_3_diff1": 1.0, |
|
"naucs_at_5_max": 1.0, |
|
"naucs_at_5_std": 1.0, |
|
"naucs_at_5_diff1": 1.0, |
|
"naucs_at_10_max": 1.0, |
|
"naucs_at_10_std": 1.0, |
|
"naucs_at_10_diff1": 1.0, |
|
"naucs_at_20_max": 1.0, |
|
"naucs_at_20_std": 1.0, |
|
"naucs_at_20_diff1": 1.0, |
|
"naucs_at_50_max": null, |
|
"naucs_at_50_std": null, |
|
"naucs_at_50_diff1": null, |
|
"naucs_at_100_max": null, |
|
"naucs_at_100_std": null, |
|
"naucs_at_100_diff1": null |
|
}, |
|
"vidore/syntheticDocQA_energy_test": { |
|
"ndcg_at_1": 0.94, |
|
"ndcg_at_3": 0.95893, |
|
"ndcg_at_5": 0.95893, |
|
"ndcg_at_10": 0.96208, |
|
"ndcg_at_20": 0.96718, |
|
"ndcg_at_50": 0.96718, |
|
"ndcg_at_100": 0.96718, |
|
"map_at_1": 0.94, |
|
"map_at_3": 0.955, |
|
"map_at_5": 0.955, |
|
"map_at_10": 0.95625, |
|
"map_at_20": 0.95767, |
|
"map_at_50": 0.95767, |
|
"map_at_100": 0.95767, |
|
"recall_at_1": 0.94, |
|
"recall_at_3": 0.97, |
|
"recall_at_5": 0.97, |
|
"recall_at_10": 0.98, |
|
"recall_at_20": 1.0, |
|
"recall_at_50": 1.0, |
|
"recall_at_100": 1.0, |
|
"precision_at_1": 0.94, |
|
"precision_at_3": 0.32333, |
|
"precision_at_5": 0.194, |
|
"precision_at_10": 0.098, |
|
"precision_at_20": 0.05, |
|
"precision_at_50": 0.02, |
|
"precision_at_100": 0.01, |
|
"mrr_at_1": 0.94, |
|
"mrr_at_3": 0.955, |
|
"mrr_at_5": 0.955, |
|
"mrr_at_10": 0.9566666666666667, |
|
"mrr_at_20": 0.9582142857142857, |
|
"mrr_at_50": 0.9582142857142857, |
|
"mrr_at_100": 0.9582142857142857, |
|
"naucs_at_1_max": 0.49004046062869583, |
|
"naucs_at_1_std": -0.6582633053221264, |
|
"naucs_at_1_diff1": 1.0, |
|
"naucs_at_3_max": 0.7424525365701778, |
|
"naucs_at_3_std": -1.040616246498596, |
|
"naucs_at_3_diff1": 1.0, |
|
"naucs_at_5_max": 0.742452536570183, |
|
"naucs_at_5_std": -1.040616246498598, |
|
"naucs_at_5_diff1": 1.0, |
|
"naucs_at_10_max": 0.9346405228758136, |
|
"naucs_at_10_std": -0.690943043884218, |
|
"naucs_at_10_diff1": 1.0, |
|
"naucs_at_20_max": 1.0, |
|
"naucs_at_20_std": 1.0, |
|
"naucs_at_20_diff1": 1.0, |
|
"naucs_at_50_max": null, |
|
"naucs_at_50_std": null, |
|
"naucs_at_50_diff1": null, |
|
"naucs_at_100_max": null, |
|
"naucs_at_100_std": null, |
|
"naucs_at_100_diff1": null |
|
}, |
|
"vidore/syntheticDocQA_government_reports_test": { |
|
"ndcg_at_1": 0.92, |
|
"ndcg_at_3": 0.95655, |
|
"ndcg_at_5": 0.96085, |
|
"ndcg_at_10": 0.96419, |
|
"ndcg_at_20": 0.96419, |
|
"ndcg_at_50": 0.96419, |
|
"ndcg_at_100": 0.96419, |
|
"map_at_1": 0.92, |
|
"map_at_3": 0.94833, |
|
"map_at_5": 0.95083, |
|
"map_at_10": 0.95226, |
|
"map_at_20": 0.95226, |
|
"map_at_50": 0.95226, |
|
"map_at_100": 0.95226, |
|
"recall_at_1": 0.92, |
|
"recall_at_3": 0.98, |
|
"recall_at_5": 0.99, |
|
"recall_at_10": 1.0, |
|
"recall_at_20": 1.0, |
|
"recall_at_50": 1.0, |
|
"recall_at_100": 1.0, |
|
"precision_at_1": 0.92, |
|
"precision_at_3": 0.32667, |
|
"precision_at_5": 0.198, |
|
"precision_at_10": 0.1, |
|
"precision_at_20": 0.05, |
|
"precision_at_50": 0.02, |
|
"precision_at_100": 0.01, |
|
"mrr_at_1": 0.93, |
|
"mrr_at_3": 0.9533333333333333, |
|
"mrr_at_5": 0.9558333333333333, |
|
"mrr_at_10": 0.9574999999999999, |
|
"mrr_at_20": 0.9574999999999999, |
|
"mrr_at_50": 0.9574999999999999, |
|
"mrr_at_100": 0.9574999999999999, |
|
"naucs_at_1_max": 0.6289682539682547, |
|
"naucs_at_1_std": 0.44461951447245585, |
|
"naucs_at_1_diff1": 0.9509803921568633, |
|
"naucs_at_3_max": 1.0, |
|
"naucs_at_3_std": 0.3384687208216551, |
|
"naucs_at_3_diff1": 0.9346405228758099, |
|
"naucs_at_5_max": 1.0, |
|
"naucs_at_5_std": 0.5541549953314738, |
|
"naucs_at_5_diff1": 0.8692810457516413, |
|
"naucs_at_10_max": 1.0, |
|
"naucs_at_10_std": 1.0, |
|
"naucs_at_10_diff1": 1.0, |
|
"naucs_at_20_max": 1.0, |
|
"naucs_at_20_std": 1.0, |
|
"naucs_at_20_diff1": 1.0, |
|
"naucs_at_50_max": null, |
|
"naucs_at_50_std": null, |
|
"naucs_at_50_diff1": null, |
|
"naucs_at_100_max": null, |
|
"naucs_at_100_std": null, |
|
"naucs_at_100_diff1": null |
|
}, |
|
"vidore/syntheticDocQA_healthcare_industry_test": { |
|
"ndcg_at_1": 0.94, |
|
"ndcg_at_3": 0.97655, |
|
"ndcg_at_5": 0.97655, |
|
"ndcg_at_10": 0.97655, |
|
"ndcg_at_20": 0.97655, |
|
"ndcg_at_50": 0.97655, |
|
"ndcg_at_100": 0.97655, |
|
"map_at_1": 0.94, |
|
"map_at_3": 0.96833, |
|
"map_at_5": 0.96833, |
|
"map_at_10": 0.96833, |
|
"map_at_20": 0.96833, |
|
"map_at_50": 0.96833, |
|
"map_at_100": 0.96833, |
|
"recall_at_1": 0.94, |
|
"recall_at_3": 1.0, |
|
"recall_at_5": 1.0, |
|
"recall_at_10": 1.0, |
|
"recall_at_20": 1.0, |
|
"recall_at_50": 1.0, |
|
"recall_at_100": 1.0, |
|
"precision_at_1": 0.94, |
|
"precision_at_3": 0.33333, |
|
"precision_at_5": 0.2, |
|
"precision_at_10": 0.1, |
|
"precision_at_20": 0.05, |
|
"precision_at_50": 0.02, |
|
"precision_at_100": 0.01, |
|
"mrr_at_1": 0.95, |
|
"mrr_at_3": 0.9733333333333333, |
|
"mrr_at_5": 0.9733333333333333, |
|
"mrr_at_10": 0.9733333333333333, |
|
"mrr_at_20": 0.9733333333333333, |
|
"mrr_at_50": 0.9733333333333333, |
|
"mrr_at_100": 0.9733333333333333, |
|
"naucs_at_1_max": 0.5662931839402436, |
|
"naucs_at_1_std": 0.18837535014005719, |
|
"naucs_at_1_diff1": 0.9782135076252712, |
|
"naucs_at_3_max": 1.0, |
|
"naucs_at_3_std": 1.0, |
|
"naucs_at_3_diff1": 1.0, |
|
"naucs_at_5_max": 1.0, |
|
"naucs_at_5_std": 1.0, |
|
"naucs_at_5_diff1": 1.0, |
|
"naucs_at_10_max": 1.0, |
|
"naucs_at_10_std": 1.0, |
|
"naucs_at_10_diff1": 1.0, |
|
"naucs_at_20_max": 1.0, |
|
"naucs_at_20_std": 1.0, |
|
"naucs_at_20_diff1": 1.0, |
|
"naucs_at_50_max": null, |
|
"naucs_at_50_std": null, |
|
"naucs_at_50_diff1": null, |
|
"naucs_at_100_max": null, |
|
"naucs_at_100_std": null, |
|
"naucs_at_100_diff1": null |
|
} |
|
} |
|
} |