vidore
baseline-results / voyageai_voyage-multimodal-3_metrics.json
QuentinJG's picture
Rename voyageai_metrics.json to voyageai_voyage-multimodal-3_metrics.json
ca40309 verified
{
"metadata": {
"timestamp": "2025-03-12T10:52:59.228266",
"vidore_benchmark_version": "4.0.3.dev37+g1548c2d.d20250311"
},
"metrics": {
"vidore/restaurant_esg_reports_beir": {
"ndcg_at_1": 0.46154,
"ndcg_at_3": 0.51553,
"ndcg_at_5": 0.56137,
"ndcg_at_10": 0.59354,
"ndcg_at_20": 0.63362,
"ndcg_at_50": 0.65072,
"ndcg_at_100": 0.66201,
"map_at_1": 0.36346,
"map_at_3": 0.44902,
"map_at_5": 0.49142,
"map_at_10": 0.5106,
"map_at_20": 0.52664,
"map_at_50": 0.53321,
"map_at_100": 0.53551,
"recall_at_1": 0.36346,
"recall_at_3": 0.50948,
"recall_at_5": 0.6369,
"recall_at_10": 0.71978,
"recall_at_20": 0.83934,
"recall_at_50": 0.90182,
"recall_at_100": 0.94766,
"precision_at_1": 0.46154,
"precision_at_3": 0.27564,
"precision_at_5": 0.22308,
"precision_at_10": 0.13462,
"precision_at_20": 0.08462,
"precision_at_50": 0.03962,
"precision_at_100": 0.02173,
"mrr_at_1": 0.46153846153846156,
"mrr_at_3": 0.564102564102564,
"mrr_at_5": 0.5910256410256409,
"mrr_at_10": 0.6018620268620267,
"mrr_at_20": 0.609330199714815,
"mrr_at_50": 0.6099933296882898,
"mrr_at_100": 0.6099933296882898,
"naucs_at_1_max": 0.20368019444404006,
"naucs_at_1_std": -0.05896301709840663,
"naucs_at_1_diff1": 0.5027857837399152,
"naucs_at_3_max": 0.2207596691773764,
"naucs_at_3_std": 0.006572688085190094,
"naucs_at_3_diff1": 0.07535489280712841,
"naucs_at_5_max": 0.3055052564988994,
"naucs_at_5_std": 0.2695070152185379,
"naucs_at_5_diff1": 0.028735419474887416,
"naucs_at_10_max": 0.13022275163938632,
"naucs_at_10_std": 0.16804625913226817,
"naucs_at_10_diff1": -0.1044735223259232,
"naucs_at_20_max": 0.030677866275297932,
"naucs_at_20_std": 0.2067178669184376,
"naucs_at_20_diff1": -0.15547715926288114,
"naucs_at_50_max": 0.06721043932684811,
"naucs_at_50_std": 0.2814855535601418,
"naucs_at_50_diff1": -0.15644474250949775,
"naucs_at_100_max": 0.04140512572483361,
"naucs_at_100_std": 0.2754882090192102,
"naucs_at_100_diff1": -0.20499364042570448
},
"vidore/synthetic_mit_biomedical_tissue_interactions_unfiltered": {
"ndcg_at_1": 0.50625,
"ndcg_at_3": 0.53801,
"ndcg_at_5": 0.56367,
"ndcg_at_10": 0.59144,
"ndcg_at_20": 0.62281,
"ndcg_at_50": 0.64988,
"ndcg_at_100": 0.6614,
"map_at_1": 0.2947,
"map_at_3": 0.42389,
"map_at_5": 0.46584,
"map_at_10": 0.49641,
"map_at_20": 0.51381,
"map_at_50": 0.52294,
"map_at_100": 0.52512,
"recall_at_1": 0.2947,
"recall_at_3": 0.51066,
"recall_at_5": 0.6115,
"recall_at_10": 0.69677,
"recall_at_20": 0.78713,
"recall_at_50": 0.87152,
"recall_at_100": 0.92041,
"precision_at_1": 0.50625,
"precision_at_3": 0.34583,
"precision_at_5": 0.26625,
"precision_at_10": 0.16813,
"precision_at_20": 0.10125,
"precision_at_50": 0.04987,
"precision_at_100": 0.02706,
"mrr_at_1": 0.50625,
"mrr_at_3": 0.6187499999999999,
"mrr_at_5": 0.6390625,
"mrr_at_10": 0.6450694444444445,
"mrr_at_20": 0.6481967685092686,
"mrr_at_50": 0.6493743580027906,
"mrr_at_100": 0.6497234378933107,
"naucs_at_1_max": 0.2982323803776623,
"naucs_at_1_std": -0.053774525827026284,
"naucs_at_1_diff1": 0.5200020115159291,
"naucs_at_3_max": 0.18024374308063665,
"naucs_at_3_std": 0.07332710212526489,
"naucs_at_3_diff1": 0.019165502096226788,
"naucs_at_5_max": 0.14274071990595502,
"naucs_at_5_std": 0.09730846621519294,
"naucs_at_5_diff1": -0.00690192345139435,
"naucs_at_10_max": 0.1869838718265326,
"naucs_at_10_std": 0.17477047588380465,
"naucs_at_10_diff1": -0.07438077296572282,
"naucs_at_20_max": 0.24640900247147313,
"naucs_at_20_std": 0.2484156281222067,
"naucs_at_20_diff1": -0.1333943313877057,
"naucs_at_50_max": 0.22134620285423043,
"naucs_at_50_std": 0.3203443552497451,
"naucs_at_50_diff1": -0.13630064984709492,
"naucs_at_100_max": 0.18852863001883446,
"naucs_at_100_std": 0.32571156994244094,
"naucs_at_100_diff1": -0.11435432105284754
},
"vidore/synthetic_economics_macro_economy_2024_filtered_v1.0": {
"ndcg_at_1": 0.67241,
"ndcg_at_3": 0.63319,
"ndcg_at_5": 0.58758,
"ndcg_at_10": 0.57198,
"ndcg_at_20": 0.58918,
"ndcg_at_50": 0.65786,
"ndcg_at_100": 0.69503,
"map_at_1": 0.13615,
"map_at_3": 0.21649,
"map_at_5": 0.25675,
"map_at_10": 0.3252,
"map_at_20": 0.38016,
"map_at_50": 0.43771,
"map_at_100": 0.46413,
"recall_at_1": 0.13615,
"recall_at_3": 0.23646,
"recall_at_5": 0.29799,
"recall_at_10": 0.43273,
"recall_at_20": 0.56259,
"recall_at_50": 0.76924,
"recall_at_100": 0.88035,
"precision_at_1": 0.67241,
"precision_at_3": 0.57471,
"precision_at_5": 0.48966,
"precision_at_10": 0.39828,
"precision_at_20": 0.29914,
"precision_at_50": 0.19172,
"precision_at_100": 0.12379,
"mrr_at_1": 0.6724137931034483,
"mrr_at_3": 0.7557471264367817,
"mrr_at_5": 0.764367816091954,
"mrr_at_10": 0.7718596059113301,
"mrr_at_20": 0.7718596059113301,
"mrr_at_50": 0.7732378352919377,
"mrr_at_100": 0.7732378352919377,
"naucs_at_1_max": 0.032282867498218674,
"naucs_at_1_std": -0.28271414000179634,
"naucs_at_1_diff1": 0.14417521370616468,
"naucs_at_3_max": 0.19868656246441452,
"naucs_at_3_std": 0.12756096614672727,
"naucs_at_3_diff1": -0.14423513218105685,
"naucs_at_5_max": 0.16258116633927042,
"naucs_at_5_std": 0.08888872261627004,
"naucs_at_5_diff1": -0.09215214837175129,
"naucs_at_10_max": 0.08087197701067339,
"naucs_at_10_std": 0.0593535492140523,
"naucs_at_10_diff1": 0.011413698146931404,
"naucs_at_20_max": 0.09066512825980459,
"naucs_at_20_std": 0.1515192296500721,
"naucs_at_20_diff1": 0.05635159011980896,
"naucs_at_50_max": 0.07419981716098847,
"naucs_at_50_std": 0.18498184475514726,
"naucs_at_50_diff1": 0.041495490587423654,
"naucs_at_100_max": 0.03526540983660958,
"naucs_at_100_std": 0.11166203694040092,
"naucs_at_100_diff1": 0.12019253855015599
},
"vidore/synthetic_rse_restaurant_filtered_v1.0": {
"ndcg_at_1": 0.42105,
"ndcg_at_3": 0.446,
"ndcg_at_5": 0.4719,
"ndcg_at_10": 0.51181,
"ndcg_at_20": 0.5424,
"ndcg_at_50": 0.56432,
"ndcg_at_100": 0.5872,
"map_at_1": 0.18615,
"map_at_3": 0.3094,
"map_at_5": 0.34722,
"map_at_10": 0.38335,
"map_at_20": 0.40112,
"map_at_50": 0.40968,
"map_at_100": 0.41626,
"recall_at_1": 0.18615,
"recall_at_3": 0.42928,
"recall_at_5": 0.52991,
"recall_at_10": 0.66591,
"recall_at_20": 0.76433,
"recall_at_50": 0.83751,
"recall_at_100": 0.91575,
"precision_at_1": 0.42105,
"precision_at_3": 0.30409,
"precision_at_5": 0.24561,
"precision_at_10": 0.16667,
"precision_at_20": 0.10789,
"precision_at_50": 0.05333,
"precision_at_100": 0.03263,
"mrr_at_1": 0.42105263157894735,
"mrr_at_3": 0.5350877192982455,
"mrr_at_5": 0.5552631578947367,
"mrr_at_10": 0.5674463937621831,
"mrr_at_20": 0.5723974683727004,
"mrr_at_50": 0.5730024290502564,
"mrr_at_100": 0.5730024290502564,
"naucs_at_1_max": -0.1063878813786229,
"naucs_at_1_std": 0.07009527096294454,
"naucs_at_1_diff1": 0.10532570058239055,
"naucs_at_3_max": -0.0707818319042163,
"naucs_at_3_std": 0.10106279988011081,
"naucs_at_3_diff1": 0.084845655655151,
"naucs_at_5_max": -0.11487901190848457,
"naucs_at_5_std": 0.09251915109792752,
"naucs_at_5_diff1": 0.012535607370615548,
"naucs_at_10_max": -0.09127037923640684,
"naucs_at_10_std": 0.13093656784846772,
"naucs_at_10_diff1": 0.03006202135754748,
"naucs_at_20_max": -0.05693043074070981,
"naucs_at_20_std": 0.1422048179530491,
"naucs_at_20_diff1": 0.021927827197454224,
"naucs_at_50_max": -0.12190658822908639,
"naucs_at_50_std": 0.16430064525199148,
"naucs_at_50_diff1": -0.10417541492717723,
"naucs_at_100_max": -0.17484165527500634,
"naucs_at_100_std": 0.13672197776470205,
"naucs_at_100_diff1": -0.15839101235075956
},
"vidore/synthetic_axa_filtered_v1.0": {
"ndcg_at_1": 0.72222,
"ndcg_at_3": 0.66954,
"ndcg_at_5": 0.64088,
"ndcg_at_10": 0.6477,
"ndcg_at_20": 0.68679,
"ndcg_at_50": 0.73939,
"ndcg_at_100": 0.75782,
"map_at_1": 0.36677,
"map_at_3": 0.4592,
"map_at_5": 0.48529,
"map_at_10": 0.53077,
"map_at_20": 0.56672,
"map_at_50": 0.58988,
"map_at_100": 0.5958,
"recall_at_1": 0.36677,
"recall_at_3": 0.50423,
"recall_at_5": 0.5832,
"recall_at_10": 0.66079,
"recall_at_20": 0.77947,
"recall_at_50": 0.9373,
"recall_at_100": 0.99068,
"precision_at_1": 0.72222,
"precision_at_3": 0.44444,
"precision_at_5": 0.32222,
"precision_at_10": 0.23333,
"precision_at_20": 0.15833,
"precision_at_50": 0.08333,
"precision_at_100": 0.04667,
"mrr_at_1": 0.7222222222222222,
"mrr_at_3": 0.7592592592592593,
"mrr_at_5": 0.7842592592592593,
"mrr_at_10": 0.7842592592592593,
"mrr_at_20": 0.7842592592592593,
"mrr_at_50": 0.7856481481481482,
"mrr_at_100": 0.7856481481481482,
"naucs_at_1_max": -0.5764508261912696,
"naucs_at_1_std": 0.2572205519822324,
"naucs_at_1_diff1": 0.5945012986070088,
"naucs_at_3_max": -0.3245546955664279,
"naucs_at_3_std": 0.2106608705520064,
"naucs_at_3_diff1": -0.18354778613695244,
"naucs_at_5_max": -0.32979775271957523,
"naucs_at_5_std": 0.004295616052457978,
"naucs_at_5_diff1": -0.21668629588661706,
"naucs_at_10_max": -0.37966732415422166,
"naucs_at_10_std": -0.01491020124585064,
"naucs_at_10_diff1": -0.17349036538288762,
"naucs_at_20_max": -0.29338316737381204,
"naucs_at_20_std": -0.03576033793090156,
"naucs_at_20_diff1": -0.19533219218843523,
"naucs_at_50_max": -0.29990699257368786,
"naucs_at_50_std": -0.11316959031750934,
"naucs_at_50_diff1": -0.27924927011864364,
"naucs_at_100_max": -0.22547374701018,
"naucs_at_100_std": -0.1279133290410171,
"naucs_at_100_diff1": -0.32901479145609697
},
"vidore/synthetic_rse_restaurant_filtered_v1.0_multilingual": {
"ndcg_at_1": 0.41667,
"ndcg_at_3": 0.44206,
"ndcg_at_5": 0.46171,
"ndcg_at_10": 0.50911,
"ndcg_at_20": 0.54735,
"ndcg_at_50": 0.5785,
"ndcg_at_100": 0.59513,
"map_at_1": 0.18884,
"map_at_3": 0.30884,
"map_at_5": 0.34205,
"map_at_10": 0.38214,
"map_at_20": 0.40339,
"map_at_50": 0.41645,
"map_at_100": 0.42174,
"recall_at_1": 0.18884,
"recall_at_3": 0.41439,
"recall_at_5": 0.50081,
"recall_at_10": 0.65362,
"recall_at_20": 0.77708,
"recall_at_50": 0.87498,
"recall_at_100": 0.92944,
"precision_at_1": 0.41667,
"precision_at_3": 0.30409,
"precision_at_5": 0.2386,
"precision_at_10": 0.16667,
"precision_at_20": 0.10965,
"precision_at_50": 0.05763,
"precision_at_100": 0.03364,
"mrr_at_1": 0.4166666666666667,
"mrr_at_3": 0.5387426900584793,
"mrr_at_5": 0.5527777777777776,
"mrr_at_10": 0.5685202589807851,
"mrr_at_20": 0.5744233342337056,
"mrr_at_50": 0.574930578048572,
"mrr_at_100": 0.574930578048572,
"naucs_at_1_max": 0.01715145223542086,
"naucs_at_1_std": 0.0899310510434977,
"naucs_at_1_diff1": 0.1739307636238112,
"naucs_at_3_max": -0.031778970284482205,
"naucs_at_3_std": 0.15113736191861826,
"naucs_at_3_diff1": -0.023575716122440124,
"naucs_at_5_max": -0.11291764491834187,
"naucs_at_5_std": 0.10256509751947128,
"naucs_at_5_diff1": -0.07511697723029634,
"naucs_at_10_max": -0.06154590672598315,
"naucs_at_10_std": 0.08064531970193034,
"naucs_at_10_diff1": -0.018188695451970553,
"naucs_at_20_max": -0.014776270960712531,
"naucs_at_20_std": 0.17295501151323417,
"naucs_at_20_diff1": -0.06161735463033105,
"naucs_at_50_max": -0.05048590733744633,
"naucs_at_50_std": 0.1490648093736084,
"naucs_at_50_diff1": -0.13782527489285434,
"naucs_at_100_max": -0.06129053077443416,
"naucs_at_100_std": 0.1378046540638781,
"naucs_at_100_diff1": -0.16944450675960782
},
"vidore/synthetic_axa_filtered_v1.0_multilingual": {
"ndcg_at_1": 0.65278,
"ndcg_at_3": 0.61596,
"ndcg_at_5": 0.59512,
"ndcg_at_10": 0.60056,
"ndcg_at_20": 0.63495,
"ndcg_at_50": 0.69554,
"ndcg_at_100": 0.71726,
"map_at_1": 0.33339,
"map_at_3": 0.4226,
"map_at_5": 0.45105,
"map_at_10": 0.49113,
"map_at_20": 0.52543,
"map_at_50": 0.5505,
"map_at_100": 0.55603,
"recall_at_1": 0.33339,
"recall_at_3": 0.46525,
"recall_at_5": 0.5196,
"recall_at_10": 0.60514,
"recall_at_20": 0.70862,
"recall_at_50": 0.89775,
"recall_at_100": 0.97606,
"precision_at_1": 0.65278,
"precision_at_3": 0.40741,
"precision_at_5": 0.31667,
"precision_at_10": 0.22361,
"precision_at_20": 0.14861,
"precision_at_50": 0.08111,
"precision_at_100": 0.04528,
"mrr_at_1": 0.6527777777777778,
"mrr_at_3": 0.7037037037037037,
"mrr_at_5": 0.7203703703703704,
"mrr_at_10": 0.7238977072310406,
"mrr_at_20": 0.7247657627865962,
"mrr_at_50": 0.7270465535079976,
"mrr_at_100": 0.7274945821818327,
"naucs_at_1_max": 0.22507029768221098,
"naucs_at_1_std": 0.13788316928206162,
"naucs_at_1_diff1": 0.5995848183367006,
"naucs_at_3_max": 0.10374741818519737,
"naucs_at_3_std": 0.1212402799460214,
"naucs_at_3_diff1": 0.032982270408976666,
"naucs_at_5_max": 0.036545011697732825,
"naucs_at_5_std": 0.04976840467312129,
"naucs_at_5_diff1": -0.06474423852856963,
"naucs_at_10_max": -0.012180820225981331,
"naucs_at_10_std": 0.007819844618087223,
"naucs_at_10_diff1": -0.11570751534998236,
"naucs_at_20_max": -0.05746500182397195,
"naucs_at_20_std": -0.02111513643125022,
"naucs_at_20_diff1": -0.12602864520641527,
"naucs_at_50_max": -0.1124769198431645,
"naucs_at_50_std": -0.07628706085741649,
"naucs_at_50_diff1": -0.19607255004920401,
"naucs_at_100_max": -0.11390067714346258,
"naucs_at_100_std": -0.09427043796285493,
"naucs_at_100_diff1": -0.25292751670835045
},
"vidore/synthetic_mit_biomedical_tissue_interactions_unfiltered_multilingual": {
"ndcg_at_1": 0.46875,
"ndcg_at_3": 0.48885,
"ndcg_at_5": 0.51496,
"ndcg_at_10": 0.54548,
"ndcg_at_20": 0.57449,
"ndcg_at_50": 0.60556,
"ndcg_at_100": 0.62078,
"map_at_1": 0.27801,
"map_at_3": 0.38689,
"map_at_5": 0.42623,
"map_at_10": 0.45364,
"map_at_20": 0.46929,
"map_at_50": 0.47926,
"map_at_100": 0.48215,
"recall_at_1": 0.27801,
"recall_at_3": 0.46662,
"recall_at_5": 0.55996,
"recall_at_10": 0.65464,
"recall_at_20": 0.73468,
"recall_at_50": 0.83743,
"recall_at_100": 0.90162,
"precision_at_1": 0.46875,
"precision_at_3": 0.30781,
"precision_at_5": 0.24,
"precision_at_10": 0.15109,
"precision_at_20": 0.09297,
"precision_at_50": 0.04666,
"precision_at_100": 0.02609,
"mrr_at_1": 0.46875,
"mrr_at_3": 0.5653645833333331,
"mrr_at_5": 0.5828645833333328,
"mrr_at_10": 0.5928670634920632,
"mrr_at_20": 0.5961635393061956,
"mrr_at_50": 0.5979642273664314,
"mrr_at_100": 0.598388641842729,
"naucs_at_1_max": 0.25717698422505025,
"naucs_at_1_std": -0.10478191029284567,
"naucs_at_1_diff1": 0.4072573005477985,
"naucs_at_3_max": 0.2659990641306254,
"naucs_at_3_std": 0.04479561155056106,
"naucs_at_3_diff1": 0.11139438643390147,
"naucs_at_5_max": 0.2170152015957716,
"naucs_at_5_std": 0.06816504281074703,
"naucs_at_5_diff1": 0.03610018938984803,
"naucs_at_10_max": 0.23222160900815464,
"naucs_at_10_std": 0.1310209006859444,
"naucs_at_10_diff1": -0.038456197207725154,
"naucs_at_20_max": 0.27497446589778796,
"naucs_at_20_std": 0.208324896139066,
"naucs_at_20_diff1": -0.08762814336480476,
"naucs_at_50_max": 0.27441764448304734,
"naucs_at_50_std": 0.2529300579928729,
"naucs_at_50_diff1": -0.11931330945117197,
"naucs_at_100_max": 0.26643076503646324,
"naucs_at_100_std": 0.23283573973890204,
"naucs_at_100_diff1": -0.09996794144423607
},
"vidore/synthetics_economics_macro_economy_2024_filtered_v1.0_multilingual": {
"ndcg_at_1": 0.64224,
"ndcg_at_3": 0.60064,
"ndcg_at_5": 0.55019,
"ndcg_at_10": 0.52755,
"ndcg_at_20": 0.55431,
"ndcg_at_50": 0.62193,
"ndcg_at_100": 0.66273,
"map_at_1": 0.12328,
"map_at_3": 0.20176,
"map_at_5": 0.23781,
"map_at_10": 0.29317,
"map_at_20": 0.3496,
"map_at_50": 0.40329,
"map_at_100": 0.42827,
"recall_at_1": 0.12328,
"recall_at_3": 0.22334,
"recall_at_5": 0.27732,
"recall_at_10": 0.39122,
"recall_at_20": 0.54233,
"recall_at_50": 0.74043,
"recall_at_100": 0.86408,
"precision_at_1": 0.64224,
"precision_at_3": 0.54023,
"precision_at_5": 0.45345,
"precision_at_10": 0.36509,
"precision_at_20": 0.28384,
"precision_at_50": 0.18336,
"precision_at_100": 0.11944,
"mrr_at_1": 0.6422413793103449,
"mrr_at_3": 0.726293103448276,
"mrr_at_5": 0.7344827586206897,
"mrr_at_10": 0.7423662424740011,
"mrr_at_20": 0.7454521368427901,
"mrr_at_50": 0.7464683101612821,
"mrr_at_100": 0.7466140292051692,
"naucs_at_1_max": 0.04669677333287125,
"naucs_at_1_std": -0.047276436301337176,
"naucs_at_1_diff1": 0.20998438017074644,
"naucs_at_3_max": 0.1207746945432274,
"naucs_at_3_std": 0.11705226278367024,
"naucs_at_3_diff1": -0.0659769870275157,
"naucs_at_5_max": 0.17489805487159318,
"naucs_at_5_std": 0.15087482671660668,
"naucs_at_5_diff1": -0.10486886234938332,
"naucs_at_10_max": 0.13971495080647375,
"naucs_at_10_std": 0.12342403085916763,
"naucs_at_10_diff1": -0.11904046578732998,
"naucs_at_20_max": 0.1262352504070948,
"naucs_at_20_std": 0.1870795410571109,
"naucs_at_20_diff1": -0.09021505632729916,
"naucs_at_50_max": 0.08609145496415921,
"naucs_at_50_std": 0.19880949579195997,
"naucs_at_50_diff1": -0.10141550865230196,
"naucs_at_100_max": 0.029463316752851777,
"naucs_at_100_std": 0.1254397237152911,
"naucs_at_100_diff1": -0.10340073450123488
},
"vidore/arxivqa_test_subsampled": {
"ndcg_at_1": 0.78,
"ndcg_at_3": 0.83717,
"ndcg_at_5": 0.8493,
"ndcg_at_10": 0.85579,
"ndcg_at_20": 0.86416,
"ndcg_at_50": 0.86978,
"ndcg_at_100": 0.8714,
"map_at_1": 0.78,
"map_at_3": 0.82367,
"map_at_5": 0.83027,
"map_at_10": 0.83296,
"map_at_20": 0.83513,
"map_at_50": 0.83606,
"map_at_100": 0.8362,
"recall_at_1": 0.78,
"recall_at_3": 0.876,
"recall_at_5": 0.906,
"recall_at_10": 0.926,
"recall_at_20": 0.96,
"recall_at_50": 0.988,
"recall_at_100": 0.998,
"precision_at_1": 0.78,
"precision_at_3": 0.292,
"precision_at_5": 0.1812,
"precision_at_10": 0.0926,
"precision_at_20": 0.048,
"precision_at_50": 0.01976,
"precision_at_100": 0.00998,
"mrr_at_1": 0.78,
"mrr_at_3": 0.8236666666666668,
"mrr_at_5": 0.8302666666666666,
"mrr_at_10": 0.8329571428571427,
"mrr_at_20": 0.8351287569413728,
"mrr_at_50": 0.8360576689817807,
"mrr_at_100": 0.8362028700500819,
"naucs_at_1_max": 0.7913757128946993,
"naucs_at_1_std": -0.6034404414151248,
"naucs_at_1_diff1": 0.9052951268141137,
"naucs_at_3_max": 0.7991254905596246,
"naucs_at_3_std": -0.5793856802941784,
"naucs_at_3_diff1": 0.8585874972961292,
"naucs_at_5_max": 0.7909291376124926,
"naucs_at_5_std": -0.4963148379919354,
"naucs_at_5_diff1": 0.8356576673222494,
"naucs_at_10_max": 0.8344689227042192,
"naucs_at_10_std": -0.5341433870845648,
"naucs_at_10_diff1": 0.8497867615514662,
"naucs_at_20_max": 0.8126984126984111,
"naucs_at_20_std": -0.4176003734827309,
"naucs_at_20_diff1": 0.8263305322128826,
"naucs_at_50_max": 0.9074074074074128,
"naucs_at_50_std": -0.04474011826952445,
"naucs_at_50_diff1": 0.860333022097726,
"naucs_at_100_max": 1.0,
"naucs_at_100_std": 1.0,
"naucs_at_100_diff1": 1.0
},
"vidore/docvqa_test_subsampled": {
"ndcg_at_1": 0.45455,
"ndcg_at_3": 0.53012,
"ndcg_at_5": 0.55569,
"ndcg_at_10": 0.57792,
"ndcg_at_20": 0.59293,
"ndcg_at_50": 0.60814,
"ndcg_at_100": 0.61994,
"map_at_1": 0.45455,
"map_at_3": 0.51109,
"map_at_5": 0.52528,
"map_at_10": 0.53447,
"map_at_20": 0.53882,
"map_at_50": 0.54136,
"map_at_100": 0.54249,
"recall_at_1": 0.45455,
"recall_at_3": 0.58537,
"recall_at_5": 0.64745,
"recall_at_10": 0.71619,
"recall_at_20": 0.77384,
"recall_at_50": 0.84922,
"recall_at_100": 0.92018,
"precision_at_1": 0.45455,
"precision_at_3": 0.19512,
"precision_at_5": 0.12949,
"precision_at_10": 0.07162,
"precision_at_20": 0.03869,
"precision_at_50": 0.01698,
"precision_at_100": 0.0092,
"mrr_at_1": 0.45454545454545453,
"mrr_at_3": 0.5110864745011089,
"mrr_at_5": 0.5252771618625277,
"mrr_at_10": 0.5344683771513038,
"mrr_at_20": 0.5388215531769072,
"mrr_at_50": 0.5413611772588918,
"mrr_at_100": 0.5424869155538622,
"naucs_at_1_max": 0.4075821857009155,
"naucs_at_1_std": -0.310949225760234,
"naucs_at_1_diff1": 0.7407514800732501,
"naucs_at_3_max": 0.46743175097720985,
"naucs_at_3_std": -0.1986126839848541,
"naucs_at_3_diff1": 0.6505296132803555,
"naucs_at_5_max": 0.5364564428320254,
"naucs_at_5_std": -0.14408657067489153,
"naucs_at_5_diff1": 0.6322410022842855,
"naucs_at_10_max": 0.5825512151708625,
"naucs_at_10_std": -0.07725749814895451,
"naucs_at_10_diff1": 0.6332882465209557,
"naucs_at_20_max": 0.5813970577815284,
"naucs_at_20_std": -0.02416200306109636,
"naucs_at_20_diff1": 0.5952214798946482,
"naucs_at_50_max": 0.6298047922819098,
"naucs_at_50_std": 0.21852001263213766,
"naucs_at_50_diff1": 0.5810079368486553,
"naucs_at_100_max": 0.6564226194686283,
"naucs_at_100_std": 0.46804642848156325,
"naucs_at_100_diff1": 0.49830945198923904
},
"vidore/infovqa_test_subsampled": {
"ndcg_at_1": 0.7753,
"ndcg_at_3": 0.84285,
"ndcg_at_5": 0.85383,
"ndcg_at_10": 0.86362,
"ndcg_at_20": 0.86829,
"ndcg_at_50": 0.87162,
"ndcg_at_100": 0.87297,
"map_at_1": 0.7753,
"map_at_3": 0.82692,
"map_at_5": 0.8331,
"map_at_10": 0.83712,
"map_at_20": 0.83843,
"map_at_50": 0.83902,
"map_at_100": 0.83915,
"recall_at_1": 0.7753,
"recall_at_3": 0.88866,
"recall_at_5": 0.91498,
"recall_at_10": 0.94534,
"recall_at_20": 0.96356,
"recall_at_50": 0.97976,
"recall_at_100": 0.98785,
"precision_at_1": 0.7753,
"precision_at_3": 0.29622,
"precision_at_5": 0.183,
"precision_at_10": 0.09453,
"precision_at_20": 0.04818,
"precision_at_50": 0.0196,
"precision_at_100": 0.00988,
"mrr_at_1": 0.7753036437246964,
"mrr_at_3": 0.8269230769230768,
"mrr_at_5": 0.8330971659919026,
"mrr_at_10": 0.8371192404087138,
"mrr_at_20": 0.8384322229490562,
"mrr_at_50": 0.8390209545984961,
"mrr_at_100": 0.8391494570651827,
"naucs_at_1_max": 0.42955277741228204,
"naucs_at_1_std": -0.413540459458001,
"naucs_at_1_diff1": 0.8615855669987156,
"naucs_at_3_max": 0.46912857131917574,
"naucs_at_3_std": -0.3714926257299717,
"naucs_at_3_diff1": 0.82680032161878,
"naucs_at_5_max": 0.6392482503231406,
"naucs_at_5_std": -0.2299842899342104,
"naucs_at_5_diff1": 0.8417184248940351,
"naucs_at_10_max": 0.7086238741706962,
"naucs_at_10_std": -0.0498141562896836,
"naucs_at_10_diff1": 0.837619456912457,
"naucs_at_20_max": 0.6570477401161009,
"naucs_at_20_std": 0.0009204781615544056,
"naucs_at_20_diff1": 0.7936258020327029,
"naucs_at_50_max": 0.774779293140126,
"naucs_at_50_std": 0.35856346999101907,
"naucs_at_50_diff1": 0.7547641636196891,
"naucs_at_100_max": 0.7116997912767351,
"naucs_at_100_std": 0.3194376069347773,
"naucs_at_100_diff1": 0.7833756960419608
},
"vidore/tabfquad_test_subsampled": {
"ndcg_at_1": 0.87143,
"ndcg_at_3": 0.91866,
"ndcg_at_5": 0.92758,
"ndcg_at_10": 0.92996,
"ndcg_at_20": 0.9336,
"ndcg_at_50": 0.93499,
"ndcg_at_100": 0.93499,
"map_at_1": 0.87143,
"map_at_3": 0.90774,
"map_at_5": 0.91274,
"map_at_10": 0.91376,
"map_at_20": 0.91476,
"map_at_50": 0.91497,
"map_at_100": 0.91497,
"recall_at_1": 0.87143,
"recall_at_3": 0.95,
"recall_at_5": 0.97143,
"recall_at_10": 0.97857,
"recall_at_20": 0.99286,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.87143,
"precision_at_3": 0.31667,
"precision_at_5": 0.19429,
"precision_at_10": 0.09786,
"precision_at_20": 0.04964,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.8714285714285714,
"mrr_at_3": 0.9077380952380953,
"mrr_at_5": 0.9127380952380953,
"mrr_at_10": 0.9137585034013606,
"mrr_at_20": 0.9147645211930926,
"mrr_at_50": 0.9149716040262259,
"mrr_at_100": 0.9149716040262259,
"naucs_at_1_max": 0.7871300352601777,
"naucs_at_1_std": 0.20583128539373943,
"naucs_at_1_diff1": 0.9197964526124592,
"naucs_at_3_max": 0.9229691876750705,
"naucs_at_3_std": 0.460784313725494,
"naucs_at_3_diff1": 0.9626517273576086,
"naucs_at_5_max": 0.9673202614379075,
"naucs_at_5_std": 0.562791783380022,
"naucs_at_5_diff1": 0.934640522875815,
"naucs_at_10_max": 0.9782135076252753,
"naucs_at_10_std": 0.7584811702458847,
"naucs_at_10_diff1": 0.9128540305010935,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": 1.0,
"naucs_at_20_diff1": 0.8692810457516309,
"naucs_at_50_max": 1.0,
"naucs_at_50_std": 1.0,
"naucs_at_50_diff1": 1.0,
"naucs_at_100_max": 1.0,
"naucs_at_100_std": 1.0,
"naucs_at_100_diff1": 1.0
},
"vidore/tatdqa_test": {
"ndcg_at_1": 0.55346,
"ndcg_at_3": 0.66654,
"ndcg_at_5": 0.69922,
"ndcg_at_10": 0.72683,
"ndcg_at_20": 0.73868,
"ndcg_at_50": 0.74458,
"ndcg_at_100": 0.74555,
"map_at_1": 0.55346,
"map_at_3": 0.63902,
"map_at_5": 0.65725,
"map_at_10": 0.66893,
"map_at_20": 0.67236,
"map_at_50": 0.6733,
"map_at_100": 0.67338,
"recall_at_1": 0.55346,
"recall_at_3": 0.74605,
"recall_at_5": 0.82503,
"recall_at_10": 0.90887,
"recall_at_20": 0.95443,
"recall_at_50": 0.9842,
"recall_at_100": 0.99028,
"precision_at_1": 0.55346,
"precision_at_3": 0.24868,
"precision_at_5": 0.16501,
"precision_at_10": 0.09089,
"precision_at_20": 0.04772,
"precision_at_50": 0.01968,
"precision_at_100": 0.0099,
"mrr_at_1": 0.5552855407047388,
"mrr_at_3": 0.6395301741595798,
"mrr_at_5": 0.6578473066018649,
"mrr_at_10": 0.6696035603386765,
"mrr_at_20": 0.6729832012543134,
"mrr_at_50": 0.6739181612518058,
"mrr_at_100": 0.6739995114642742,
"naucs_at_1_max": 0.4481578507912886,
"naucs_at_1_std": -0.28229697462188064,
"naucs_at_1_diff1": 0.6794797414689293,
"naucs_at_3_max": 0.521452354349859,
"naucs_at_3_std": -0.2525394663950513,
"naucs_at_3_diff1": 0.5641368811967125,
"naucs_at_5_max": 0.5522320601024093,
"naucs_at_5_std": -0.23449944203419384,
"naucs_at_5_diff1": 0.5550996108687463,
"naucs_at_10_max": 0.6709947806703614,
"naucs_at_10_std": -0.018864423203824147,
"naucs_at_10_diff1": 0.5147848561655853,
"naucs_at_20_max": 0.6719932800208073,
"naucs_at_20_std": 0.18814578113635355,
"naucs_at_20_diff1": 0.4774949408808388,
"naucs_at_50_max": 0.710665729775863,
"naucs_at_50_std": 0.409805723201301,
"naucs_at_50_diff1": 0.4920058027972864,
"naucs_at_100_max": 0.6822698211447887,
"naucs_at_100_std": 0.3946630393669552,
"naucs_at_100_diff1": 0.5232939215033167
},
"vidore/shiftproject_test": {
"ndcg_at_1": 0.59,
"ndcg_at_3": 0.76142,
"ndcg_at_5": 0.78683,
"ndcg_at_10": 0.8064,
"ndcg_at_20": 0.8064,
"ndcg_at_50": 0.8064,
"ndcg_at_100": 0.80812,
"map_at_1": 0.59,
"map_at_3": 0.72333,
"map_at_5": 0.73783,
"map_at_10": 0.74602,
"map_at_20": 0.74602,
"map_at_50": 0.74602,
"map_at_100": 0.74621,
"recall_at_1": 0.59,
"recall_at_3": 0.87,
"recall_at_5": 0.93,
"recall_at_10": 0.99,
"recall_at_20": 0.99,
"recall_at_50": 0.99,
"recall_at_100": 1.0,
"precision_at_1": 0.59,
"precision_at_3": 0.29,
"precision_at_5": 0.186,
"precision_at_10": 0.099,
"precision_at_20": 0.0495,
"precision_at_50": 0.0198,
"precision_at_100": 0.01,
"mrr_at_1": 0.59,
"mrr_at_3": 0.7233333333333333,
"mrr_at_5": 0.7378333333333333,
"mrr_at_10": 0.7460238095238095,
"mrr_at_20": 0.7460238095238095,
"mrr_at_50": 0.7460238095238095,
"mrr_at_100": 0.7462056277056278,
"naucs_at_1_max": 0.14863456938676678,
"naucs_at_1_std": -0.41319500491584377,
"naucs_at_1_diff1": 0.6677623373002481,
"naucs_at_3_max": 0.34644153151151447,
"naucs_at_3_std": -0.3760275494334602,
"naucs_at_3_diff1": 0.5028141894393838,
"naucs_at_5_max": 0.29825263438709065,
"naucs_at_5_std": -0.40456182472989133,
"naucs_at_5_diff1": 0.434507136187809,
"naucs_at_10_max": -0.1713352007469681,
"naucs_at_10_std": -0.5634920634920767,
"naucs_at_10_diff1": -1.1517273576097316,
"naucs_at_20_max": -0.1713352007469681,
"naucs_at_20_std": -0.5634920634920767,
"naucs_at_20_diff1": -1.1517273576097316,
"naucs_at_50_max": -0.17133520074697067,
"naucs_at_50_std": -0.5634920634920583,
"naucs_at_50_diff1": -1.1517273576096694,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"vidore/syntheticDocQA_artificial_intelligence_test": {
"ndcg_at_1": 0.87,
"ndcg_at_3": 0.94047,
"ndcg_at_5": 0.94478,
"ndcg_at_10": 0.94478,
"ndcg_at_20": 0.94478,
"ndcg_at_50": 0.94478,
"ndcg_at_100": 0.94478,
"map_at_1": 0.87,
"map_at_3": 0.92333,
"map_at_5": 0.92583,
"map_at_10": 0.92583,
"map_at_20": 0.92583,
"map_at_50": 0.92583,
"map_at_100": 0.92583,
"recall_at_1": 0.87,
"recall_at_3": 0.99,
"recall_at_5": 1.0,
"recall_at_10": 1.0,
"recall_at_20": 1.0,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.87,
"precision_at_3": 0.33,
"precision_at_5": 0.2,
"precision_at_10": 0.1,
"precision_at_20": 0.05,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.87,
"mrr_at_3": 0.9233333333333333,
"mrr_at_5": 0.9258333333333333,
"mrr_at_10": 0.9258333333333333,
"mrr_at_20": 0.9258333333333333,
"mrr_at_50": 0.9258333333333333,
"mrr_at_100": 0.9258333333333333,
"naucs_at_1_max": 0.37958231504110235,
"naucs_at_1_std": 0.006480041472265402,
"naucs_at_1_diff1": 0.9063171147152481,
"naucs_at_3_max": 1.0,
"naucs_at_3_std": 0.7222222222222157,
"naucs_at_3_diff1": 0.8692810457516356,
"naucs_at_5_max": 1.0,
"naucs_at_5_std": 1.0,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 1.0,
"naucs_at_10_std": 1.0,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": 1.0,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"vidore/syntheticDocQA_energy_test": {
"ndcg_at_1": 0.85,
"ndcg_at_3": 0.89155,
"ndcg_at_5": 0.89542,
"ndcg_at_10": 0.91169,
"ndcg_at_20": 0.91448,
"ndcg_at_50": 0.91661,
"ndcg_at_100": 0.91661,
"map_at_1": 0.85,
"map_at_3": 0.88167,
"map_at_5": 0.88367,
"map_at_10": 0.89044,
"map_at_20": 0.89135,
"map_at_50": 0.89175,
"map_at_100": 0.89175,
"recall_at_1": 0.85,
"recall_at_3": 0.92,
"recall_at_5": 0.93,
"recall_at_10": 0.98,
"recall_at_20": 0.99,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.85,
"precision_at_3": 0.30667,
"precision_at_5": 0.186,
"precision_at_10": 0.098,
"precision_at_20": 0.0495,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.85,
"mrr_at_3": 0.8816666666666667,
"mrr_at_5": 0.8836666666666667,
"mrr_at_10": 0.8904404761904763,
"mrr_at_20": 0.8913495670995673,
"mrr_at_50": 0.8917495670995673,
"mrr_at_100": 0.8917495670995673,
"naucs_at_1_max": 0.36173120728929387,
"naucs_at_1_std": -0.9650178978197211,
"naucs_at_1_diff1": 0.9199479336153596,
"naucs_at_3_max": 0.4982492997198882,
"naucs_at_3_std": -1.0291783380018664,
"naucs_at_3_diff1": 0.932598039215688,
"naucs_at_5_max": 0.5939042283580102,
"naucs_at_5_std": -1.0116713352007418,
"naucs_at_5_diff1": 0.96265172735761,
"naucs_at_10_max": 0.21825396825397442,
"naucs_at_10_std": -1.7399626517273414,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": -1.7399626517273863,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"vidore/syntheticDocQA_government_reports_test": {
"ndcg_at_1": 0.9,
"ndcg_at_3": 0.96047,
"ndcg_at_5": 0.96047,
"ndcg_at_10": 0.96047,
"ndcg_at_20": 0.96047,
"ndcg_at_50": 0.96047,
"ndcg_at_100": 0.96047,
"map_at_1": 0.9,
"map_at_3": 0.94667,
"map_at_5": 0.94667,
"map_at_10": 0.94667,
"map_at_20": 0.94667,
"map_at_50": 0.94667,
"map_at_100": 0.94667,
"recall_at_1": 0.9,
"recall_at_3": 1.0,
"recall_at_5": 1.0,
"recall_at_10": 1.0,
"recall_at_20": 1.0,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.9,
"precision_at_3": 0.33333,
"precision_at_5": 0.2,
"precision_at_10": 0.1,
"precision_at_20": 0.05,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.9,
"mrr_at_3": 0.9466666666666668,
"mrr_at_5": 0.9466666666666668,
"mrr_at_10": 0.9466666666666668,
"mrr_at_20": 0.9466666666666668,
"mrr_at_50": 0.9466666666666668,
"mrr_at_100": 0.9466666666666668,
"naucs_at_1_max": 0.2663398692810457,
"naucs_at_1_std": -0.1846405228758159,
"naucs_at_1_diff1": 0.8835200746965451,
"naucs_at_3_max": 1.0,
"naucs_at_3_std": 1.0,
"naucs_at_3_diff1": 1.0,
"naucs_at_5_max": 1.0,
"naucs_at_5_std": 1.0,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 1.0,
"naucs_at_10_std": 1.0,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": 1.0,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"vidore/syntheticDocQA_healthcare_industry_test": {
"ndcg_at_1": 0.87,
"ndcg_at_3": 0.95071,
"ndcg_at_5": 0.95071,
"ndcg_at_10": 0.95071,
"ndcg_at_20": 0.95071,
"ndcg_at_50": 0.95071,
"ndcg_at_100": 0.95071,
"map_at_1": 0.87,
"map_at_3": 0.93333,
"map_at_5": 0.93333,
"map_at_10": 0.93333,
"map_at_20": 0.93333,
"map_at_50": 0.93333,
"map_at_100": 0.93333,
"recall_at_1": 0.87,
"recall_at_3": 1.0,
"recall_at_5": 1.0,
"recall_at_10": 1.0,
"recall_at_20": 1.0,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.87,
"precision_at_3": 0.33333,
"precision_at_5": 0.2,
"precision_at_10": 0.1,
"precision_at_20": 0.05,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.87,
"mrr_at_3": 0.9333333333333332,
"mrr_at_5": 0.9333333333333332,
"mrr_at_10": 0.9333333333333332,
"mrr_at_20": 0.9333333333333332,
"mrr_at_50": 0.9333333333333332,
"mrr_at_100": 0.9333333333333332,
"naucs_at_1_max": 0.640339183885063,
"naucs_at_1_std": -0.4568984670073326,
"naucs_at_1_diff1": 0.9339035769828927,
"naucs_at_3_max": 1.0,
"naucs_at_3_std": 1.0,
"naucs_at_3_diff1": 1.0,
"naucs_at_5_max": 1.0,
"naucs_at_5_std": 1.0,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 1.0,
"naucs_at_10_std": 1.0,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": 1.0,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
}
}
}