{"vidore/arxivqa_test_subsampled": {"ndcg_at_1": 0.622, "ndcg_at_3": 0.69369, "ndcg_at_5": 0.70427, "ndcg_at_10": 0.71783, "ndcg_at_20": 0.727, "ndcg_at_100": 0.74493, "ndcg_at_1000": 0.75223, "map_at_1": 0.622, "map_at_3": 0.67567, "map_at_5": 0.68147, "map_at_10": 0.68705, "map_at_20": 0.68961, "map_at_100": 0.69214, "map_at_1000": 0.69247, "recall_at_1": 0.622, "recall_at_3": 0.746, "recall_at_5": 0.772, "recall_at_10": 0.814, "recall_at_20": 0.85, "recall_at_100": 0.946, "recall_at_1000": 1.0, "precision_at_1": 0.622, "precision_at_3": 0.24867, "precision_at_5": 0.1544, "precision_at_10": 0.0814, "precision_at_20": 0.0425, "precision_at_100": 0.00946, "precision_at_1000": 0.001, "mrr_at_1": 0.622, "mrr_at_3": 0.6736666666666665, "mrr_at_5": 0.6804666666666664, "mrr_at_10": 0.6862682539682539, "mrr_at_20": 0.688662312395207, "mrr_at_100": 0.6911966165133806, "mrr_at_1000": 0.6915317530986231, "naucs_at_1_max": 0.6984372056830003, "naucs_at_1_std": 0.25231053319046604, "naucs_at_1_diff1": 0.863091065732469, "naucs_at_3_max": 0.6807235637623004, "naucs_at_3_std": 0.2414317536543939, "naucs_at_3_diff1": 0.8063264302451976, "naucs_at_5_max": 0.6629240324892501, "naucs_at_5_std": 0.27148446303491397, "naucs_at_5_diff1": 0.8022158317482351, "naucs_at_10_max": 0.6602214077343115, "naucs_at_10_std": 0.25396706666809093, "naucs_at_10_diff1": 0.7651282818460624, "naucs_at_20_max": 0.6446404165310774, "naucs_at_20_std": 0.26381386267491136, "naucs_at_20_diff1": 0.7524438659290602, "naucs_at_100_max": 0.7423142096344666, "naucs_at_100_std": 0.34984611128401694, "naucs_at_100_diff1": 0.7420721374969711, "naucs_at_1000_max": 1.0, "naucs_at_1000_std": 1.0, "naucs_at_1000_diff1": 1.0}, "vidore/docvqa_test_subsampled": {"ndcg_at_1": 0.30377, "ndcg_at_3": 0.37182, "ndcg_at_5": 0.39548, "ndcg_at_10": 0.41691, "ndcg_at_20": 0.43379, "ndcg_at_100": 0.46741, "ndcg_at_1000": 0.4939, "map_at_1": 0.30377, "map_at_3": 0.35477, "map_at_5": 0.36785, "map_at_10": 0.37664, "map_at_20": 0.38131, "map_at_100": 0.38576, "map_at_1000": 0.38681, "recall_at_1": 0.30377, "recall_at_3": 0.42129, "recall_at_5": 0.47894, "recall_at_10": 0.54545, "recall_at_20": 0.61197, "recall_at_100": 0.79601, "recall_at_1000": 1.0, "precision_at_1": 0.30377, "precision_at_3": 0.14043, "precision_at_5": 0.09579, "precision_at_10": 0.05455, "precision_at_20": 0.0306, "precision_at_100": 0.00796, "precision_at_1000": 0.001, "mrr_at_1": 0.30155210643015523, "mrr_at_3": 0.3547671840354768, "mrr_at_5": 0.3677383592017738, "mrr_at_10": 0.3758886777179459, "mrr_at_20": 0.3808746495191476, "mrr_at_100": 0.38521917916910364, "mrr_at_1000": 0.3862695215417875, "naucs_at_1_max": 0.4928763364311302, "naucs_at_1_std": 0.24853148639823786, "naucs_at_1_diff1": 0.7259530605621985, "naucs_at_3_max": 0.446649632566899, "naucs_at_3_std": 0.2979324677451571, "naucs_at_3_diff1": 0.5948333805489103, "naucs_at_5_max": 0.4212406030554807, "naucs_at_5_std": 0.2980189188097191, "naucs_at_5_diff1": 0.5128514344633472, "naucs_at_10_max": 0.3841239837660503, "naucs_at_10_std": 0.3051410138541696, "naucs_at_10_diff1": 0.4833799034029087, "naucs_at_20_max": 0.37081454305491823, "naucs_at_20_std": 0.3428527717716659, "naucs_at_20_diff1": 0.4432615232615892, "naucs_at_100_max": 0.3715026405085789, "naucs_at_100_std": 0.4646797252908688, "naucs_at_100_diff1": 0.45378439880433125, "naucs_at_1000_max": 1.0, "naucs_at_1000_std": 1.0, "naucs_at_1000_diff1": 1.0}, "vidore/infovqa_test_subsampled": {"ndcg_at_1": 0.68016, "ndcg_at_3": 0.75634, "ndcg_at_5": 0.77472, "ndcg_at_10": 0.78922, "ndcg_at_20": 0.79779, "ndcg_at_100": 0.8057, "ndcg_at_1000": 0.80892, "map_at_1": 0.68016, "map_at_3": 0.73785, "map_at_5": 0.74808, "map_at_10": 0.75413, "map_at_20": 0.75641, "map_at_100": 0.75751, "map_at_1000": 0.75765, "recall_at_1": 0.68016, "recall_at_3": 0.80972, "recall_at_5": 0.85425, "recall_at_10": 0.89879, "recall_at_20": 0.9332, "recall_at_100": 0.97571, "recall_at_1000": 1.0, "precision_at_1": 0.68016, "precision_at_3": 0.26991, "precision_at_5": 0.17085, "precision_at_10": 0.08988, "precision_at_20": 0.04666, "precision_at_100": 0.00976, "precision_at_1000": 0.001, "mrr_at_1": 0.680161943319838, "mrr_at_3": 0.7378542510121456, "mrr_at_5": 0.7480769230769229, "mrr_at_10": 0.7540919606709079, "mrr_at_20": 0.7564901974189586, "mrr_at_100": 0.7575034872691773, "mrr_at_1000": 0.7576408958804035, "naucs_at_1_max": 0.35566271868132526, "naucs_at_1_std": -0.13017376191751398, "naucs_at_1_diff1": 0.8407113334078951, "naucs_at_3_max": 0.3737930321884956, "naucs_at_3_std": -0.12727167771097328, "naucs_at_3_diff1": 0.7771427225016556, "naucs_at_5_max": 0.41907683428958065, "naucs_at_5_std": -0.03122637604043099, "naucs_at_5_diff1": 0.775179180381762, "naucs_at_10_max": 0.5296332750599823, "naucs_at_10_std": 0.09621625399114077, "naucs_at_10_diff1": 0.7921537877237935, "naucs_at_20_max": 0.6614807974603235, "naucs_at_20_std": 0.26564925037604614, "naucs_at_20_diff1": 0.788090173438919, "naucs_at_100_max": 0.5764310655230227, "naucs_at_100_std": 0.26774513072852335, "naucs_at_100_diff1": 0.7291737175763904, "naucs_at_1000_max": 1.0, "naucs_at_1000_std": 1.0, "naucs_at_1000_diff1": 1.0}, "vidore/tabfquad_test_subsampled": {"ndcg_at_1": 0.55357, "ndcg_at_3": 0.62814, "ndcg_at_5": 0.64152, "ndcg_at_10": 0.66811, "ndcg_at_20": 0.67993, "ndcg_at_100": 0.71041, "ndcg_at_1000": 0.71041, "map_at_1": 0.55357, "map_at_3": 0.60952, "map_at_5": 0.61702, "map_at_10": 0.62802, "map_at_20": 0.6313, "map_at_100": 0.63596, "map_at_1000": 0.63596, "recall_at_1": 0.55357, "recall_at_3": 0.68214, "recall_at_5": 0.71429, "recall_at_10": 0.79643, "recall_at_20": 0.84286, "recall_at_100": 1.0, "recall_at_1000": 1.0, "precision_at_1": 0.55357, "precision_at_3": 0.22738, "precision_at_5": 0.14286, "precision_at_10": 0.07964, "precision_at_20": 0.04214, "precision_at_100": 0.01, "precision_at_1000": 0.001, "mrr_at_1": 0.5535714285714286, "mrr_at_3": 0.6095238095238095, "mrr_at_5": 0.6170238095238095, "mrr_at_10": 0.6276643990929704, "mrr_at_20": 0.6312696030442602, "mrr_at_100": 0.6359366342220795, "mrr_at_1000": 0.6359366342220795, "naucs_at_1_max": 0.4612480177209454, "naucs_at_1_std": 0.1267551035819467, "naucs_at_1_diff1": 0.8295315528481892, "naucs_at_3_max": 0.4972329468341564, "naucs_at_3_std": 0.3175015338088654, "naucs_at_3_diff1": 0.7089233591343741, "naucs_at_5_max": 0.5117059769498793, "naucs_at_5_std": 0.3708054140980973, "naucs_at_5_diff1": 0.6843674618064864, "naucs_at_10_max": 0.4390413429644816, "naucs_at_10_std": 0.3337351199641042, "naucs_at_10_diff1": 0.5761708267713077, "naucs_at_20_max": 0.40009803047856857, "naucs_at_20_std": 0.30784912218162297, "naucs_at_20_diff1": 0.5373295606452183, "naucs_at_100_max": 1.0, "naucs_at_100_std": 1.0, "naucs_at_100_diff1": 1.0, "naucs_at_1000_max": NaN, "naucs_at_1000_std": NaN, "naucs_at_1000_diff1": NaN}, "vidore/tatdqa_test": {"ndcg_at_1": 0.27339, "ndcg_at_3": 0.37032, "ndcg_at_5": 0.40744, "ndcg_at_10": 0.44291, "ndcg_at_20": 0.46796, "ndcg_at_100": 0.50544, "ndcg_at_1000": 0.51354, "map_at_1": 0.27339, "map_at_3": 0.3465, "map_at_5": 0.367, "map_at_10": 0.38136, "map_at_20": 0.38832, "map_at_100": 0.39346, "map_at_1000": 0.39387, "recall_at_1": 0.27339, "recall_at_3": 0.43925, "recall_at_5": 0.52977, "recall_at_10": 0.64095, "recall_at_20": 0.73937, "recall_at_100": 0.94168, "recall_at_1000": 1.0, "precision_at_1": 0.27339, "precision_at_3": 0.14642, "precision_at_5": 0.10595, "precision_at_10": 0.06409, "precision_at_20": 0.03697, "precision_at_100": 0.00942, "precision_at_1000": 0.001, "mrr_at_1": 0.2709599027946537, "mrr_at_3": 0.3449777237748073, "mrr_at_5": 0.3656946132037261, "mrr_at_10": 0.38013630928272474, "mrr_at_20": 0.3871318388831053, "mrr_at_100": 0.39236800875106836, "mrr_at_1000": 0.3927721673077235, "naucs_at_1_max": 0.10554489434048779, "naucs_at_1_std": -0.07852551910644305, "naucs_at_1_diff1": 0.5400649391521823, "naucs_at_3_max": 0.10297066707027175, "naucs_at_3_std": -0.010968118840326283, "naucs_at_3_diff1": 0.42126546399172343, "naucs_at_5_max": 0.103914859574771, "naucs_at_5_std": -0.006196709993623548, "naucs_at_5_diff1": 0.4032956786666166, "naucs_at_10_max": 0.09448577468935329, "naucs_at_10_std": -0.0016728294722104995, "naucs_at_10_diff1": 0.37407950317940747, "naucs_at_20_max": 0.08074941586194169, "naucs_at_20_std": 4.007008250921936e-05, "naucs_at_20_diff1": 0.3398398221486548, "naucs_at_100_max": 0.1894026512622526, "naucs_at_100_std": 0.18779694861230584, "naucs_at_100_diff1": 0.48000405282224096, "naucs_at_1000_max": NaN, "naucs_at_1000_std": NaN, "naucs_at_1000_diff1": NaN}, "vidore/shiftproject_test": {"ndcg_at_1": 0.25, "ndcg_at_3": 0.3494, "ndcg_at_5": 0.39845, "ndcg_at_10": 0.44231, "ndcg_at_20": 0.46774, "ndcg_at_100": 0.50084, "ndcg_at_1000": 0.50726, "map_at_1": 0.25, "map_at_3": 0.325, "map_at_5": 0.352, "map_at_10": 0.36926, "map_at_20": 0.37629, "map_at_100": 0.38145, "map_at_1000": 0.38169, "recall_at_1": 0.25, "recall_at_3": 0.42, "recall_at_5": 0.54, "recall_at_10": 0.68, "recall_at_20": 0.78, "recall_at_100": 0.95, "recall_at_1000": 1.0, "precision_at_1": 0.25, "precision_at_3": 0.14, "precision_at_5": 0.108, "precision_at_10": 0.068, "precision_at_20": 0.039, "precision_at_100": 0.0095, "precision_at_1000": 0.001, "mrr_at_1": 0.26, "mrr_at_3": 0.33000000000000007, "mrr_at_5": 0.35700000000000004, "mrr_at_10": 0.3746349206349207, "mrr_at_20": 0.3816949202758027, "mrr_at_100": 0.38685478604647594, "mrr_at_1000": 0.38709862816510116, "naucs_at_1_max": 0.1574549466715704, "naucs_at_1_std": -0.10303788157410809, "naucs_at_1_diff1": 0.2442809856564912, "naucs_at_3_max": 0.32091660834175784, "naucs_at_3_std": -0.1466158591907097, "naucs_at_3_diff1": 0.16244135106410507, "naucs_at_5_max": 0.24536689727987618, "naucs_at_5_std": -0.15837292656497418, "naucs_at_5_diff1": 0.17715539996110155, "naucs_at_10_max": 0.21313316287747947, "naucs_at_10_std": -0.10156519936424467, "naucs_at_10_diff1": 0.11676801879621386, "naucs_at_20_max": 0.19814995131450897, "naucs_at_20_std": -0.014281077572216307, "naucs_at_20_diff1": 0.19889182547410442, "naucs_at_100_max": 0.5425770308123271, "naucs_at_100_std": 0.1131652661064462, "naucs_at_100_diff1": 0.23445378151260604, "naucs_at_1000_max": NaN, "naucs_at_1000_std": NaN, "naucs_at_1000_diff1": NaN}, "vidore/syntheticDocQA_artificial_intelligence_test": {"ndcg_at_1": 0.82, "ndcg_at_3": 0.87786, "ndcg_at_5": 0.89034, "ndcg_at_10": 0.89349, "ndcg_at_20": 0.90134, "ndcg_at_100": 0.90294, "ndcg_at_1000": 0.90294, "map_at_1": 0.82, "map_at_3": 0.86333, "map_at_5": 0.87033, "map_at_10": 0.87158, "map_at_20": 0.87387, "map_at_100": 0.874, "map_at_1000": 0.874, "recall_at_1": 0.82, "recall_at_3": 0.92, "recall_at_5": 0.95, "recall_at_10": 0.96, "recall_at_20": 0.99, "recall_at_100": 1.0, "recall_at_1000": 1.0, "precision_at_1": 0.82, "precision_at_3": 0.30667, "precision_at_5": 0.19, "precision_at_10": 0.096, "precision_at_20": 0.0495, "precision_at_100": 0.01, "precision_at_1000": 0.001, "mrr_at_1": 0.82, "mrr_at_3": 0.8633333333333333, "mrr_at_5": 0.8703333333333333, "mrr_at_10": 0.8715833333333333, "mrr_at_20": 0.8739209956709957, "mrr_at_100": 0.8740525746183642, "mrr_at_1000": 0.8740525746183642, "naucs_at_1_max": 0.324182178654037, "naucs_at_1_std": -0.17948011895583169, "naucs_at_1_diff1": 0.8288908470095823, "naucs_at_3_max": 0.5691526610644263, "naucs_at_3_std": -0.13101073762838406, "naucs_at_3_diff1": 0.8045634920634936, "naucs_at_5_max": 0.5207282913165321, "naucs_at_5_std": -0.5524743230625453, "naucs_at_5_diff1": 0.7690009337068187, "naucs_at_10_max": 0.6202147525676922, "naucs_at_10_std": -0.40266106442576227, "naucs_at_10_diff1": 0.9305555555555542, "naucs_at_20_max": 0.12278244631185926, "naucs_at_20_std": -1.7399626517273863, "naucs_at_20_diff1": 1.0, "naucs_at_100_max": NaN, "naucs_at_100_std": NaN, "naucs_at_100_diff1": NaN, "naucs_at_1000_max": NaN, "naucs_at_1000_std": NaN, "naucs_at_1000_diff1": NaN}, "vidore/syntheticDocQA_energy_test": {"ndcg_at_1": 0.8, "ndcg_at_3": 0.87809, "ndcg_at_5": 0.88627, "ndcg_at_10": 0.88627, "ndcg_at_20": 0.89413, "ndcg_at_100": 0.89617, "ndcg_at_1000": 0.89745, "map_at_1": 0.8, "map_at_3": 0.86, "map_at_5": 0.8645, "map_at_10": 0.8645, "map_at_20": 0.8668, "map_at_100": 0.86715, "map_at_1000": 0.86719, "recall_at_1": 0.8, "recall_at_3": 0.93, "recall_at_5": 0.95, "recall_at_10": 0.95, "recall_at_20": 0.98, "recall_at_100": 0.99, "recall_at_1000": 1.0, "precision_at_1": 0.8, "precision_at_3": 0.31, "precision_at_5": 0.19, "precision_at_10": 0.095, "precision_at_20": 0.049, "precision_at_100": 0.0099, "precision_at_1000": 0.001, "mrr_at_1": 0.8, "mrr_at_3": 0.86, "mrr_at_5": 0.865, "mrr_at_10": 0.865, "mrr_at_20": 0.8673449883449884, "mrr_at_100": 0.8676898159311952, "mrr_at_1000": 0.8677338687946313, "naucs_at_1_max": 0.31336163836163833, "naucs_at_1_std": -0.3745004995005006, "naucs_at_1_diff1": 0.8786213786213782, "naucs_at_3_max": 0.4835934373749493, "naucs_at_3_std": -0.8576097105508865, "naucs_at_3_diff1": 0.8989595838335334, "naucs_at_5_max": 0.30317460317460687, "naucs_at_5_std": -1.190943043884201, "naucs_at_5_diff1": 0.9477124183006543, "naucs_at_10_max": 0.30317460317460687, "naucs_at_10_std": -1.190943043884201, "naucs_at_10_diff1": 0.9477124183006543, "naucs_at_20_max": 0.24042950513538955, "naucs_at_20_std": -0.9556489262371616, "naucs_at_20_diff1": 0.9346405228758136, "naucs_at_100_max": 0.35807656395892007, "naucs_at_100_std": -1.7399626517273008, "naucs_at_100_diff1": 1.0, "naucs_at_1000_max": NaN, "naucs_at_1000_std": NaN, "naucs_at_1000_diff1": NaN}, "vidore/syntheticDocQA_government_reports_test": {"ndcg_at_1": 0.8, "ndcg_at_3": 0.87547, "ndcg_at_5": 0.89226, "ndcg_at_10": 0.89898, "ndcg_at_20": 0.90133, "ndcg_at_100": 0.90133, "ndcg_at_1000": 0.90133, "map_at_1": 0.8, "map_at_3": 0.85667, "map_at_5": 0.86617, "map_at_10": 0.86908, "map_at_20": 0.86964, "map_at_100": 0.86964, "map_at_1000": 0.86964, "recall_at_1": 0.8, "recall_at_3": 0.93, "recall_at_5": 0.97, "recall_at_10": 0.99, "recall_at_20": 1.0, "recall_at_100": 1.0, "recall_at_1000": 1.0, "precision_at_1": 0.8, "precision_at_3": 0.31, "precision_at_5": 0.194, "precision_at_10": 0.099, "precision_at_20": 0.05, "precision_at_100": 0.01, "precision_at_1000": 0.001, "mrr_at_1": 0.8, "mrr_at_3": 0.8566666666666669, "mrr_at_5": 0.8661666666666669, "mrr_at_10": 0.8690833333333337, "mrr_at_20": 0.8696388888888891, "mrr_at_100": 0.8696388888888891, "mrr_at_1000": 0.8696388888888891, "naucs_at_1_max": 0.25077422577422587, "naucs_at_1_std": -0.24747752247752283, "naucs_at_1_diff1": 0.7295704295704294, "naucs_at_3_max": 0.2665066026410558, "naucs_at_3_std": -0.43657462985193923, "naucs_at_3_diff1": 0.7435640923035859, "naucs_at_5_max": -0.07983193277310867, "naucs_at_5_std": -0.628851540616243, "naucs_at_5_diff1": 0.9128540305010848, "naucs_at_10_max": 0.5541549953314738, "naucs_at_10_std": -0.1713352007469681, "naucs_at_10_diff1": 0.8692810457516413, "naucs_at_20_max": 1.0, "naucs_at_20_std": 1.0, "naucs_at_20_diff1": 1.0, "naucs_at_100_max": NaN, "naucs_at_100_std": NaN, "naucs_at_100_diff1": NaN, "naucs_at_1000_max": NaN, "naucs_at_1000_std": NaN, "naucs_at_1000_diff1": NaN}, "vidore/syntheticDocQA_healthcare_industry_test": {"ndcg_at_1": 0.8, "ndcg_at_3": 0.86809, "ndcg_at_5": 0.88488, "ndcg_at_10": 0.89438, "ndcg_at_20": 0.89701, "ndcg_at_100": 0.89913, "ndcg_at_1000": 0.89913, "map_at_1": 0.8, "map_at_3": 0.85333, "map_at_5": 0.86283, "map_at_10": 0.86662, "map_at_20": 0.86739, "map_at_100": 0.86779, "map_at_1000": 0.86779, "recall_at_1": 0.8, "recall_at_3": 0.91, "recall_at_5": 0.95, "recall_at_10": 0.98, "recall_at_20": 0.99, "recall_at_100": 1.0, "recall_at_1000": 1.0, "precision_at_1": 0.8, "precision_at_3": 0.30333, "precision_at_5": 0.19, "precision_at_10": 0.098, "precision_at_20": 0.0495, "precision_at_100": 0.01, "precision_at_1000": 0.001, "mrr_at_1": 0.8, "mrr_at_3": 0.8533333333333333, "mrr_at_5": 0.8628333333333333, "mrr_at_10": 0.8666230158730158, "mrr_at_20": 0.8673922466422468, "mrr_at_100": 0.8678089133089134, "mrr_at_1000": 0.8678089133089134, "naucs_at_1_max": 0.4438311688311687, "naucs_at_1_std": -0.4122627372627377, "naucs_at_1_diff1": 0.89547952047952, "naucs_at_3_max": 0.3717709305944596, "naucs_at_3_std": -0.9621848739495795, "naucs_at_3_diff1": 0.8474945533769087, "naucs_at_5_max": 0.27432306255836286, "naucs_at_5_std": -0.9674136321194953, "naucs_at_5_diff1": 0.8627450980392155, "naucs_at_10_max": 0.7957516339869297, "naucs_at_10_std": -0.10270774976657283, "naucs_at_10_diff1": 0.7957516339869297, "naucs_at_20_max": 0.8692810457516413, "naucs_at_20_std": -0.5634920634920767, "naucs_at_20_diff1": 0.8692810457516413, "naucs_at_100_max": NaN, "naucs_at_100_std": NaN, "naucs_at_100_diff1": NaN, "naucs_at_1000_max": NaN, "naucs_at_1000_std": NaN, "naucs_at_1000_diff1": NaN}}