{"arxivqa_test_subsampled": {"ndcg_at_1": 0.83, "ndcg_at_3": 0.86645, "ndcg_at_5": 0.87575, "ndcg_at_10": 0.88357, "ndcg_at_20": 0.89031, "ndcg_at_50": 0.89361, "ndcg_at_100": 0.89491, "map_at_1": 0.83, "map_at_3": 0.857, "map_at_5": 0.8623, "map_at_10": 0.86557, "map_at_20": 0.86751, "map_at_50": 0.86809, "map_at_100": 0.86821, "recall_at_1": 0.83, "recall_at_3": 0.894, "recall_at_5": 0.916, "recall_at_10": 0.94, "recall_at_20": 0.966, "recall_at_50": 0.982, "recall_at_100": 0.99, "precision_at_1": 0.83, "precision_at_3": 0.298, "precision_at_5": 0.1832, "precision_at_10": 0.094, "precision_at_20": 0.0483, "precision_at_50": 0.01964, "precision_at_100": 0.0099, "mrr_at_1": 0.83, "mrr_at_3": 0.8569999999999998, "mrr_at_5": 0.8622999999999997, "mrr_at_10": 0.8655468253968253, "mrr_at_20": 0.86748706375324, "mrr_at_50": 0.8680725159027165, "mrr_at_100": 0.8681857764435326, "naucs_at_1_max": 0.858646311023393, "naucs_at_1_std": -0.4664247982817673, "naucs_at_1_diff1": 0.9168804783189187, "naucs_at_3_max": 0.8260919723834373, "naucs_at_3_std": -0.4909749214631783, "naucs_at_3_diff1": 0.8531405853433434, "naucs_at_5_max": 0.8605108710150751, "naucs_at_5_std": -0.5535658707927644, "naucs_at_5_diff1": 0.8712818460717628, "naucs_at_10_max": 0.8889666977902271, "naucs_at_10_std": -0.31691565515095205, "naucs_at_10_diff1": 0.8706037970743868, "naucs_at_20_max": 0.8959191519745157, "naucs_at_20_std": -0.38292964244521194, "naucs_at_20_diff1": 0.8699675948810928, "naucs_at_50_max": 0.9110384894698567, "naucs_at_50_std": -0.5361552028218665, "naucs_at_50_diff1": 0.8615001556178092, "naucs_at_100_max": 0.8921568627450854, "naucs_at_100_std": -0.12110177404293686, "naucs_at_100_diff1": 0.8585434173669326}, "docvqa_test_subsampled": {"ndcg_at_1": 0.48337, "ndcg_at_3": 0.54361, "ndcg_at_5": 0.56631, "ndcg_at_10": 0.5856, "ndcg_at_20": 0.6002, "ndcg_at_50": 0.61575, "ndcg_at_100": 0.62417, "map_at_1": 0.48337, "map_at_3": 0.52846, "map_at_5": 0.54098, "map_at_10": 0.5489, "map_at_20": 0.55291, "map_at_50": 0.55547, "map_at_100": 0.55625, "recall_at_1": 0.48337, "recall_at_3": 0.58758, "recall_at_5": 0.64302, "recall_at_10": 0.70288, "recall_at_20": 0.76053, "recall_at_50": 0.83814, "recall_at_100": 0.88914, "precision_at_1": 0.48337, "precision_at_3": 0.19586, "precision_at_5": 0.1286, "precision_at_10": 0.07029, "precision_at_20": 0.03803, "precision_at_50": 0.01676, "precision_at_100": 0.00889, "mrr_at_1": 0.48337028824833705, "mrr_at_3": 0.5291943828529196, "mrr_at_5": 0.5411677753141169, "mrr_at_10": 0.5491280399816985, "mrr_at_20": 0.5531358543364028, "mrr_at_50": 0.5556861079139531, "mrr_at_100": 0.5564702079607413, "naucs_at_1_max": 0.6938261034813209, "naucs_at_1_std": -0.44374096550677106, "naucs_at_1_diff1": 0.8515620837021114, "naucs_at_3_max": 0.6668377646579767, "naucs_at_3_std": -0.4652816060602179, "naucs_at_3_diff1": 0.7505735469305647, "naucs_at_5_max": 0.724457489986816, "naucs_at_5_std": -0.3958839295973761, "naucs_at_5_diff1": 0.7229459462048281, "naucs_at_10_max": 0.676802465865959, "naucs_at_10_std": -0.46150705683769994, "naucs_at_10_diff1": 0.6592299253063731, "naucs_at_20_max": 0.6600327112639377, "naucs_at_20_std": -0.4913360754229586, "naucs_at_20_diff1": 0.6173724312440265, "naucs_at_50_max": 0.7107726516332598, "naucs_at_50_std": -0.30342460889725203, "naucs_at_50_diff1": 0.5878153412566914, "naucs_at_100_max": 0.7701174556499546, "naucs_at_100_std": -0.20534787776527266, "naucs_at_100_diff1": 0.6057647818477818}, "infovqa_test_subsampled": {"ndcg_at_1": 0.88462, "ndcg_at_3": 0.91491, "ndcg_at_5": 0.92388, "ndcg_at_10": 0.92663, "ndcg_at_20": 0.92863, "ndcg_at_50": 0.93028, "ndcg_at_100": 0.93091, "map_at_1": 0.88462, "map_at_3": 0.90722, "map_at_5": 0.91208, "map_at_10": 0.9133, "map_at_20": 0.91382, "map_at_50": 0.91409, "map_at_100": 0.91414, "recall_at_1": 0.88462, "recall_at_3": 0.93725, "recall_at_5": 0.95951, "recall_at_10": 0.96761, "recall_at_20": 0.97571, "recall_at_50": 0.98381, "recall_at_100": 0.98785, "precision_at_1": 0.88462, "precision_at_3": 0.31242, "precision_at_5": 0.1919, "precision_at_10": 0.09676, "precision_at_20": 0.04879, "precision_at_50": 0.01968, "precision_at_100": 0.00988, "mrr_at_1": 0.8846153846153846, "mrr_at_3": 0.9072199730094463, "mrr_at_5": 0.9120782726045881, "mrr_at_10": 0.9132952573742044, "mrr_at_20": 0.9138156422643798, "mrr_at_50": 0.9140889280185405, "mrr_at_100": 0.9141383515097923, "naucs_at_1_max": 0.7812468890694119, "naucs_at_1_std": -0.08799174841521007, "naucs_at_1_diff1": 0.9456266707519869, "naucs_at_3_max": 0.8372432713037467, "naucs_at_3_std": 0.03838532830090231, "naucs_at_3_diff1": 0.9282000807550249, "naucs_at_5_max": 0.9295244758349281, "naucs_at_5_std": 0.1803114561450837, "naucs_at_5_diff1": 0.9665230450023843, "naucs_at_10_max": 0.9292640159035281, "naucs_at_10_std": 0.10340232903541587, "naucs_at_10_diff1": 0.9581538062529754, "naucs_at_20_max": 0.9659719840147728, "naucs_at_20_std": 0.2981831051495906, "naucs_at_20_diff1": 0.94420507500398, "naucs_at_50_max": 0.9836748182418981, "naucs_at_50_std": 0.36839391253502923, "naucs_at_50_diff1": 0.9326327942640528, "naucs_at_100_max": 0.9782330909892136, "naucs_at_100_std": 0.3783664086797387, "naucs_at_100_diff1": 0.9101770590187516}, "shiftproject_test": {"ndcg_at_1": 0.95, "ndcg_at_3": 0.97262, "ndcg_at_5": 0.97262, "ndcg_at_10": 0.97262, "ndcg_at_20": 0.97518, "ndcg_at_50": 0.97518, "ndcg_at_100": 0.97518, "map_at_1": 0.95, "map_at_3": 0.96667, "map_at_5": 0.96667, "map_at_10": 0.96667, "map_at_20": 0.96738, "map_at_50": 0.96738, "map_at_100": 0.96738, "recall_at_1": 0.95, "recall_at_3": 0.99, "recall_at_5": 0.99, "recall_at_10": 0.99, "recall_at_20": 1.0, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.95, "precision_at_3": 0.33, "precision_at_5": 0.198, "precision_at_10": 0.099, "precision_at_20": 0.05, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.95, "mrr_at_3": 0.9666666666666667, "mrr_at_5": 0.9666666666666667, "mrr_at_10": 0.9666666666666667, "mrr_at_20": 0.9673809523809525, "mrr_at_50": 0.9673809523809525, "mrr_at_100": 0.9673809523809525, "naucs_at_1_max": 0.5981325863678774, "naucs_at_1_std": -0.3083099906629302, "naucs_at_1_diff1": 0.8921568627450971, "naucs_at_3_max": 1.0, "naucs_at_3_std": 0.35807656395889226, "naucs_at_3_diff1": 0.7222222222222157, "naucs_at_5_max": 1.0, "naucs_at_5_std": 0.35807656395891135, "naucs_at_5_diff1": 0.7222222222222276, "naucs_at_10_max": 1.0, "naucs_at_10_std": 0.35807656395891135, "naucs_at_10_diff1": 0.7222222222222276, "naucs_at_20_max": 1.0, "naucs_at_20_std": 1.0, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": null, "naucs_at_50_std": null, "naucs_at_50_diff1": null, "naucs_at_100_max": null, "naucs_at_100_std": null, "naucs_at_100_diff1": null}, "syntheticDocQA_artificial_intelligence_test": {"ndcg_at_1": 0.99, "ndcg_at_3": 0.99631, "ndcg_at_5": 0.99631, "ndcg_at_10": 0.99631, "ndcg_at_20": 0.99631, "ndcg_at_50": 0.99631, "ndcg_at_100": 0.99631, "map_at_1": 0.99, "map_at_3": 0.995, "map_at_5": 0.995, "map_at_10": 0.995, "map_at_20": 0.995, "map_at_50": 0.995, "map_at_100": 0.995, "recall_at_1": 0.99, "recall_at_3": 1.0, "recall_at_5": 1.0, "recall_at_10": 1.0, "recall_at_20": 1.0, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.99, "precision_at_3": 0.33333, "precision_at_5": 0.2, "precision_at_10": 0.1, "precision_at_20": 0.05, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.99, "mrr_at_3": 0.995, "mrr_at_5": 0.995, "mrr_at_10": 0.995, "mrr_at_20": 0.995, "mrr_at_50": 0.995, "mrr_at_100": 0.995, "naucs_at_1_max": 1.0, "naucs_at_1_std": 0.8692810457516276, "naucs_at_1_diff1": 1.0, "naucs_at_3_max": 1.0, "naucs_at_3_std": 1.0, "naucs_at_3_diff1": 1.0, "naucs_at_5_max": 1.0, "naucs_at_5_std": 1.0, "naucs_at_5_diff1": 1.0, "naucs_at_10_max": 1.0, "naucs_at_10_std": 1.0, "naucs_at_10_diff1": 1.0, "naucs_at_20_max": 1.0, "naucs_at_20_std": 1.0, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": null, "naucs_at_50_std": null, "naucs_at_50_diff1": null, "naucs_at_100_max": null, "naucs_at_100_std": null, "naucs_at_100_diff1": null}, "syntheticDocQA_energy_test": {"ndcg_at_1": 0.94, "ndcg_at_3": 0.95893, "ndcg_at_5": 0.95893, "ndcg_at_10": 0.96831, "ndcg_at_20": 0.96831, "ndcg_at_50": 0.96831, "ndcg_at_100": 0.96831, "map_at_1": 0.94, "map_at_3": 0.955, "map_at_5": 0.955, "map_at_10": 0.95868, "map_at_20": 0.95868, "map_at_50": 0.95868, "map_at_100": 0.95868, "recall_at_1": 0.94, "recall_at_3": 0.97, "recall_at_5": 0.97, "recall_at_10": 1.0, "recall_at_20": 1.0, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.94, "precision_at_3": 0.32333, "precision_at_5": 0.194, "precision_at_10": 0.1, "precision_at_20": 0.05, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.94, "mrr_at_3": 0.955, "mrr_at_5": 0.955, "mrr_at_10": 0.9586785714285714, "mrr_at_20": 0.9586785714285714, "mrr_at_50": 0.9586785714285714, "mrr_at_100": 0.9586785714285714, "naucs_at_1_max": 0.7394179894179895, "naucs_at_1_std": -0.7495331465919671, "naucs_at_1_diff1": 0.9346405228758177, "naucs_at_3_max": 1.0, "naucs_at_3_std": -1.1517273576097098, "naucs_at_3_diff1": 0.9564270152505466, "naucs_at_5_max": 1.0, "naucs_at_5_std": -1.1517273576097071, "naucs_at_5_diff1": 0.9564270152505424, "naucs_at_10_max": 1.0, "naucs_at_10_std": 1.0, "naucs_at_10_diff1": 1.0, "naucs_at_20_max": 1.0, "naucs_at_20_std": 1.0, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": null, "naucs_at_50_std": null, "naucs_at_50_diff1": null, "naucs_at_100_max": null, "naucs_at_100_std": null, "naucs_at_100_diff1": null}, "syntheticDocQA_government_reports_test": {"ndcg_at_1": 0.99, "ndcg_at_3": 0.995, "ndcg_at_5": 0.995, "ndcg_at_10": 0.995, "ndcg_at_20": 0.995, "ndcg_at_50": 0.995, "ndcg_at_100": 0.995, "map_at_1": 0.99, "map_at_3": 0.99333, "map_at_5": 0.99333, "map_at_10": 0.99333, "map_at_20": 0.99333, "map_at_50": 0.99333, "map_at_100": 0.99333, "recall_at_1": 0.99, "recall_at_3": 1.0, "recall_at_5": 1.0, "recall_at_10": 1.0, "recall_at_20": 1.0, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.99, "precision_at_3": 0.33333, "precision_at_5": 0.2, "precision_at_10": 0.1, "precision_at_20": 0.05, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.99, "mrr_at_3": 0.9933333333333334, "mrr_at_5": 0.9933333333333334, "mrr_at_10": 0.9933333333333334, "mrr_at_20": 0.9933333333333334, "mrr_at_50": 0.9933333333333334, "mrr_at_100": 0.9933333333333334, "naucs_at_1_max": 0.7222222222222201, "naucs_at_1_std": -1.739962651727339, "naucs_at_1_diff1": 1.0, "naucs_at_3_max": 1.0, "naucs_at_3_std": 1.0, "naucs_at_3_diff1": 1.0, "naucs_at_5_max": 1.0, "naucs_at_5_std": 1.0, "naucs_at_5_diff1": 1.0, "naucs_at_10_max": 1.0, "naucs_at_10_std": 1.0, "naucs_at_10_diff1": 1.0, "naucs_at_20_max": 1.0, "naucs_at_20_std": 1.0, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": null, "naucs_at_50_std": null, "naucs_at_50_diff1": null, "naucs_at_100_max": null, "naucs_at_100_std": null, "naucs_at_100_diff1": null}, "syntheticDocQA_healthcare_industry_test": {"ndcg_at_1": 0.99, "ndcg_at_3": 0.99631, "ndcg_at_5": 0.99631, "ndcg_at_10": 0.99631, "ndcg_at_20": 0.99631, "ndcg_at_50": 0.99631, "ndcg_at_100": 0.99631, "map_at_1": 0.99, "map_at_3": 0.995, "map_at_5": 0.995, "map_at_10": 0.995, "map_at_20": 0.995, "map_at_50": 0.995, "map_at_100": 0.995, "recall_at_1": 0.99, "recall_at_3": 1.0, "recall_at_5": 1.0, "recall_at_10": 1.0, "recall_at_20": 1.0, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.99, "precision_at_3": 0.33333, "precision_at_5": 0.2, "precision_at_10": 0.1, "precision_at_20": 0.05, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.99, "mrr_at_3": 0.995, "mrr_at_5": 0.995, "mrr_at_10": 0.995, "mrr_at_20": 0.995, "mrr_at_50": 0.995, "mrr_at_100": 0.995, "naucs_at_1_max": 1.0, "naucs_at_1_std": 0.7222222222222201, "naucs_at_1_diff1": 1.0, "naucs_at_3_max": 1.0, "naucs_at_3_std": 1.0, "naucs_at_3_diff1": 1.0, "naucs_at_5_max": 1.0, "naucs_at_5_std": 1.0, "naucs_at_5_diff1": 1.0, "naucs_at_10_max": 1.0, "naucs_at_10_std": 1.0, "naucs_at_10_diff1": 1.0, "naucs_at_20_max": 1.0, "naucs_at_20_std": 1.0, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": null, "naucs_at_50_std": null, "naucs_at_50_diff1": null, "naucs_at_100_max": null, "naucs_at_100_std": null, "naucs_at_100_diff1": null}, "tabfquad_test_subsampled": {"ndcg_at_1": 0.9, "ndcg_at_3": 0.9355, "ndcg_at_5": 0.9458, "ndcg_at_10": 0.94692, "ndcg_at_20": 0.94874, "ndcg_at_50": 0.94943, "ndcg_at_100": 0.94943, "map_at_1": 0.9, "map_at_3": 0.92679, "map_at_5": 0.9325, "map_at_10": 0.93295, "map_at_20": 0.93344, "map_at_50": 0.93355, "map_at_100": 0.93355, "recall_at_1": 0.9, "recall_at_3": 0.96071, "recall_at_5": 0.98571, "recall_at_10": 0.98929, "recall_at_20": 0.99643, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.9, "precision_at_3": 0.32024, "precision_at_5": 0.19714, "precision_at_10": 0.09893, "precision_at_20": 0.04982, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.9, "mrr_at_3": 0.9267857142857143, "mrr_at_5": 0.9317857142857144, "mrr_at_10": 0.9328273809523809, "mrr_at_20": 0.9333253205128206, "mrr_at_50": 0.9334303625296272, "mrr_at_100": 0.9334303625296272, "naucs_at_1_max": 0.7993697478991594, "naucs_at_1_std": 0.48374349739895933, "naucs_at_1_diff1": 0.9092136854741905, "naucs_at_3_max": 0.9881164587046973, "naucs_at_3_std": 0.7182327476445171, "naucs_at_3_diff1": 0.9524658348187793, "naucs_at_5_max": 1.0, "naucs_at_5_std": 0.865196078431377, "naucs_at_5_diff1": 0.9346405228758147, "naucs_at_10_max": 1.0, "naucs_at_10_std": 0.9128540305011011, "naucs_at_10_diff1": 0.9128540305011011, "naucs_at_20_max": 1.0, "naucs_at_20_std": 0.8692810457516478, "naucs_at_20_diff1": 0.8692810457516478, "naucs_at_50_max": 1.0, "naucs_at_50_std": 1.0, "naucs_at_50_diff1": 1.0, "naucs_at_100_max": 1.0, "naucs_at_100_std": 1.0, "naucs_at_100_diff1": 1.0}, "tatdqa_test": {"ndcg_at_1": 0.63913, "ndcg_at_3": 0.73348, "ndcg_at_5": 0.76119, "ndcg_at_10": 0.77795, "ndcg_at_20": 0.78597, "ndcg_at_50": 0.7922, "ndcg_at_100": 0.79398, "map_at_1": 0.63913, "map_at_3": 0.71061, "map_at_5": 0.72595, "map_at_10": 0.73302, "map_at_20": 0.73532, "map_at_50": 0.73641, "map_at_100": 0.73656, "recall_at_1": 0.63913, "recall_at_3": 0.79951, "recall_at_5": 0.86695, "recall_at_10": 0.91798, "recall_at_20": 0.94897, "recall_at_50": 0.97934, "recall_at_100": 0.99028, "precision_at_1": 0.63913, "precision_at_3": 0.2665, "precision_at_5": 0.17339, "precision_at_10": 0.0918, "precision_at_20": 0.04745, "precision_at_50": 0.01959, "precision_at_100": 0.0099, "mrr_at_1": 0.6391251518833536, "mrr_at_3": 0.7106115836371002, "mrr_at_5": 0.7256480356419612, "mrr_at_10": 0.7328699685625567, "mrr_at_20": 0.7350934149912067, "mrr_at_50": 0.7362113667635196, "mrr_at_100": 0.7363668461888006, "naucs_at_1_max": 0.5938210540556276, "naucs_at_1_std": -0.16049718029718266, "naucs_at_1_diff1": 0.7609838065385791, "naucs_at_3_max": 0.6431538299660706, "naucs_at_3_std": -0.08130035312037115, "naucs_at_3_diff1": 0.6646930087024925, "naucs_at_5_max": 0.6677283839470244, "naucs_at_5_std": -0.04183840532339394, "naucs_at_5_diff1": 0.6386845987046517, "naucs_at_10_max": 0.7170537401608961, "naucs_at_10_std": 0.029973785816548366, "naucs_at_10_diff1": 0.6180179387252528, "naucs_at_20_max": 0.7286213852092154, "naucs_at_20_std": 0.267131652053233, "naucs_at_20_diff1": 0.5728179001757068, "naucs_at_50_max": 0.8183455244679178, "naucs_at_50_std": 0.6268074134337968, "naucs_at_50_diff1": 0.540539174474304, "naucs_at_100_max": 0.9384258483213721, "naucs_at_100_std": 0.9047196439054298, "naucs_at_100_diff1": 0.6317586644999579}}