colqwen2-7b-v0.1 / results.json
manu's picture
Upload results.json
5ac26d9 verified
raw
history blame
16.3 kB
{"./data_dir/eval_vidore/tatdqa_test": {"ndcg_at_1": 0.67193, "ndcg_at_3": 0.77075, "ndcg_at_5": 0.79358, "ndcg_at_10": 0.8076, "ndcg_at_20": 0.81423, "ndcg_at_50": 0.81698, "ndcg_at_100": 0.81863, "map_at_1": 0.67193, "map_at_3": 0.74727, "map_at_5": 0.75996, "map_at_10": 0.76579, "map_at_20": 0.7677, "map_at_50": 0.76813, "map_at_100": 0.76827, "recall_at_1": 0.67193, "recall_at_3": 0.8384, "recall_at_5": 0.89368, "recall_at_10": 0.93682, "recall_at_20": 0.96233, "recall_at_50": 0.97631, "recall_at_100": 0.98663, "precision_at_1": 0.67193, "precision_at_3": 0.27947, "precision_at_5": 0.17874, "precision_at_10": 0.09368, "precision_at_20": 0.04812, "precision_at_50": 0.01953, "precision_at_100": 0.00987, "mrr_at_1": 0.6676792223572297, "mrr_at_3": 0.745240988254354, "mrr_at_5": 0.7566018631024706, "mrr_at_10": 0.7630472622422804, "mrr_at_20": 0.7648916939123942, "mrr_at_50": 0.7653111892014712, "mrr_at_100": 0.7654665531953649, "naucs_at_1_max": 0.20771145663189075, "naucs_at_1_std": -0.18773433911267384, "naucs_at_1_diff1": 0.8170194754624222, "naucs_at_3_max": 0.24607774142531255, "naucs_at_3_std": -0.16584110193613, "naucs_at_3_diff1": 0.7378398220281965, "naucs_at_5_max": 0.2989857582497622, "naucs_at_5_std": -0.08436505768312826, "naucs_at_5_diff1": 0.7055812813302946, "naucs_at_10_max": 0.4087086049178199, "naucs_at_10_std": 0.1542914363622356, "naucs_at_10_diff1": 0.6839773195644397, "naucs_at_20_max": 0.45412221479599435, "naucs_at_20_std": 0.3801693627818807, "naucs_at_20_diff1": 0.6874517110683748, "naucs_at_50_max": 0.42104082268255205, "naucs_at_50_std": 0.46988809251941027, "naucs_at_50_diff1": 0.6654484997896868, "naucs_at_100_max": 0.507330323866924, "naucs_at_100_std": 0.6683042871053126, "naucs_at_100_diff1": 0.661034185188578}, "./data_dir/eval_vidore/shiftproject_test": {"ndcg_at_1": 0.71, "ndcg_at_3": 0.82309, "ndcg_at_5": 0.83514, "ndcg_at_10": 0.84118, "ndcg_at_20": 0.84624, "ndcg_at_50": 0.84824, "ndcg_at_100": 0.84986, "map_at_1": 0.71, "map_at_3": 0.79333, "map_at_5": 0.79983, "map_at_10": 0.80208, "map_at_20": 0.80346, "map_at_50": 0.80379, "map_at_100": 0.80393, "recall_at_1": 0.71, "recall_at_3": 0.91, "recall_at_5": 0.94, "recall_at_10": 0.96, "recall_at_20": 0.98, "recall_at_50": 0.99, "recall_at_100": 1.0, "precision_at_1": 0.71, "precision_at_3": 0.30333, "precision_at_5": 0.188, "precision_at_10": 0.096, "precision_at_20": 0.049, "precision_at_50": 0.0198, "precision_at_100": 0.01, "mrr_at_1": 0.71, "mrr_at_3": 0.795, "mrr_at_5": 0.802, "mrr_at_10": 0.80425, "mrr_at_20": 0.8058733766233765, "mrr_at_50": 0.80620670995671, "mrr_at_100": 0.8063516374929418, "naucs_at_1_max": -0.006300613383243949, "naucs_at_1_std": -0.21616663269277062, "naucs_at_1_diff1": 0.6874339825435943, "naucs_at_3_max": 0.35667600373482716, "naucs_at_3_std": -0.1857557837949981, "naucs_at_3_diff1": 0.830635958086938, "naucs_at_5_max": 0.15561780267662587, "naucs_at_5_std": -0.39091192032368627, "naucs_at_5_diff1": 0.7895269218798655, "naucs_at_10_max": -0.04726890756302253, "naucs_at_10_std": -0.7935340802987776, "naucs_at_10_diff1": 0.8231792717086845, "naucs_at_20_max": -0.5088702147525547, "naucs_at_20_std": -0.43534080298785716, "naucs_at_20_diff1": 0.8692810457516353, "naucs_at_50_max": 0.7222222222222041, "naucs_at_50_std": 0.8692810457516374, "naucs_at_50_diff1": 0.8692810457516374, "naucs_at_100_max": NaN, "naucs_at_100_std": NaN, "naucs_at_100_diff1": NaN}, "./data_dir/eval_vidore/syntheticDocQA_artificial_intelligence_test": {"ndcg_at_1": 0.96, "ndcg_at_3": 0.97893, "ndcg_at_5": 0.98323, "ndcg_at_10": 0.98323, "ndcg_at_20": 0.98323, "ndcg_at_50": 0.98323, "ndcg_at_100": 0.98323, "map_at_1": 0.96, "map_at_3": 0.975, "map_at_5": 0.9775, "map_at_10": 0.9775, "map_at_20": 0.9775, "map_at_50": 0.9775, "map_at_100": 0.9775, "recall_at_1": 0.96, "recall_at_3": 0.99, "recall_at_5": 1.0, "recall_at_10": 1.0, "recall_at_20": 1.0, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.96, "precision_at_3": 0.33, "precision_at_5": 0.2, "precision_at_10": 0.1, "precision_at_20": 0.05, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.96, "mrr_at_3": 0.975, "mrr_at_5": 0.9775, "mrr_at_10": 0.9775, "mrr_at_20": 0.9775, "mrr_at_50": 0.9775, "mrr_at_100": 0.9775, "naucs_at_1_max": 0.6458916900093364, "naucs_at_1_std": -0.053688141923436454, "naucs_at_1_diff1": 1.0, "naucs_at_3_max": 0.8692810457516356, "naucs_at_3_std": -1.1517273576097802, "naucs_at_3_diff1": 1.0, "naucs_at_5_max": 1.0, "naucs_at_5_std": 1.0, "naucs_at_5_diff1": 1.0, "naucs_at_10_max": 1.0, "naucs_at_10_std": 1.0, "naucs_at_10_diff1": 1.0, "naucs_at_20_max": 1.0, "naucs_at_20_std": 1.0, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": NaN, "naucs_at_50_std": NaN, "naucs_at_50_diff1": NaN, "naucs_at_100_max": NaN, "naucs_at_100_std": NaN, "naucs_at_100_diff1": NaN}, "./data_dir/eval_vidore/syntheticDocQA_government_reports_test": {"ndcg_at_1": 0.88, "ndcg_at_3": 0.94047, "ndcg_at_5": 0.94865, "ndcg_at_10": 0.94865, "ndcg_at_20": 0.94865, "ndcg_at_50": 0.94865, "ndcg_at_100": 0.94865, "map_at_1": 0.88, "map_at_3": 0.92667, "map_at_5": 0.93117, "map_at_10": 0.93117, "map_at_20": 0.93117, "map_at_50": 0.93117, "map_at_100": 0.93117, "recall_at_1": 0.88, "recall_at_3": 0.98, "recall_at_5": 1.0, "recall_at_10": 1.0, "recall_at_20": 1.0, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.88, "precision_at_3": 0.32667, "precision_at_5": 0.2, "precision_at_10": 0.1, "precision_at_20": 0.05, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.88, "mrr_at_3": 0.9283333333333332, "mrr_at_5": 0.9328333333333333, "mrr_at_10": 0.9328333333333333, "mrr_at_20": 0.9328333333333333, "mrr_at_50": 0.9328333333333333, "mrr_at_100": 0.9328333333333333, "naucs_at_1_max": 0.31053133948456807, "naucs_at_1_std": 0.3409163219853637, "naucs_at_1_diff1": 0.8739261851734011, "naucs_at_3_max": 0.6136788048552655, "naucs_at_3_std": 0.6136788048552655, "naucs_at_3_diff1": 0.7117180205415458, "naucs_at_5_max": 1.0, "naucs_at_5_std": 1.0, "naucs_at_5_diff1": 1.0, "naucs_at_10_max": 1.0, "naucs_at_10_std": 1.0, "naucs_at_10_diff1": 1.0, "naucs_at_20_max": 1.0, "naucs_at_20_std": 1.0, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": NaN, "naucs_at_50_std": NaN, "naucs_at_50_diff1": NaN, "naucs_at_100_max": NaN, "naucs_at_100_std": NaN, "naucs_at_100_diff1": NaN}, "./data_dir/eval_vidore/arxivqa_test_subsampled": {"ndcg_at_1": 0.824, "ndcg_at_3": 0.87528, "ndcg_at_5": 0.88501, "ndcg_at_10": 0.89231, "ndcg_at_20": 0.89749, "ndcg_at_50": 0.89952, "ndcg_at_100": 0.90052, "map_at_1": 0.824, "map_at_3": 0.862, "map_at_5": 0.8673, "map_at_10": 0.87042, "map_at_20": 0.87191, "map_at_50": 0.87225, "map_at_100": 0.87235, "recall_at_1": 0.824, "recall_at_3": 0.914, "recall_at_5": 0.938, "recall_at_10": 0.96, "recall_at_20": 0.98, "recall_at_50": 0.99, "recall_at_100": 0.996, "precision_at_1": 0.824, "precision_at_3": 0.30467, "precision_at_5": 0.1876, "precision_at_10": 0.096, "precision_at_20": 0.049, "precision_at_50": 0.0198, "precision_at_100": 0.00996, "mrr_at_1": 0.822, "mrr_at_3": 0.8623333333333334, "mrr_at_5": 0.8669333333333333, "mrr_at_10": 0.8700460317460318, "mrr_at_20": 0.8716778804528804, "mrr_at_50": 0.8720248035298035, "mrr_at_100": 0.8721252844768993, "naucs_at_1_max": 0.735077815761065, "naucs_at_1_std": -0.04282115869017602, "naucs_at_1_diff1": 0.9371963835912196, "naucs_at_3_max": 0.7796126202418969, "naucs_at_3_std": -0.025850650337654255, "naucs_at_3_diff1": 0.9369205046359642, "naucs_at_5_max": 0.7821451161109595, "naucs_at_5_std": -0.09443992650824237, "naucs_at_5_diff1": 0.9525616698292219, "naucs_at_10_max": 0.7889355742296903, "naucs_at_10_std": -0.2129785247432343, "naucs_at_10_diff1": 0.9607843137254902, "naucs_at_20_max": 0.7794584500466787, "naucs_at_20_std": -0.02777777777778027, "naucs_at_20_diff1": 0.9477124183006537, "naucs_at_50_max": 0.9215686274509768, "naucs_at_50_std": -0.06750700280111896, "naucs_at_50_diff1": 0.947712418300658, "naucs_at_100_max": 0.9346405228758466, "naucs_at_100_std": -0.3699813258636757, "naucs_at_100_diff1": 1.0}, "./data_dir/eval_vidore/docvqa_test_subsampled": {"ndcg_at_1": 0.5255, "ndcg_at_3": 0.60078, "ndcg_at_5": 0.61862, "ndcg_at_10": 0.63259, "ndcg_at_20": 0.64451, "ndcg_at_50": 0.65881, "ndcg_at_100": 0.66752, "map_at_1": 0.5255, "map_at_3": 0.58167, "map_at_5": 0.59132, "map_at_10": 0.59728, "map_at_20": 0.60064, "map_at_50": 0.60285, "map_at_100": 0.60364, "recall_at_1": 0.5255, "recall_at_3": 0.65632, "recall_at_5": 0.70067, "recall_at_10": 0.74279, "recall_at_20": 0.78936, "recall_at_50": 0.86253, "recall_at_100": 0.91574, "precision_at_1": 0.5255, "precision_at_3": 0.21877, "precision_at_5": 0.14013, "precision_at_10": 0.07428, "precision_at_20": 0.03947, "precision_at_50": 0.01725, "precision_at_100": 0.00916, "mrr_at_1": 0.5277161862527716, "mrr_at_3": 0.5805617147080562, "mrr_at_5": 0.5903178122690318, "mrr_at_10": 0.5972389399218668, "mrr_at_20": 0.6002228297434856, "mrr_at_50": 0.6027282655343267, "mrr_at_100": 0.6033300437903428, "naucs_at_1_max": 0.34919146368331516, "naucs_at_1_std": 0.6755700583274495, "naucs_at_1_diff1": 0.9012163798897747, "naucs_at_3_max": 0.21972764067769676, "naucs_at_3_std": 0.7384263112544703, "naucs_at_3_diff1": 0.8261106084064109, "naucs_at_5_max": 0.13679495064259664, "naucs_at_5_std": 0.7543173419080406, "naucs_at_5_diff1": 0.8038332262621047, "naucs_at_10_max": 0.08213096380071569, "naucs_at_10_std": 0.8025911097016517, "naucs_at_10_diff1": 0.8067908578890264, "naucs_at_20_max": 0.009640010057001363, "naucs_at_20_std": 0.8318658815167514, "naucs_at_20_diff1": 0.7973567600141757, "naucs_at_50_max": -0.05840523108601927, "naucs_at_50_std": 0.8861125417030429, "naucs_at_50_diff1": 0.7971097456566356, "naucs_at_100_max": -0.17013898231075125, "naucs_at_100_std": 0.8872540701354344, "naucs_at_100_diff1": 0.7978782264372887}, "./data_dir/eval_vidore/syntheticDocQA_healthcare_industry_test": {"ndcg_at_1": 0.96, "ndcg_at_3": 0.98524, "ndcg_at_5": 0.98524, "ndcg_at_10": 0.98524, "ndcg_at_20": 0.98524, "ndcg_at_50": 0.98524, "ndcg_at_100": 0.98524, "map_at_1": 0.96, "map_at_3": 0.98, "map_at_5": 0.98, "map_at_10": 0.98, "map_at_20": 0.98, "map_at_50": 0.98, "map_at_100": 0.98, "recall_at_1": 0.96, "recall_at_3": 1.0, "recall_at_5": 1.0, "recall_at_10": 1.0, "recall_at_20": 1.0, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.96, "precision_at_3": 0.33333, "precision_at_5": 0.2, "precision_at_10": 0.1, "precision_at_20": 0.05, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.96, "mrr_at_3": 0.98, "mrr_at_5": 0.98, "mrr_at_10": 0.98, "mrr_at_20": 0.98, "mrr_at_50": 0.98, "mrr_at_100": 0.98, "naucs_at_1_max": 0.47607376283847014, "naucs_at_1_std": 0.29470121381886283, "naucs_at_1_diff1": 1.0, "naucs_at_3_max": 1.0, "naucs_at_3_std": 1.0, "naucs_at_3_diff1": 1.0, "naucs_at_5_max": 1.0, "naucs_at_5_std": 1.0, "naucs_at_5_diff1": 1.0, "naucs_at_10_max": 1.0, "naucs_at_10_std": 1.0, "naucs_at_10_diff1": 1.0, "naucs_at_20_max": 1.0, "naucs_at_20_std": 1.0, "naucs_at_20_diff1": 1.0, "naucs_at_50_max": NaN, "naucs_at_50_std": NaN, "naucs_at_50_diff1": NaN, "naucs_at_100_max": NaN, "naucs_at_100_std": NaN, "naucs_at_100_diff1": NaN}, "./data_dir/eval_vidore/infovqa_test_subsampled": {"ndcg_at_1": 0.88664, "ndcg_at_3": 0.91464, "ndcg_at_5": 0.92466, "ndcg_at_10": 0.92913, "ndcg_at_20": 0.93018, "ndcg_at_50": 0.93097, "ndcg_at_100": 0.9323, "map_at_1": 0.88664, "map_at_3": 0.90756, "map_at_5": 0.91312, "map_at_10": 0.91491, "map_at_20": 0.91521, "map_at_50": 0.91533, "map_at_100": 0.91545, "recall_at_1": 0.88664, "recall_at_3": 0.93522, "recall_at_5": 0.95951, "recall_at_10": 0.97368, "recall_at_20": 0.97773, "recall_at_50": 0.98178, "recall_at_100": 0.98988, "precision_at_1": 0.88664, "precision_at_3": 0.31174, "precision_at_5": 0.1919, "precision_at_10": 0.09737, "precision_at_20": 0.04889, "precision_at_50": 0.01964, "precision_at_100": 0.0099, "mrr_at_1": 0.8825910931174089, "mrr_at_3": 0.9045209176788124, "mrr_at_5": 0.9107962213225371, "mrr_at_10": 0.9126630679262259, "mrr_at_20": 0.912966170396511, "mrr_at_50": 0.9130906841326399, "mrr_at_100": 0.9132104022267463, "naucs_at_1_max": 0.6260502828027972, "naucs_at_1_std": -0.005294178018755926, "naucs_at_1_diff1": 0.9399416231604794, "naucs_at_3_max": 0.7681566860034388, "naucs_at_3_std": 0.09777449128981919, "naucs_at_3_diff1": 0.9365795595509864, "naucs_at_5_max": 0.8274718121903979, "naucs_at_5_std": 0.28017408880961947, "naucs_at_5_diff1": 0.9469328268926711, "naucs_at_10_max": 0.8890624021380364, "naucs_at_10_std": 0.6020867105858281, "naucs_at_10_diff1": 0.9698612029081272, "naucs_at_20_max": 0.8807647892599361, "naucs_at_20_std": 0.5416116992436861, "naucs_at_20_diff1": 0.9643814216187027, "naucs_at_50_max": 0.8687793484360007, "naucs_at_50_std": 0.5014664630218402, "naucs_at_50_diff1": 0.9709774546522744, "naucs_at_100_max": 0.892212470822504, "naucs_at_100_std": 0.6872894779438028, "naucs_at_100_diff1": 1.0}, "./data_dir/eval_vidore/syntheticDocQA_energy_test": {"ndcg_at_1": 0.95, "ndcg_at_3": 0.96762, "ndcg_at_5": 0.96762, "ndcg_at_10": 0.96762, "ndcg_at_20": 0.96762, "ndcg_at_50": 0.97147, "ndcg_at_100": 0.97147, "map_at_1": 0.95, "map_at_3": 0.96333, "map_at_5": 0.96333, "map_at_10": 0.96333, "map_at_20": 0.96333, "map_at_50": 0.9639, "map_at_100": 0.9639, "recall_at_1": 0.95, "recall_at_3": 0.98, "recall_at_5": 0.98, "recall_at_10": 0.98, "recall_at_20": 0.98, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.95, "precision_at_3": 0.32667, "precision_at_5": 0.196, "precision_at_10": 0.098, "precision_at_20": 0.049, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.97, "mrr_at_3": 0.975, "mrr_at_5": 0.975, "mrr_at_10": 0.975, "mrr_at_20": 0.975, "mrr_at_50": 0.9755971479500891, "mrr_at_100": 0.9755971479500891, "naucs_at_1_max": 0.02399626517273991, "naucs_at_1_std": -0.8497665732959815, "naucs_at_1_diff1": 0.9738562091503253, "naucs_at_3_max": 0.9346405228758099, "naucs_at_3_std": 0.19140989729224936, "naucs_at_3_diff1": 0.9346405228758099, "naucs_at_5_max": 0.9346405228758136, "naucs_at_5_std": 0.1914098972922579, "naucs_at_5_diff1": 0.9346405228758136, "naucs_at_10_max": 0.9346405228758136, "naucs_at_10_std": 0.1914098972922579, "naucs_at_10_diff1": 0.9346405228758136, "naucs_at_20_max": 0.9346405228758136, "naucs_at_20_std": 0.1914098972922579, "naucs_at_20_diff1": 0.9346405228758136, "naucs_at_50_max": NaN, "naucs_at_50_std": NaN, "naucs_at_50_diff1": NaN, "naucs_at_100_max": NaN, "naucs_at_100_std": NaN, "naucs_at_100_diff1": NaN}, "./data_dir/eval_vidore/tabfquad_test_subsampled": {"ndcg_at_1": 0.83214, "ndcg_at_3": 0.86764, "ndcg_at_5": 0.88133, "ndcg_at_10": 0.89185, "ndcg_at_20": 0.89926, "ndcg_at_50": 0.90195, "ndcg_at_100": 0.90195, "map_at_1": 0.83214, "map_at_3": 0.85893, "map_at_5": 0.86679, "map_at_10": 0.8712, "map_at_20": 0.87333, "map_at_50": 0.8737, "map_at_100": 0.8737, "recall_at_1": 0.83214, "recall_at_3": 0.89286, "recall_at_5": 0.925, "recall_at_10": 0.95714, "recall_at_20": 0.98571, "recall_at_50": 1.0, "recall_at_100": 1.0, "precision_at_1": 0.83214, "precision_at_3": 0.29762, "precision_at_5": 0.185, "precision_at_10": 0.09571, "precision_at_20": 0.04929, "precision_at_50": 0.02, "precision_at_100": 0.01, "mrr_at_1": 0.8321428571428572, "mrr_at_3": 0.8565476190476191, "mrr_at_5": 0.8663690476190476, "mrr_at_10": 0.8704435941043084, "mrr_at_20": 0.8729122974947554, "mrr_at_50": 0.8732756347375155, "mrr_at_100": 0.8732756347375155, "naucs_at_1_max": 0.4951548964909703, "naucs_at_1_std": 0.2199278478092164, "naucs_at_1_diff1": 0.8757052666904376, "naucs_at_3_max": 0.5832810047095762, "naucs_at_3_std": 0.4004395604395596, "naucs_at_3_diff1": 0.8785871271585566, "naucs_at_5_max": 0.605375483526744, "naucs_at_5_std": 0.4247921390778528, "naucs_at_5_diff1": 0.8749722111066649, "naucs_at_10_max": 0.5688608776844056, "naucs_at_10_std": 0.2660675381263621, "naucs_at_10_diff1": 0.922385620915035, "naucs_at_20_max": 0.865196078431377, "naucs_at_20_std": 0.7496498599439745, "naucs_at_20_diff1": 0.8978758169934754, "naucs_at_50_max": 1.0, "naucs_at_50_std": 1.0, "naucs_at_50_diff1": 1.0, "naucs_at_100_max": 1.0, "naucs_at_100_std": 1.0, "naucs_at_100_diff1": 1.0}}