colqwen2-2b-v1.0 / results.json
tattrongvu's picture
Upload 57 files
7e6afe8 verified
{
"vidore/arxivqa_test_subsampled": {
"ndcg_at_1": 0.85,
"ndcg_at_3": 0.89228,
"ndcg_at_5": 0.89969,
"ndcg_at_10": 0.90675,
"ndcg_at_20": 0.91237,
"ndcg_at_50": 0.91522,
"ndcg_at_100": 0.91554,
"map_at_1": 0.85,
"map_at_3": 0.882,
"map_at_5": 0.8861,
"map_at_10": 0.88898,
"map_at_20": 0.89055,
"map_at_50": 0.89104,
"map_at_100": 0.89107,
"recall_at_1": 0.85,
"recall_at_3": 0.922,
"recall_at_5": 0.94,
"recall_at_10": 0.962,
"recall_at_20": 0.984,
"recall_at_50": 0.998,
"recall_at_100": 1.0,
"precision_at_1": 0.85,
"precision_at_3": 0.30733,
"precision_at_5": 0.188,
"precision_at_10": 0.0962,
"precision_at_20": 0.0492,
"precision_at_50": 0.01996,
"precision_at_100": 0.01,
"mrr_at_1": 0.846,
"mrr_at_3": 0.8793333333333334,
"mrr_at_5": 0.8830333333333333,
"mrr_at_10": 0.8864992063492062,
"mrr_at_20": 0.8880353542656172,
"mrr_at_50": 0.8885337581333198,
"mrr_at_100": 0.8885597321592938,
"naucs_at_1_max": 0.807211194272698,
"naucs_at_1_std": -0.05267165636186127,
"naucs_at_1_diff1": 0.9369345916042959,
"naucs_at_3_max": 0.8579209461562436,
"naucs_at_3_std": 0.05307764131293816,
"naucs_at_3_diff1": 0.9121956474897643,
"naucs_at_5_max": 0.8668689698101463,
"naucs_at_5_std": 0.1076719576719556,
"naucs_at_5_diff1": 0.9274042950513546,
"naucs_at_10_max": 0.9051550444739312,
"naucs_at_10_std": 0.11334709322325026,
"naucs_at_10_diff1": 0.9363605091159263,
"naucs_at_20_max": 0.9115896358543447,
"naucs_at_20_std": 0.0822829131652637,
"naucs_at_20_diff1": 0.9325980392156931,
"naucs_at_50_max": 0.86928104575168,
"naucs_at_50_std": -1.151727357609834,
"naucs_at_50_diff1": 1.0,
"naucs_at_100_max": 1.0,
"naucs_at_100_std": 1.0,
"naucs_at_100_diff1": 1.0
},
"vidore/docvqa_test_subsampled": {
"ndcg_at_1": 0.5255,
"ndcg_at_3": 0.58323,
"ndcg_at_5": 0.60928,
"ndcg_at_10": 0.6312,
"ndcg_at_20": 0.64271,
"ndcg_at_50": 0.65172,
"ndcg_at_100": 0.66009,
"map_at_1": 0.5255,
"map_at_3": 0.56874,
"map_at_5": 0.58348,
"map_at_10": 0.59235,
"map_at_20": 0.59566,
"map_at_50": 0.597,
"map_at_100": 0.59776,
"recall_at_1": 0.5255,
"recall_at_3": 0.62528,
"recall_at_5": 0.68736,
"recall_at_10": 0.7561,
"recall_at_20": 0.80044,
"recall_at_50": 0.84701,
"recall_at_100": 0.898,
"precision_at_1": 0.5255,
"precision_at_3": 0.20843,
"precision_at_5": 0.13747,
"precision_at_10": 0.07561,
"precision_at_20": 0.04002,
"precision_at_50": 0.01694,
"precision_at_100": 0.00898,
"mrr_at_1": 0.5210643015521065,
"mrr_at_3": 0.567257945306726,
"mrr_at_5": 0.5807834441980785,
"mrr_at_10": 0.5902518213493823,
"mrr_at_20": 0.5930426782324527,
"mrr_at_50": 0.5946364866259196,
"mrr_at_100": 0.5951585532787789,
"naucs_at_1_max": 0.17116973406228145,
"naucs_at_1_std": 0.19544078728073017,
"naucs_at_1_diff1": 0.8677435977596096,
"naucs_at_3_max": 0.058557313285818244,
"naucs_at_3_std": 0.2717799040343582,
"naucs_at_3_diff1": 0.8164636793441545,
"naucs_at_5_max": -0.05874522172882286,
"naucs_at_5_std": 0.3665163783010554,
"naucs_at_5_diff1": 0.7947909776107586,
"naucs_at_10_max": -0.25417632083805924,
"naucs_at_10_std": 0.4815135951184752,
"naucs_at_10_diff1": 0.7793392745175759,
"naucs_at_20_max": -0.4248479263934413,
"naucs_at_20_std": 0.5025457196714144,
"naucs_at_20_diff1": 0.8088576009445793,
"naucs_at_50_max": -0.6253326294965954,
"naucs_at_50_std": 0.7313108018974633,
"naucs_at_50_diff1": 0.8583751909406857,
"naucs_at_100_max": -0.8449611456968541,
"naucs_at_100_std": 0.9545749692417804,
"naucs_at_100_diff1": 0.8604715807203863
},
"vidore/infovqa_test_subsampled": {
"ndcg_at_1": 0.87247,
"ndcg_at_3": 0.91404,
"ndcg_at_5": 0.91918,
"ndcg_at_10": 0.92524,
"ndcg_at_20": 0.92769,
"ndcg_at_50": 0.92926,
"ndcg_at_100": 0.92926,
"map_at_1": 0.87247,
"map_at_3": 0.90452,
"map_at_5": 0.90746,
"map_at_10": 0.91005,
"map_at_20": 0.91067,
"map_at_50": 0.9109,
"map_at_100": 0.9109,
"recall_at_1": 0.87247,
"recall_at_3": 0.9413,
"recall_at_5": 0.95344,
"recall_at_10": 0.97166,
"recall_at_20": 0.98178,
"recall_at_50": 0.98988,
"recall_at_100": 0.98988,
"precision_at_1": 0.87247,
"precision_at_3": 0.31377,
"precision_at_5": 0.19069,
"precision_at_10": 0.09717,
"precision_at_20": 0.04909,
"precision_at_50": 0.0198,
"precision_at_100": 0.0099,
"mrr_at_1": 0.8704453441295547,
"mrr_at_3": 0.9035087719298244,
"mrr_at_5": 0.9063427800269903,
"mrr_at_10": 0.9085799434483645,
"mrr_at_20": 0.9091654351207062,
"mrr_at_50": 0.9094025116628965,
"mrr_at_100": 0.9094025116628965,
"naucs_at_1_max": 0.5862949877081309,
"naucs_at_1_std": -0.09978842769982305,
"naucs_at_1_diff1": 0.9422575413582027,
"naucs_at_3_max": 0.6682958971071765,
"naucs_at_3_std": -0.17493815995842807,
"naucs_at_3_diff1": 0.9255153259160952,
"naucs_at_5_max": 0.7631677959063347,
"naucs_at_5_std": 0.10157587361064939,
"naucs_at_5_diff1": 0.9117628654622407,
"naucs_at_10_max": 0.8838078085686626,
"naucs_at_10_std": 0.5343512930451619,
"naucs_at_10_diff1": 0.9148610774134698,
"naucs_at_20_max": 0.9546293120196974,
"naucs_at_20_std": 0.7223350051556908,
"naucs_at_20_diff1": 0.9564661819784059,
"naucs_at_50_max": 0.9183327616354471,
"naucs_at_50_std": 0.6841596004695476,
"naucs_at_50_diff1": 0.9477594183740937,
"naucs_at_100_max": 0.9183327616354471,
"naucs_at_100_std": 0.6841596004695476,
"naucs_at_100_diff1": 0.9477594183740937
},
"vidore/tabfquad_test_subsampled": {
"ndcg_at_1": 0.9,
"ndcg_at_3": 0.94188,
"ndcg_at_5": 0.94342,
"ndcg_at_10": 0.95164,
"ndcg_at_20": 0.95164,
"ndcg_at_50": 0.95237,
"ndcg_at_100": 0.95237,
"map_at_1": 0.9,
"map_at_3": 0.93274,
"map_at_5": 0.93363,
"map_at_10": 0.93711,
"map_at_20": 0.93711,
"map_at_50": 0.93723,
"map_at_100": 0.93723,
"recall_at_1": 0.9,
"recall_at_3": 0.96786,
"recall_at_5": 0.97143,
"recall_at_10": 0.99643,
"recall_at_20": 0.99643,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.9,
"precision_at_3": 0.32262,
"precision_at_5": 0.19429,
"precision_at_10": 0.09964,
"precision_at_20": 0.04982,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.8964285714285715,
"mrr_at_3": 0.930952380952381,
"mrr_at_5": 0.9318452380952381,
"mrr_at_10": 0.9354053287981859,
"mrr_at_20": 0.9354053287981859,
"mrr_at_50": 0.9355284815075456,
"mrr_at_100": 0.9355284815075456,
"naucs_at_1_max": 0.6023242630385479,
"naucs_at_1_std": 0.1999466453247955,
"naucs_at_1_diff1": 0.9321395224756563,
"naucs_at_3_max": 0.9709513435003594,
"naucs_at_3_std": 0.7533457827575493,
"naucs_at_3_diff1": 0.9400871459694935,
"naucs_at_5_max": 0.9673202614379075,
"naucs_at_5_std": 0.7572362278244656,
"naucs_at_5_diff1": 0.932598039215689,
"naucs_at_10_max": 1.0,
"naucs_at_10_std": 1.0,
"naucs_at_10_diff1": 0.72222222222224,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": 1.0,
"naucs_at_20_diff1": 0.72222222222224,
"naucs_at_50_max": 1.0,
"naucs_at_50_std": 1.0,
"naucs_at_50_diff1": 1.0,
"naucs_at_100_max": 1.0,
"naucs_at_100_std": 1.0,
"naucs_at_100_diff1": 1.0
},
"vidore/tatdqa_test": {
"ndcg_at_1": 0.67922,
"ndcg_at_3": 0.77126,
"ndcg_at_5": 0.79547,
"ndcg_at_10": 0.81213,
"ndcg_at_20": 0.81714,
"ndcg_at_50": 0.8201,
"ndcg_at_100": 0.82157,
"map_at_1": 0.67922,
"map_at_3": 0.74868,
"map_at_5": 0.76223,
"map_at_10": 0.7692,
"map_at_20": 0.77062,
"map_at_50": 0.77108,
"map_at_100": 0.7712,
"recall_at_1": 0.67922,
"recall_at_3": 0.83657,
"recall_at_5": 0.8949,
"recall_at_10": 0.94593,
"recall_at_20": 0.96537,
"recall_at_50": 0.98056,
"recall_at_100": 0.98967,
"precision_at_1": 0.67922,
"precision_at_3": 0.27886,
"precision_at_5": 0.17898,
"precision_at_10": 0.09459,
"precision_at_20": 0.04827,
"precision_at_50": 0.01961,
"precision_at_100": 0.0099,
"mrr_at_1": 0.6773997569866342,
"mrr_at_3": 0.7477723774807619,
"mrr_at_5": 0.7615633859862302,
"mrr_at_10": 0.7684981870431451,
"mrr_at_20": 0.7700138577184539,
"mrr_at_50": 0.7704845824005803,
"mrr_at_100": 0.7706159963424961,
"naucs_at_1_max": 0.1774117896564107,
"naucs_at_1_std": -0.24832936266113984,
"naucs_at_1_diff1": 0.7996783800774746,
"naucs_at_3_max": 0.26913363145255553,
"naucs_at_3_std": -0.17474231347643812,
"naucs_at_3_diff1": 0.7326803741116257,
"naucs_at_5_max": 0.36576896450364044,
"naucs_at_5_std": -0.032454808755900705,
"naucs_at_5_diff1": 0.7033807158189981,
"naucs_at_10_max": 0.3646700445883288,
"naucs_at_10_std": 0.19880405123210632,
"naucs_at_10_diff1": 0.7042603308547618,
"naucs_at_20_max": 0.4634752837344628,
"naucs_at_20_std": 0.4658794215520421,
"naucs_at_20_diff1": 0.6598124404673089,
"naucs_at_50_max": 0.6289968950467605,
"naucs_at_50_std": 0.6642506493403703,
"naucs_at_50_diff1": 0.7500502336238475,
"naucs_at_100_max": 0.5973270147647666,
"naucs_at_100_std": 0.6380160564965871,
"naucs_at_100_diff1": 0.7184268296201503
},
"vidore/shiftproject_test": {
"ndcg_at_1": 0.8,
"ndcg_at_3": 0.87809,
"ndcg_at_5": 0.89875,
"ndcg_at_10": 0.90231,
"ndcg_at_20": 0.90231,
"ndcg_at_50": 0.90231,
"ndcg_at_100": 0.90392,
"map_at_1": 0.8,
"map_at_3": 0.86,
"map_at_5": 0.8715,
"map_at_10": 0.87317,
"map_at_20": 0.87317,
"map_at_50": 0.87317,
"map_at_100": 0.8733,
"recall_at_1": 0.8,
"recall_at_3": 0.93,
"recall_at_5": 0.98,
"recall_at_10": 0.99,
"recall_at_20": 0.99,
"recall_at_50": 0.99,
"recall_at_100": 1.0,
"precision_at_1": 0.8,
"precision_at_3": 0.31,
"precision_at_5": 0.196,
"precision_at_10": 0.099,
"precision_at_20": 0.0495,
"precision_at_50": 0.0198,
"precision_at_100": 0.01,
"mrr_at_1": 0.79,
"mrr_at_3": 0.865,
"mrr_at_5": 0.872,
"mrr_at_10": 0.8736666666666667,
"mrr_at_20": 0.8736666666666667,
"mrr_at_50": 0.8736666666666667,
"mrr_at_100": 0.8738036529680366,
"naucs_at_1_max": 0.1717282717282722,
"naucs_at_1_std": -0.36158841158841215,
"naucs_at_1_diff1": 0.8469030969030963,
"naucs_at_3_max": 0.01674002934507224,
"naucs_at_3_std": -0.664332399626516,
"naucs_at_3_diff1": 0.8195945044684548,
"naucs_at_5_max": 0.35807656395892185,
"naucs_at_5_std": -0.10270774976657283,
"naucs_at_5_diff1": 0.7117180205415541,
"naucs_at_10_max": 0.35807656395891135,
"naucs_at_10_std": 0.35807656395891135,
"naucs_at_10_diff1": 0.5541549953314738,
"naucs_at_20_max": 0.35807656395891135,
"naucs_at_20_std": 0.35807656395891135,
"naucs_at_20_diff1": 0.5541549953314738,
"naucs_at_50_max": 0.35807656395892007,
"naucs_at_50_std": 0.35807656395892007,
"naucs_at_50_diff1": 0.554154995331464,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"vidore/syntheticDocQA_artificial_intelligence_test": {
"ndcg_at_1": 0.99,
"ndcg_at_3": 0.99631,
"ndcg_at_5": 0.99631,
"ndcg_at_10": 0.99631,
"ndcg_at_20": 0.99631,
"ndcg_at_50": 0.99631,
"ndcg_at_100": 0.99631,
"map_at_1": 0.99,
"map_at_3": 0.995,
"map_at_5": 0.995,
"map_at_10": 0.995,
"map_at_20": 0.995,
"map_at_50": 0.995,
"map_at_100": 0.995,
"recall_at_1": 0.99,
"recall_at_3": 1.0,
"recall_at_5": 1.0,
"recall_at_10": 1.0,
"recall_at_20": 1.0,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.99,
"precision_at_3": 0.33333,
"precision_at_5": 0.2,
"precision_at_10": 0.1,
"precision_at_20": 0.05,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.99,
"mrr_at_3": 0.995,
"mrr_at_5": 0.995,
"mrr_at_10": 0.995,
"mrr_at_20": 0.995,
"mrr_at_50": 0.995,
"mrr_at_100": 0.995,
"naucs_at_1_max": 0.7222222222222201,
"naucs_at_1_std": 0.7222222222222201,
"naucs_at_1_diff1": 1.0,
"naucs_at_3_max": 1.0,
"naucs_at_3_std": 1.0,
"naucs_at_3_diff1": 1.0,
"naucs_at_5_max": 1.0,
"naucs_at_5_std": 1.0,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 1.0,
"naucs_at_10_std": 1.0,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": 1.0,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"vidore/syntheticDocQA_energy_test": {
"ndcg_at_1": 0.94,
"ndcg_at_3": 0.95131,
"ndcg_at_5": 0.95992,
"ndcg_at_10": 0.96641,
"ndcg_at_20": 0.96641,
"ndcg_at_50": 0.96641,
"ndcg_at_100": 0.96641,
"map_at_1": 0.94,
"map_at_3": 0.94833,
"map_at_5": 0.95333,
"map_at_10": 0.95601,
"map_at_20": 0.95601,
"map_at_50": 0.95601,
"map_at_100": 0.95601,
"recall_at_1": 0.94,
"recall_at_3": 0.96,
"recall_at_5": 0.98,
"recall_at_10": 1.0,
"recall_at_20": 1.0,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.94,
"precision_at_3": 0.32,
"precision_at_5": 0.196,
"precision_at_10": 0.1,
"precision_at_20": 0.05,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.94,
"mrr_at_3": 0.9533333333333333,
"mrr_at_5": 0.9558333333333333,
"mrr_at_10": 0.9589285714285716,
"mrr_at_20": 0.9589285714285716,
"mrr_at_50": 0.9589285714285716,
"mrr_at_100": 0.9589285714285716,
"naucs_at_1_max": 0.6961562402738896,
"naucs_at_1_std": -0.4341736694677865,
"naucs_at_1_diff1": 0.9782135076252712,
"naucs_at_3_max": 0.73739495798319,
"naucs_at_3_std": -0.9213352007469611,
"naucs_at_3_diff1": 1.0,
"naucs_at_5_max": 0.6136788048552745,
"naucs_at_5_std": -1.7399626517273414,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 1.0,
"naucs_at_10_std": 1.0,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": 1.0,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"vidore/syntheticDocQA_government_reports_test": {
"ndcg_at_1": 0.88,
"ndcg_at_3": 0.95178,
"ndcg_at_5": 0.95178,
"ndcg_at_10": 0.95178,
"ndcg_at_20": 0.95178,
"ndcg_at_50": 0.95178,
"ndcg_at_100": 0.95178,
"map_at_1": 0.88,
"map_at_3": 0.935,
"map_at_5": 0.935,
"map_at_10": 0.935,
"map_at_20": 0.935,
"map_at_50": 0.935,
"map_at_100": 0.935,
"recall_at_1": 0.88,
"recall_at_3": 1.0,
"recall_at_5": 1.0,
"recall_at_10": 1.0,
"recall_at_20": 1.0,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.88,
"precision_at_3": 0.33333,
"precision_at_5": 0.2,
"precision_at_10": 0.1,
"precision_at_20": 0.05,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.89,
"mrr_at_3": 0.9416666666666668,
"mrr_at_5": 0.9416666666666668,
"mrr_at_10": 0.9416666666666668,
"mrr_at_20": 0.9416666666666668,
"mrr_at_50": 0.9416666666666668,
"mrr_at_100": 0.9416666666666668,
"naucs_at_1_max": 0.42968501431753087,
"naucs_at_1_std": 0.40972001272669406,
"naucs_at_1_diff1": 0.8544384346166086,
"naucs_at_3_max": 1.0,
"naucs_at_3_std": 1.0,
"naucs_at_3_diff1": 1.0,
"naucs_at_5_max": 1.0,
"naucs_at_5_std": 1.0,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 1.0,
"naucs_at_10_std": 1.0,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": 1.0,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
},
"vidore/syntheticDocQA_healthcare_industry_test": {
"ndcg_at_1": 0.97,
"ndcg_at_3": 0.98893,
"ndcg_at_5": 0.98893,
"ndcg_at_10": 0.98893,
"ndcg_at_20": 0.98893,
"ndcg_at_50": 0.98893,
"ndcg_at_100": 0.98893,
"map_at_1": 0.97,
"map_at_3": 0.985,
"map_at_5": 0.985,
"map_at_10": 0.985,
"map_at_20": 0.985,
"map_at_50": 0.985,
"map_at_100": 0.985,
"recall_at_1": 0.97,
"recall_at_3": 1.0,
"recall_at_5": 1.0,
"recall_at_10": 1.0,
"recall_at_20": 1.0,
"recall_at_50": 1.0,
"recall_at_100": 1.0,
"precision_at_1": 0.97,
"precision_at_3": 0.33333,
"precision_at_5": 0.2,
"precision_at_10": 0.1,
"precision_at_20": 0.05,
"precision_at_50": 0.02,
"precision_at_100": 0.01,
"mrr_at_1": 0.98,
"mrr_at_3": 0.99,
"mrr_at_5": 0.99,
"mrr_at_10": 0.99,
"mrr_at_20": 0.99,
"mrr_at_50": 0.99,
"mrr_at_100": 0.99,
"naucs_at_1_max": 0.5448179271708694,
"naucs_at_1_std": 0.044817927170871553,
"naucs_at_1_diff1": 1.0,
"naucs_at_3_max": 1.0,
"naucs_at_3_std": 1.0,
"naucs_at_3_diff1": 1.0,
"naucs_at_5_max": 1.0,
"naucs_at_5_std": 1.0,
"naucs_at_5_diff1": 1.0,
"naucs_at_10_max": 1.0,
"naucs_at_10_std": 1.0,
"naucs_at_10_diff1": 1.0,
"naucs_at_20_max": 1.0,
"naucs_at_20_std": 1.0,
"naucs_at_20_diff1": 1.0,
"naucs_at_50_max": null,
"naucs_at_50_std": null,
"naucs_at_50_diff1": null,
"naucs_at_100_max": null,
"naucs_at_100_std": null,
"naucs_at_100_diff1": null
}
}