{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.31620109957758985, "bleu_stderr": 0.0436977639970438, "rouge1_fmeasure": 0.10315902016726786, "rouge1_fmeasure_stderr": 0.0019060070438482958, "rouge1_precision": 0.06769961049671226, "rouge1_precision_stderr": 0.0014408731719188182, "rouge1_recall": 0.2867407372924206, "rouge1_recall_stderr": 0.004571157006568459, "rouge2_fmeasure": 0.048680633498613235, "rouge2_fmeasure_stderr": 0.0012001070226091816, "rouge2_precision": 0.031623473816054536, "rouge2_precision_stderr": 0.0008563816673904925, "rouge2_recall": 0.14002477235273347, "rouge2_recall_stderr": 0.0030829927271468455, "rougeL_fmeasure": 0.10001471836261917, "rougeL_fmeasure_stderr": 0.0018101971022073298, "rougeL_precision": 0.06551735699492812, "rougeL_precision_stderr": 0.001360472354290908, "rougeL_recall": 0.27974078406805947, "rougeL_recall_stderr": 0.004483148560424672, "rougeLsum_fmeasure": 0.09908745681833024, "rougeLsum_fmeasure_stderr": 0.001816434962081851, "rougeLsum_precision": 0.06504923908690437, "rougeLsum_precision_stderr": 0.0013793228194582826, "rougeLsum_recall": 0.2754429077514643, "rougeLsum_recall_stderr": 0.00433299850418606}}, "1": {"PALM_prompt": {"bleu": 0.4465798489958593, "bleu_stderr": 0.03821208721897477, "rouge1_fmeasure": 0.11510221349692805, "rouge1_fmeasure_stderr": 0.0018417715919236185, "rouge1_precision": 0.07371823857673165, "rouge1_precision_stderr": 0.0013763349225185478, "rouge1_recall": 0.3688809731011637, "rouge1_recall_stderr": 0.005115562578388885, "rouge2_fmeasure": 0.053026565677639095, "rouge2_fmeasure_stderr": 0.0011718066518224836, "rouge2_precision": 0.03378602637117124, "rouge2_precision_stderr": 0.000831107209277974, "rouge2_recall": 0.17620010741543168, "rouge2_recall_stderr": 0.0034569647317057232, "rougeL_fmeasure": 0.10846810658720578, "rougeL_fmeasure_stderr": 0.0016257087585928257, "rougeL_precision": 0.06938216236815531, "rougeL_precision_stderr": 0.0012090035216715325, "rougeL_recall": 0.34811809237457786, "rougeL_recall_stderr": 0.004687691743161809, "rougeLsum_fmeasure": 0.11005414089372284, "rougeLsum_fmeasure_stderr": 0.0017281404618979693, "rougeLsum_precision": 0.07050615181309323, "rougeLsum_precision_stderr": 0.0012933152319356035, "rougeLsum_recall": 0.3514069079411779, "rougeLsum_recall_stderr": 0.004710020922149002}}, "2": {"PALM_prompt": {"bleu": 0.49390694019851883, "bleu_stderr": 0.03283528773113811, "rouge1_fmeasure": 0.11167166378709677, "rouge1_fmeasure_stderr": 0.0016694573474676788, "rouge1_precision": 0.07053978792457792, "rouge1_precision_stderr": 0.0012141148921630063, "rouge1_recall": 0.3722085841928087, "rouge1_recall_stderr": 0.004932224410126405, "rouge2_fmeasure": 0.05071036081345163, "rouge2_fmeasure_stderr": 0.0010731951740562927, "rouge2_precision": 0.031882639973859254, "rouge2_precision_stderr": 0.0007440437082987532, "rouge2_recall": 0.179162100861545, "rouge2_recall_stderr": 0.0036067927027667616, "rougeL_fmeasure": 0.10482960375745125, "rougeL_fmeasure_stderr": 0.0015367324295981716, "rougeL_precision": 0.0662695912572972, "rougeL_precision_stderr": 0.001111137879131896, "rougeL_recall": 0.34634376427492525, "rougeL_recall_stderr": 0.004426222539040666, "rougeLsum_fmeasure": 0.10651850585213189, "rougeLsum_fmeasure_stderr": 0.0015844678024154568, "rougeLsum_precision": 0.06731544242555773, "rougeLsum_precision_stderr": 0.0011479427958618216, "rougeLsum_recall": 0.35393011607524494, "rougeLsum_recall_stderr": 0.004611169262021209}}, "3": {"PALM_prompt": {"bleu": 0.5426048325951223, "bleu_stderr": 0.03414762901334615, "rouge1_fmeasure": 0.11159350504871245, "rouge1_fmeasure_stderr": 0.0016562900359034227, "rouge1_precision": 0.07041178144389862, "rouge1_precision_stderr": 0.0012146468016201537, "rouge1_recall": 0.3806080313854094, "rouge1_recall_stderr": 0.004930952912276716, "rouge2_fmeasure": 0.051399485378853214, "rouge2_fmeasure_stderr": 0.0010807547835818652, "rouge2_precision": 0.032283483005272874, "rouge2_precision_stderr": 0.0007563256470583733, "rouge2_recall": 0.18522848506406464, "rouge2_recall_stderr": 0.0035881170072198853, "rougeL_fmeasure": 0.10376227199390708, "rougeL_fmeasure_stderr": 0.001492834950808515, "rougeL_precision": 0.06553805543962049, "rougeL_precision_stderr": 0.0010879995668703526, "rougeL_recall": 0.3498070556202262, "rougeL_recall_stderr": 0.004296322479898717, "rougeLsum_fmeasure": 0.10593510385968205, "rougeLsum_fmeasure_stderr": 0.0015633618969914315, "rougeLsum_precision": 0.06689940608066422, "rougeLsum_precision_stderr": 0.0011444191721156794, "rougeLsum_recall": 0.35921150590689427, "rougeLsum_recall_stderr": 0.004534305089149354}}, "4": {"PALM_prompt": {"bleu": 0.6158935835123573, "bleu_stderr": 0.03969439975973284, "rouge1_fmeasure": 0.1127232845633186, "rouge1_fmeasure_stderr": 0.001650148473844283, "rouge1_precision": 0.07095341891738169, "rouge1_precision_stderr": 0.0012268960930883893, "rouge1_recall": 0.3948815888890596, "rouge1_recall_stderr": 0.00505695792325671, "rouge2_fmeasure": 0.05230538013971725, "rouge2_fmeasure_stderr": 0.0010638238078717074, "rouge2_precision": 0.03272634340230286, "rouge2_precision_stderr": 0.0007457412019553036, "rouge2_recall": 0.1970032898801884, "rouge2_recall_stderr": 0.003797281265549432, "rougeL_fmeasure": 0.10397420735695281, "rougeL_fmeasure_stderr": 0.001479748305227831, "rougeL_precision": 0.06554986867988374, "rougeL_precision_stderr": 0.001099297326932835, "rougeL_recall": 0.36044030372432745, "rougeL_recall_stderr": 0.004445317364552965, "rougeLsum_fmeasure": 0.10684181144801078, "rougeLsum_fmeasure_stderr": 0.001555630994167373, "rougeLsum_precision": 0.0673318377529105, "rougeLsum_precision_stderr": 0.0011577821136081392, "rougeLsum_recall": 0.37274353850210856, "rougeLsum_recall_stderr": 0.004690673077697574}}, "5": {"PALM_prompt": {"bleu": 0.5599015034833886, "bleu_stderr": 0.02863116158124125, "rouge1_fmeasure": 0.11039512335080189, "rouge1_fmeasure_stderr": 0.0015466817445104132, "rouge1_precision": 0.06902840436505926, "rouge1_precision_stderr": 0.0011145856685702779, "rouge1_recall": 0.39323447465184375, "rouge1_recall_stderr": 0.004991043149363716, "rouge2_fmeasure": 0.05099483054042069, "rouge2_fmeasure_stderr": 0.0010204042678031483, "rouge2_precision": 0.031714162258970564, "rouge2_precision_stderr": 0.0006995612067700058, "rouge2_recall": 0.19495949944965052, "rouge2_recall_stderr": 0.0038121376683133124, "rougeL_fmeasure": 0.1017740535739683, "rougeL_fmeasure_stderr": 0.0014243479541065289, "rougeL_precision": 0.06382078815066221, "rougeL_precision_stderr": 0.0010298208385526133, "rougeL_recall": 0.3570036135407675, "rougeL_recall_stderr": 0.00431277011710034, "rougeLsum_fmeasure": 0.1044773680345822, "rougeLsum_fmeasure_stderr": 0.001473141262559054, "rougeLsum_precision": 0.06543964695789724, "rougeLsum_precision_stderr": 0.0010627633224600764, "rougeLsum_recall": 0.369631200254553, "rougeLsum_recall_stderr": 0.004590693587109356}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.60885283648322, "bleu_stderr": 0.046404803775343256, "rouge1_fmeasure": 0.16981770764951246, "rouge1_fmeasure_stderr": 0.0018844380426673607, "rouge1_precision": 0.146341713551491, "rouge1_precision_stderr": 0.001907488992714226, "rouge1_recall": 0.24303710279927596, "rouge1_recall_stderr": 0.0026740629162863815, "rouge2_fmeasure": 0.03548853418089557, "rouge2_fmeasure_stderr": 0.0008596537307285957, "rouge2_precision": 0.030255907844947725, "rouge2_precision_stderr": 0.0007661823292966557, "rouge2_recall": 0.0524686714748099, "rouge2_recall_stderr": 0.0013880458970171093, "rougeL_fmeasure": 0.1358656284421895, "rougeL_fmeasure_stderr": 0.001389903118786626, "rougeL_precision": 0.11563887486905755, "rougeL_precision_stderr": 0.001369806180194911, "rougeL_recall": 0.1990169050957429, "rougeL_recall_stderr": 0.00219255306093255, "rougeLsum_fmeasure": 0.15524577102172657, "rougeLsum_fmeasure_stderr": 0.0017126012169208825, "rougeLsum_precision": 0.13357747346540397, "rougeLsum_precision_stderr": 0.0017299539524552423, "rougeLsum_recall": 0.22314380798385272, "rougeLsum_recall_stderr": 0.0024794181108329524}}, "1": {"tldr_en": {"bleu": 2.725412897374069, "bleu_stderr": 0.06590713364460175, "rouge1_fmeasure": 0.21273278313561203, "rouge1_fmeasure_stderr": 0.002011144383038581, "rouge1_precision": 0.19152350230841855, "rouge1_precision_stderr": 0.0023810619465519586, "rouge1_recall": 0.302694565096085, "rouge1_recall_stderr": 0.002871626633712586, "rouge2_fmeasure": 0.05180034750467234, "rouge2_fmeasure_stderr": 0.0010557187582866223, "rouge2_precision": 0.04768841739901736, "rouge2_precision_stderr": 0.0012211060679656308, "rouge2_recall": 0.07569607558899676, "rouge2_recall_stderr": 0.0016977441994545117, "rougeL_fmeasure": 0.15200924118476186, "rougeL_fmeasure_stderr": 0.0013679053352126194, "rougeL_precision": 0.13653437043291017, "rougeL_precision_stderr": 0.001724532681214248, "rougeL_recall": 0.22191488232376044, "rougeL_recall_stderr": 0.0022628821878105465, "rougeLsum_fmeasure": 0.19969478957091424, "rougeLsum_fmeasure_stderr": 0.0018860691826304264, "rougeLsum_precision": 0.17974451166450459, "rougeLsum_precision_stderr": 0.0022478628561453545, "rougeLsum_recall": 0.28504093466511404, "rougeLsum_recall_stderr": 0.0027223245492742462}}, "2": {"tldr_en": {"bleu": 3.0660991212944317, "bleu_stderr": 0.10372713065464424, "rouge1_fmeasure": 0.21977815129794487, "rouge1_fmeasure_stderr": 0.0019325468923461176, "rouge1_precision": 0.21412338509678533, "rouge1_precision_stderr": 0.0028281010919592436, "rouge1_recall": 0.30461283300382674, "rouge1_recall_stderr": 0.002825271119088337, "rouge2_fmeasure": 0.05616050870223023, "rouge2_fmeasure_stderr": 0.0011252548440132944, "rouge2_precision": 0.05888063726692182, "rouge2_precision_stderr": 0.0017538775810198863, "rouge2_recall": 0.0782305781107223, "rouge2_recall_stderr": 0.001697698646970674, "rougeL_fmeasure": 0.15708445866755325, "rougeL_fmeasure_stderr": 0.0013652347675896105, "rougeL_precision": 0.15547333657821524, "rougeL_precision_stderr": 0.0023132587548469795, "rougeL_recall": 0.22142616128174153, "rougeL_recall_stderr": 0.0022228357872264405, "rougeLsum_fmeasure": 0.20703520109346182, "rougeLsum_fmeasure_stderr": 0.0018184636268796823, "rougeLsum_precision": 0.20218982558840237, "rougeLsum_precision_stderr": 0.002724146894044121, "rougeLsum_recall": 0.28724184959573407, "rougeLsum_recall_stderr": 0.002676027470194893}}, "3": {"tldr_en": {"bleu": 3.043581013367525, "bleu_stderr": 0.06318311374792976, "rouge1_fmeasure": 0.18460495577113004, "rouge1_fmeasure_stderr": 0.0023270611135582223, "rouge1_precision": 0.19006263661359438, "rouge1_precision_stderr": 0.003139121389089328, "rouge1_recall": 0.25004795480735637, "rouge1_recall_stderr": 0.003318865578322209, "rouge2_fmeasure": 0.0465256311864123, "rouge2_fmeasure_stderr": 0.0010870859889237309, "rouge2_precision": 0.04998451594641819, "rouge2_precision_stderr": 0.0015733990846015632, "rouge2_recall": 0.06377668032838274, "rouge2_recall_stderr": 0.0016076140964349293, "rougeL_fmeasure": 0.1325297521693101, "rougeL_fmeasure_stderr": 0.0016515379862171921, "rougeL_precision": 0.1388220207502087, "rougeL_precision_stderr": 0.0024768396997075434, "rougeL_recall": 0.18232394784353995, "rougeL_recall_stderr": 0.0025352244187402725, "rougeLsum_fmeasure": 0.17377308374858433, "rougeLsum_fmeasure_stderr": 0.0021801660978291804, "rougeLsum_precision": 0.17915267789040445, "rougeLsum_precision_stderr": 0.0029769183305334277, "rougeLsum_recall": 0.23593719882808015, "rougeLsum_recall_stderr": 0.0031494826787230117}}, "4": {"tldr_en": {"bleu": 0.5444888845892801, "bleu_stderr": 0.04621602768652671, "rouge1_fmeasure": 0.05811203454473267, "rouge1_fmeasure_stderr": 0.0019981446295197548, "rouge1_precision": 0.06078951045960508, "rouge1_precision_stderr": 0.002443721533125645, "rouge1_recall": 0.08186853894096363, "rouge1_recall_stderr": 0.0028763649076511124, "rouge2_fmeasure": 0.01512885969707243, "rouge2_fmeasure_stderr": 0.0007703321227883491, "rouge2_precision": 0.01680552219176822, "rouge2_precision_stderr": 0.0011749998773802146, "rouge2_recall": 0.021789779449750947, "rouge2_recall_stderr": 0.0011367880836474229, "rougeL_fmeasure": 0.04285501108776758, "rougeL_fmeasure_stderr": 0.0014773789216696632, "rougeL_precision": 0.04590783650634408, "rougeL_precision_stderr": 0.0019570366932069668, "rougeL_recall": 0.06116884881798984, "rougeL_recall_stderr": 0.002201839898397505, "rougeLsum_fmeasure": 0.05447901946898106, "rougeLsum_fmeasure_stderr": 0.0018729612207289811, "rougeLsum_precision": 0.057044182216271055, "rougeLsum_precision_stderr": 0.0023002698396750224, "rougeLsum_recall": 0.07690877478375856, "rougeLsum_recall_stderr": 0.00271186082309868}}, "5": {"tldr_en": {"bleu": 2.039795888249637e-07, "bleu_stderr": 6.241479656801881e-07, "rouge1_fmeasure": 0.008974413993334825, "rouge1_fmeasure_stderr": 0.000850429801246656, "rouge1_precision": 0.00905136410465181, "rouge1_precision_stderr": 0.0009625732504594573, "rouge1_recall": 0.013165140267782167, "rouge1_recall_stderr": 0.0013100670955066764, "rouge2_fmeasure": 0.0022731813763166996, "rouge2_fmeasure_stderr": 0.0003025709305560882, "rouge2_precision": 0.002595081746321728, "rouge2_precision_stderr": 0.0004928989810568098, "rouge2_recall": 0.0034078615155149253, "rouge2_recall_stderr": 0.000480327507603207, "rougeL_fmeasure": 0.006751312855145466, "rougeL_fmeasure_stderr": 0.0006422189838493418, "rougeL_precision": 0.007005791567818198, "rougeL_precision_stderr": 0.0007842438362092874, "rougeL_recall": 0.009863523757332088, "rougeL_recall_stderr": 0.0009910793454999053, "rougeLsum_fmeasure": 0.008374385321680305, "rougeLsum_fmeasure_stderr": 0.0007920142646349635, "rougeLsum_precision": 0.008492645686409112, "rougeLsum_precision_stderr": 0.0009129144636313662, "rougeLsum_recall": 0.012275407152918577, "rougeLsum_recall_stderr": 0.0012159807830293056}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 0.9486318659821757, "bleu_stderr": 0.046054186708753594, "rouge1_fmeasure": 0.06647296884394631, "rouge1_fmeasure_stderr": 0.0013703971424785793, "rouge1_precision": 0.05127435604947866, "rouge1_precision_stderr": 0.0010816160215933884, "rouge1_recall": 0.09809462257860511, "rouge1_recall_stderr": 0.001988448826829593, "rouge2_fmeasure": 0.011764220975410813, "rouge2_fmeasure_stderr": 0.0005194241761303413, "rouge2_precision": 0.009013651576884465, "rouge2_precision_stderr": 0.0003983827007173943, "rouge2_recall": 0.017566860336679598, "rouge2_recall_stderr": 0.0007876531254085971, "rougeL_fmeasure": 0.06585835855034873, "rougeL_fmeasure_stderr": 0.0013503477728497991, "rougeL_precision": 0.050780395408484696, "rougeL_precision_stderr": 0.001064268150921614, "rougeL_recall": 0.09725254219294728, "rougeL_recall_stderr": 0.001963943905207662, "rougeLsum_fmeasure": 0.05626251970787973, "rougeLsum_fmeasure_stderr": 0.0011217151771389764, "rougeLsum_precision": 0.04328842801917388, "rougeLsum_precision_stderr": 0.0008811589017402656, "rougeLsum_recall": 0.083491757226437, "rougeLsum_recall_stderr": 0.0016470232472348585}}, "1": {"generate_text_restaurant": {"bleu": 10.736417414826192, "bleu_stderr": 0.12883315690574576, "rouge1_fmeasure": 0.42347669756200107, "rouge1_fmeasure_stderr": 0.002299761985015768, "rouge1_precision": 0.4994281816248813, "rouge1_precision_stderr": 0.00315562260432105, "rouge1_recall": 0.4074682552684028, "rouge1_recall_stderr": 0.0028860632451414964, "rouge2_fmeasure": 0.19063915520224362, "rouge2_fmeasure_stderr": 0.001908484563894186, "rouge2_precision": 0.22810495987567186, "rouge2_precision_stderr": 0.0024574603360052174, "rouge2_recall": 0.1831102494700893, "rouge2_recall_stderr": 0.002053236226953995, "rougeL_fmeasure": 0.30934327771314435, "rougeL_fmeasure_stderr": 0.0019536593166029873, "rougeL_precision": 0.3668088539701383, "rougeL_precision_stderr": 0.0027243573366763025, "rougeL_recall": 0.29737795551223317, "rougeL_recall_stderr": 0.0023390292209083986, "rougeLsum_fmeasure": 0.34772596056303123, "rougeLsum_fmeasure_stderr": 0.0022228086994649674, "rougeLsum_precision": 0.41086699735293175, "rougeLsum_precision_stderr": 0.00298010231762013, "rougeLsum_recall": 0.33421135617493986, "rougeLsum_recall_stderr": 0.0026325643111599697}}, "2": {"generate_text_restaurant": {"bleu": 11.947803791576034, "bleu_stderr": 0.18068831586395323, "rouge1_fmeasure": 0.43222217428452275, "rouge1_fmeasure_stderr": 0.002325391661151201, "rouge1_precision": 0.5073660157910931, "rouge1_precision_stderr": 0.0035132557513627384, "rouge1_recall": 0.4252886953751185, "rouge1_recall_stderr": 0.0028365349980832635, "rouge2_fmeasure": 0.20576675267077524, "rouge2_fmeasure_stderr": 0.001963830551898311, "rouge2_precision": 0.24649494438796668, "rouge2_precision_stderr": 0.0027184108588514406, "rouge2_recall": 0.20184046785984408, "rouge2_recall_stderr": 0.0021123641171435486, "rougeL_fmeasure": 0.32621056636133966, "rougeL_fmeasure_stderr": 0.001998413132278442, "rougeL_precision": 0.3837579986355456, "rougeL_precision_stderr": 0.0030213974997960135, "rougeL_recall": 0.32249416980407164, "rougeL_recall_stderr": 0.0024171000266711845, "rougeLsum_fmeasure": 0.362643163803525, "rougeLsum_fmeasure_stderr": 0.0022826535654147787, "rougeLsum_precision": 0.4264901349632602, "rougeLsum_precision_stderr": 0.0033243377703121176, "rougeLsum_recall": 0.35635697158144575, "rougeLsum_recall_stderr": 0.0026380595993714005}}, "3": {"generate_text_restaurant": {"bleu": 11.022223505125432, "bleu_stderr": 0.14435451624639248, "rouge1_fmeasure": 0.4122731478459889, "rouge1_fmeasure_stderr": 0.0023286861099915115, "rouge1_precision": 0.47445453300900486, "rouge1_precision_stderr": 0.003918784702695351, "rouge1_recall": 0.4372528894635071, "rouge1_recall_stderr": 0.0029315268755683195, "rouge2_fmeasure": 0.20060096359818363, "rouge2_fmeasure_stderr": 0.0019169537157168396, "rouge2_precision": 0.23627437735170165, "rouge2_precision_stderr": 0.0028287810639010436, "rouge2_recall": 0.21271321394771003, "rouge2_recall_stderr": 0.0021996801944212745, "rougeL_fmeasure": 0.3208945118759007, "rougeL_fmeasure_stderr": 0.002007420505456512, "rougeL_precision": 0.3679608824002368, "rougeL_precision_stderr": 0.003302299484821572, "rougeL_recall": 0.34501971416413774, "rougeL_recall_stderr": 0.002657419633721613, "rougeLsum_fmeasure": 0.34897504961881226, "rougeLsum_fmeasure_stderr": 0.0022990110747661196, "rougeLsum_precision": 0.40239904758288486, "rougeLsum_precision_stderr": 0.0036502771896898987, "rougeLsum_recall": 0.3695275624157989, "rougeLsum_recall_stderr": 0.0027595288849904336}}, "4": {"generate_text_restaurant": {"bleu": 9.968039437977147, "bleu_stderr": 0.16372238418882856, "rouge1_fmeasure": 0.3942231576041269, "rouge1_fmeasure_stderr": 0.002305613856580516, "rouge1_precision": 0.43588888990546887, "rouge1_precision_stderr": 0.004022019430599169, "rouge1_recall": 0.4458867552004997, "rouge1_recall_stderr": 0.0028782803291545513, "rouge2_fmeasure": 0.1911423171080508, "rouge2_fmeasure_stderr": 0.0018706868888293648, "rouge2_precision": 0.21649002753801427, "rouge2_precision_stderr": 0.002818208322338056, "rouge2_recall": 0.2164206555655709, "rouge2_recall_stderr": 0.002180147158374511, "rougeL_fmeasure": 0.3129997975563598, "rougeL_fmeasure_stderr": 0.0019192520823043578, "rougeL_precision": 0.34301626897705667, "rougeL_precision_stderr": 0.0032663142976474832, "rougeL_recall": 0.3603682332684797, "rougeL_recall_stderr": 0.002650578012719782, "rougeLsum_fmeasure": 0.3342250141451574, "rougeLsum_fmeasure_stderr": 0.0022869639714824075, "rougeLsum_precision": 0.3700159885396528, "rougeLsum_precision_stderr": 0.003699304823578603, "rougeLsum_recall": 0.37759731987687517, "rougeLsum_recall_stderr": 0.0027625981535221496}}, "5": {"generate_text_restaurant": {"bleu": 9.267917474708051, "bleu_stderr": 0.0863498368743197, "rouge1_fmeasure": 0.38301060693441696, "rouge1_fmeasure_stderr": 0.0022710773465877397, "rouge1_precision": 0.40824332377558614, "rouge1_precision_stderr": 0.004053792791346083, "rouge1_recall": 0.4545220617281385, "rouge1_recall_stderr": 0.0027916622089178417, "rouge2_fmeasure": 0.1856207485297989, "rouge2_fmeasure_stderr": 0.0017855294573506195, "rouge2_precision": 0.2031488158554883, "rouge2_precision_stderr": 0.0027549921677444858, "rouge2_recall": 0.22030941659210415, "rouge2_recall_stderr": 0.002116008910837953, "rougeL_fmeasure": 0.30811802294334445, "rougeL_fmeasure_stderr": 0.0018298681577941182, "rougeL_precision": 0.3245979445437026, "rougeL_precision_stderr": 0.00323088675022427, "rougeL_recall": 0.37317081898251825, "rougeL_recall_stderr": 0.0025979568518245586, "rougeLsum_fmeasure": 0.3263399929619776, "rougeLsum_fmeasure_stderr": 0.0022192850835474867, "rougeLsum_precision": 0.34851330936717334, "rougeLsum_precision_stderr": 0.0036963981631764316, "rougeLsum_recall": 0.386814061201923, "rougeLsum_recall_stderr": 0.0026979746355648222}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 2.022928782196655, "bleu_stderr": 0.06323504041482224, "rouge1_fmeasure": 0.20850602933405124, "rouge1_fmeasure_stderr": 0.0025783509188228872, "rouge1_precision": 0.1690176511800054, "rouge1_precision_stderr": 0.0025057503766924764, "rouge1_recall": 0.3169600025152783, "rouge1_recall_stderr": 0.004390086610875057, "rouge2_fmeasure": 0.04480106981761703, "rouge2_fmeasure_stderr": 0.0016469393826685948, "rouge2_precision": 0.035231821829655605, "rouge2_precision_stderr": 0.0014122236080052043, "rouge2_recall": 0.0721669404414664, "rouge2_recall_stderr": 0.0026942676554950196, "rougeL_fmeasure": 0.15783763779709026, "rougeL_fmeasure_stderr": 0.0020045338016978164, "rougeL_precision": 0.1276621204119681, "rougeL_precision_stderr": 0.0019441096332612402, "rougeL_recall": 0.24175632866951158, "rougeL_recall_stderr": 0.0035366671887579804, "rougeLsum_fmeasure": 0.16234750057160516, "rougeLsum_fmeasure_stderr": 0.0021521921302323334, "rougeLsum_precision": 0.13096994127744102, "rougeLsum_precision_stderr": 0.002011329849282318, "rougeLsum_recall": 0.24916483206303525, "rougeLsum_recall_stderr": 0.003801039212088291}}, "1": {"article_DOC_summary": {"bleu": 1.3013783094677602, "bleu_stderr": 0.05323851494545823, "rouge1_fmeasure": 0.17053066710298548, "rouge1_fmeasure_stderr": 0.00248505468489638, "rouge1_precision": 0.1208560729467065, "rouge1_precision_stderr": 0.0018331156830519264, "rouge1_recall": 0.3011735743290485, "rouge1_recall_stderr": 0.004262574821709688, "rouge2_fmeasure": 0.033207183560968925, "rouge2_fmeasure_stderr": 0.001348828018973971, "rouge2_precision": 0.023321914774610174, "rouge2_precision_stderr": 0.0009490899905683155, "rouge2_recall": 0.06000231967162931, "rouge2_recall_stderr": 0.002490214577848948, "rougeL_fmeasure": 0.13262019002149206, "rougeL_fmeasure_stderr": 0.0018340910251430245, "rougeL_precision": 0.09381616328217902, "rougeL_precision_stderr": 0.0013434290825839483, "rougeL_recall": 0.23579210005809345, "rougeL_recall_stderr": 0.0033043055105988852, "rougeLsum_fmeasure": 0.13665130703802245, "rougeLsum_fmeasure_stderr": 0.0019843002642716883, "rougeLsum_precision": 0.09660547186408498, "rougeLsum_precision_stderr": 0.001445839504863143, "rougeLsum_recall": 0.24312964604533158, "rougeLsum_recall_stderr": 0.0035600019821752133}}, "2": {"article_DOC_summary": {"bleu": 1.4610227609434248, "bleu_stderr": 0.10327228234775739, "rouge1_fmeasure": 0.17640095609918918, "rouge1_fmeasure_stderr": 0.0024236476790657165, "rouge1_precision": 0.12496533702098848, "rouge1_precision_stderr": 0.0017902842566202737, "rouge1_recall": 0.31218014639465674, "rouge1_recall_stderr": 0.004202785523007602, "rouge2_fmeasure": 0.036694425298060884, "rouge2_fmeasure_stderr": 0.001436730910285075, "rouge2_precision": 0.02572420280473422, "rouge2_precision_stderr": 0.0010068612303705702, "rouge2_recall": 0.06686357551325348, "rouge2_recall_stderr": 0.002695792942377374, "rougeL_fmeasure": 0.13833597033877038, "rougeL_fmeasure_stderr": 0.0018696740518708518, "rougeL_precision": 0.09783615822934287, "rougeL_precision_stderr": 0.0013714730714619002, "rougeL_recall": 0.2462675293448225, "rougeL_recall_stderr": 0.0033637471659569394, "rougeLsum_fmeasure": 0.14067838491016335, "rougeLsum_fmeasure_stderr": 0.0020231190670618898, "rougeLsum_precision": 0.0994096762980347, "rougeLsum_precision_stderr": 0.001470776129912826, "rougeLsum_recall": 0.25080300299758923, "rougeLsum_recall_stderr": 0.0036598233956450744}}, "3": {"article_DOC_summary": {"bleu": 1.5362804322700707, "bleu_stderr": 0.11595973725688433, "rouge1_fmeasure": 0.17278808012766025, "rouge1_fmeasure_stderr": 0.0026240269874744267, "rouge1_precision": 0.12510405231526503, "rouge1_precision_stderr": 0.002062669731180533, "rouge1_recall": 0.3002566487080628, "rouge1_recall_stderr": 0.00444519044441344, "rouge2_fmeasure": 0.03632164091184316, "rouge2_fmeasure_stderr": 0.0014329723024295558, "rouge2_precision": 0.025915517056828243, "rouge2_precision_stderr": 0.001041527932832055, "rouge2_recall": 0.06490306343860648, "rouge2_recall_stderr": 0.002582065276373352, "rougeL_fmeasure": 0.13425652952824363, "rougeL_fmeasure_stderr": 0.0019915146930490554, "rougeL_precision": 0.09706185807135201, "rougeL_precision_stderr": 0.0015576011801810463, "rougeL_recall": 0.23482330953325586, "rougeL_recall_stderr": 0.0035152268940508787, "rougeLsum_fmeasure": 0.13896782667459545, "rougeLsum_fmeasure_stderr": 0.0021519301734642866, "rougeLsum_precision": 0.10039857540576827, "rougeLsum_precision_stderr": 0.0016632482173482024, "rougeLsum_recall": 0.24311650290142006, "rougeLsum_recall_stderr": 0.0037784538877470666}}, "4": {"article_DOC_summary": {"bleu": 0.6830672784259785, "bleu_stderr": 0.1433690132848898, "rouge1_fmeasure": 0.04542922982390074, "rouge1_fmeasure_stderr": 0.0025681655681753014, "rouge1_precision": 0.03756651198393947, "rouge1_precision_stderr": 0.0023236074296884438, "rouge1_recall": 0.07282121177546534, "rouge1_recall_stderr": 0.0042242724928273434, "rouge2_fmeasure": 0.008994455579157571, "rouge2_fmeasure_stderr": 0.0008310182585970243, "rouge2_precision": 0.006737094306664144, "rouge2_precision_stderr": 0.000626877122582944, "rouge2_recall": 0.015461875442437803, "rouge2_recall_stderr": 0.0014919283390046763, "rougeL_fmeasure": 0.035105523746789644, "rougeL_fmeasure_stderr": 0.001981716429062695, "rougeL_precision": 0.02937799854609358, "rougeL_precision_stderr": 0.001900401107297335, "rougeL_recall": 0.05665888070678968, "rougeL_recall_stderr": 0.0033350108370089723, "rougeLsum_fmeasure": 0.036860085207122494, "rougeLsum_fmeasure_stderr": 0.00209278103955841, "rougeLsum_precision": 0.030851918047711355, "rougeLsum_precision_stderr": 0.001993157296417591, "rougeLsum_recall": 0.059397277374744976, "rougeLsum_recall_stderr": 0.003504149895888219}}, "5": {"article_DOC_summary": {"bleu": 3.607095794764019e-38, "bleu_stderr": 1.5118654753033633e-33, "rouge1_fmeasure": 0.0022333095605726874, "rouge1_fmeasure_stderr": 0.0005881591558060873, "rouge1_precision": 0.0024341904015074173, "rouge1_precision_stderr": 0.0006524893303985873, "rouge1_recall": 0.002130274826814078, "rouge1_recall_stderr": 0.0005569834732465687, "rouge2_fmeasure": 0.0001299846766359192, "rouge2_fmeasure_stderr": 7.573788646136168e-05, "rouge2_precision": 0.0001469327010392493, "rouge2_precision_stderr": 8.511648046715374e-05, "rouge2_recall": 0.00011774019543164939, "rouge2_recall_stderr": 6.929829602370543e-05, "rougeL_fmeasure": 0.0016791945013548595, "rougeL_fmeasure_stderr": 0.0004338697276550635, "rougeL_precision": 0.0018277319353608855, "rougeL_precision_stderr": 0.0004795477675060686, "rougeL_recall": 0.0016097800295936467, "rougeL_recall_stderr": 0.00041574825239381176, "rougeLsum_fmeasure": 0.001850332138799774, "rougeLsum_fmeasure_stderr": 0.00048558179067708615, "rougeLsum_precision": 0.0020186120549751606, "rougeLsum_precision_stderr": 0.0005377477849886966, "rougeLsum_recall": 0.0017704581231688795, "rougeLsum_recall_stderr": 0.0004643082172236394}}}}