{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.365505358129517, "bleu_stderr": 0.03502257670524251, "rouge1_fmeasure": 0.11517580303119217, "rouge1_fmeasure_stderr": 0.0020726202696031543, "rouge1_precision": 0.07648980561615028, "rouge1_precision_stderr": 0.0016823886910426983, "rouge1_recall": 0.316968269417661, "rouge1_recall_stderr": 0.004623445320634521, "rouge2_fmeasure": 0.05439843034235182, "rouge2_fmeasure_stderr": 0.0013023755402193301, "rouge2_precision": 0.03570362124189832, "rouge2_precision_stderr": 0.0009599625749737652, "rouge2_recall": 0.15470348037232984, "rouge2_recall_stderr": 0.003242824778038987, "rougeL_fmeasure": 0.11102338511120223, "rougeL_fmeasure_stderr": 0.0019162065673904122, "rougeL_precision": 0.0734086130120135, "rougeL_precision_stderr": 0.0015390196221697744, "rougeL_recall": 0.30884652788740097, "rougeL_recall_stderr": 0.00451227940122316, "rougeLsum_fmeasure": 0.10975162370468329, "rougeLsum_fmeasure_stderr": 0.0019421285766935562, "rougeLsum_precision": 0.0728812519843257, "rougeLsum_precision_stderr": 0.0015910427532987823, "rougeLsum_recall": 0.30239723755664005, "rougeLsum_recall_stderr": 0.004314214246801637}}, "1": {"PALM_prompt": {"bleu": 0.4718765280215146, "bleu_stderr": 0.02672659137955592, "rouge1_fmeasure": 0.11775338606123435, "rouge1_fmeasure_stderr": 0.001924384162772881, "rouge1_precision": 0.07654420057263799, "rouge1_precision_stderr": 0.001528431355295901, "rouge1_recall": 0.3706220656375829, "rouge1_recall_stderr": 0.005186402601785923, "rouge2_fmeasure": 0.05500396414987799, "rouge2_fmeasure_stderr": 0.001213368877240726, "rouge2_precision": 0.03570999027007081, "rouge2_precision_stderr": 0.0009259668096094864, "rouge2_recall": 0.1822691656242857, "rouge2_recall_stderr": 0.0036821478817688734, "rougeL_fmeasure": 0.11151902972714106, "rougeL_fmeasure_stderr": 0.0017404591497852157, "rougeL_precision": 0.07222463413711289, "rougeL_precision_stderr": 0.0013459334398937528, "rougeL_recall": 0.3516108976702013, "rougeL_recall_stderr": 0.004840237014367524, "rougeLsum_fmeasure": 0.11173525418209604, "rougeLsum_fmeasure_stderr": 0.0018042448789429362, "rougeLsum_precision": 0.07254869188023266, "rougeLsum_precision_stderr": 0.0014083064426811413, "rougeLsum_recall": 0.3508473688063052, "rougeLsum_recall_stderr": 0.004774412270890995}}, "2": {"PALM_prompt": {"bleu": 0.48374587973148897, "bleu_stderr": 0.02160429268653843, "rouge1_fmeasure": 0.11843692560953636, "rouge1_fmeasure_stderr": 0.0017527280633787895, "rouge1_precision": 0.07520635325014476, "rouge1_precision_stderr": 0.0012989042348400615, "rouge1_recall": 0.39564239187862277, "rouge1_recall_stderr": 0.005166204918034083, "rouge2_fmeasure": 0.054721812477036336, "rouge2_fmeasure_stderr": 0.001114142006270754, "rouge2_precision": 0.034651911364013195, "rouge2_precision_stderr": 0.0008033018295138833, "rouge2_recall": 0.19427006065716845, "rouge2_recall_stderr": 0.003694246348436424, "rougeL_fmeasure": 0.11051417048104582, "rougeL_fmeasure_stderr": 0.0015915778651008035, "rougeL_precision": 0.07024200119155555, "rougeL_precision_stderr": 0.0011783887241769058, "rougeL_recall": 0.3660382891013138, "rougeL_recall_stderr": 0.004576443871389266, "rougeLsum_fmeasure": 0.11235520576986081, "rougeLsum_fmeasure_stderr": 0.001649520360666583, "rougeLsum_precision": 0.07137662063765705, "rougeLsum_precision_stderr": 0.0012216802168618529, "rougeLsum_recall": 0.3736585873846558, "rougeLsum_recall_stderr": 0.0047213971801516675}}, "3": {"PALM_prompt": {"bleu": 0.5399234847930408, "bleu_stderr": 0.02832255846005892, "rouge1_fmeasure": 0.12135721954139542, "rouge1_fmeasure_stderr": 0.002098842147816486, "rouge1_precision": 0.07987959903519301, "rouge1_precision_stderr": 0.001958806889747015, "rouge1_recall": 0.39125211905519386, "rouge1_recall_stderr": 0.005082258550273298, "rouge2_fmeasure": 0.056940304530391644, "rouge2_fmeasure_stderr": 0.001476712038400785, "rouge2_precision": 0.03807261851649924, "rouge2_precision_stderr": 0.0014606137888846914, "rouge2_recall": 0.1920905336863606, "rouge2_recall_stderr": 0.0037709962536828148, "rougeL_fmeasure": 0.11241760319665695, "rougeL_fmeasure_stderr": 0.001875353100684847, "rougeL_precision": 0.07393702555239919, "rougeL_precision_stderr": 0.0017596086344590835, "rougeL_recall": 0.3604586740703297, "rougeL_recall_stderr": 0.00447114612728174, "rougeLsum_fmeasure": 0.11489067985494965, "rougeLsum_fmeasure_stderr": 0.0019441426076225704, "rougeLsum_precision": 0.07556968795913989, "rougeLsum_precision_stderr": 0.0018059611644347965, "rougeLsum_recall": 0.36906064559005386, "rougeLsum_recall_stderr": 0.004657575811928199}}, "4": {"PALM_prompt": {"bleu": 0.5510849766399221, "bleu_stderr": 0.0175511957441724, "rouge1_fmeasure": 0.12506604984230196, "rouge1_fmeasure_stderr": 0.0021472394878356772, "rouge1_precision": 0.08534032348465934, "rouge1_precision_stderr": 0.002292239718680053, "rouge1_recall": 0.39434008978071233, "rouge1_recall_stderr": 0.004965906826527694, "rouge2_fmeasure": 0.05857717517903851, "rouge2_fmeasure_stderr": 0.0014885390811421018, "rouge2_precision": 0.04079538462727728, "rouge2_precision_stderr": 0.0016327036390176998, "rouge2_recall": 0.19630864366698197, "rouge2_recall_stderr": 0.003787999118899299, "rougeL_fmeasure": 0.11580311530092204, "rougeL_fmeasure_stderr": 0.0019176848380825057, "rougeL_precision": 0.07878721956235119, "rougeL_precision_stderr": 0.002055020271794094, "rougeL_recall": 0.364530967486755, "rougeL_recall_stderr": 0.004405836254872888, "rougeLsum_fmeasure": 0.11850283070508899, "rougeLsum_fmeasure_stderr": 0.0019921248365642125, "rougeLsum_precision": 0.08070493918368636, "rougeLsum_precision_stderr": 0.0021155618114281965, "rougeLsum_recall": 0.37309717144724813, "rougeLsum_recall_stderr": 0.0045779450824008265}}, "5": {"PALM_prompt": {"bleu": 0.6422980998155431, "bleu_stderr": 0.037904429698092754, "rouge1_fmeasure": 0.12675458660511493, "rouge1_fmeasure_stderr": 0.00211254006069773, "rouge1_precision": 0.08424188758880696, "rouge1_precision_stderr": 0.002073755705231499, "rouge1_recall": 0.4099473868748358, "rouge1_recall_stderr": 0.005200368795117541, "rouge2_fmeasure": 0.05982201871515683, "rouge2_fmeasure_stderr": 0.0014369670279242037, "rouge2_precision": 0.03998997078611554, "rouge2_precision_stderr": 0.001369954649204164, "rouge2_recall": 0.20657125503274204, "rouge2_recall_stderr": 0.003979108305764359, "rougeL_fmeasure": 0.11576724371241058, "rougeL_fmeasure_stderr": 0.001850628212707506, "rougeL_precision": 0.0764988131100183, "rougeL_precision_stderr": 0.0017647565104687796, "rougeL_recall": 0.3745750098125955, "rougeL_recall_stderr": 0.004580604196812087, "rougeLsum_fmeasure": 0.1196790452648868, "rougeLsum_fmeasure_stderr": 0.0019537411567052284, "rougeLsum_precision": 0.07933848644696936, "rougeLsum_precision_stderr": 0.00188255712696218, "rougeLsum_recall": 0.38689755781022106, "rougeLsum_recall_stderr": 0.004814338347726989}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.5771300792035017, "bleu_stderr": 0.04991796257960264, "rouge1_fmeasure": 0.1774235464739232, "rouge1_fmeasure_stderr": 0.0018163106034253622, "rouge1_precision": 0.1516264295226916, "rouge1_precision_stderr": 0.0018524175518842324, "rouge1_recall": 0.25832545207070934, "rouge1_recall_stderr": 0.002638155634459137, "rouge2_fmeasure": 0.036141464890612394, "rouge2_fmeasure_stderr": 0.000839659551210909, "rouge2_precision": 0.030629699620307885, "rouge2_precision_stderr": 0.0007444530530260053, "rouge2_recall": 0.05478482434968888, "rouge2_recall_stderr": 0.0014158784161058227, "rougeL_fmeasure": 0.13773474664769586, "rougeL_fmeasure_stderr": 0.0012950817280923518, "rougeL_precision": 0.11612341320254116, "rougeL_precision_stderr": 0.0012804789106474253, "rougeL_recall": 0.20607942556619077, "rougeL_recall_stderr": 0.002171423201122513, "rougeLsum_fmeasure": 0.16363854542371178, "rougeLsum_fmeasure_stderr": 0.0016593981477502706, "rougeLsum_precision": 0.13965855809404587, "rougeLsum_precision_stderr": 0.001693541152993375, "rougeLsum_recall": 0.23916390053431685, "rougeLsum_recall_stderr": 0.0024532076303709566}}, "1": {"tldr_en": {"bleu": 2.6338996032067037, "bleu_stderr": 0.04821985007341574, "rouge1_fmeasure": 0.21549296085889416, "rouge1_fmeasure_stderr": 0.001962312333109593, "rouge1_precision": 0.1960438684706822, "rouge1_precision_stderr": 0.002420004329456638, "rouge1_recall": 0.3054255437992693, "rouge1_recall_stderr": 0.0028119843202321767, "rouge2_fmeasure": 0.052527946163837866, "rouge2_fmeasure_stderr": 0.0010300747120330824, "rouge2_precision": 0.048597738419155066, "rouge2_precision_stderr": 0.0012043368500439934, "rouge2_recall": 0.07625438773178222, "rouge2_recall_stderr": 0.0016442065251268264, "rougeL_fmeasure": 0.1552047441571399, "rougeL_fmeasure_stderr": 0.0013475708470744893, "rougeL_precision": 0.14105634371954578, "rougeL_precision_stderr": 0.0017960770429619884, "rougeL_recall": 0.22476789816855414, "rougeL_recall_stderr": 0.002198629804934752, "rougeLsum_fmeasure": 0.2024541465021801, "rougeLsum_fmeasure_stderr": 0.0018427500688387478, "rougeLsum_precision": 0.1841194002510797, "rougeLsum_precision_stderr": 0.002285643984120407, "rougeLsum_recall": 0.2874198264299386, "rougeLsum_recall_stderr": 0.002661780779760906}}, "2": {"tldr_en": {"bleu": 2.7339435213952954, "bleu_stderr": 0.08831287809847477, "rouge1_fmeasure": 0.21122130658633273, "rouge1_fmeasure_stderr": 0.0018812807521498378, "rouge1_precision": 0.22208554630988123, "rouge1_precision_stderr": 0.0030592331065051187, "rouge1_recall": 0.2808452321492671, "rouge1_recall_stderr": 0.0027284281619657023, "rouge2_fmeasure": 0.05358064041219617, "rouge2_fmeasure_stderr": 0.001095882710793521, "rouge2_precision": 0.06046646631865548, "rouge2_precision_stderr": 0.0017721217804806883, "rouge2_recall": 0.07186596521205721, "rouge2_recall_stderr": 0.0015862584243939379, "rougeL_fmeasure": 0.15555355290554032, "rougeL_fmeasure_stderr": 0.0013845276157140925, "rougeL_precision": 0.1663336512931002, "rougeL_precision_stderr": 0.0025460716364344035, "rougeL_recall": 0.20924091942957526, "rougeL_recall_stderr": 0.0021395819034057957, "rougeLsum_fmeasure": 0.19918181053317313, "rougeLsum_fmeasure_stderr": 0.0017863595069102555, "rougeLsum_precision": 0.20966401003427135, "rougeLsum_precision_stderr": 0.0029349921286997397, "rougeLsum_recall": 0.26501858440596643, "rougeLsum_recall_stderr": 0.0025934297416044965}}, "3": {"tldr_en": {"bleu": 2.808827686001197, "bleu_stderr": 0.08213221206745722, "rouge1_fmeasure": 0.17457065630242485, "rouge1_fmeasure_stderr": 0.0022811171020873555, "rouge1_precision": 0.20151220398388653, "rouge1_precision_stderr": 0.003538573262408237, "rouge1_recall": 0.2223618574421121, "rouge1_recall_stderr": 0.0031370627753889795, "rouge2_fmeasure": 0.04538412430723011, "rouge2_fmeasure_stderr": 0.0011137423389001417, "rouge2_precision": 0.056450530011037774, "rouge2_precision_stderr": 0.001899159218772425, "rouge2_recall": 0.05804412523184788, "rouge2_recall_stderr": 0.001549150248868251, "rougeL_fmeasure": 0.13090310082030293, "rougeL_fmeasure_stderr": 0.001721329482675598, "rougeL_precision": 0.15447450169492752, "rougeL_precision_stderr": 0.0029508761594556, "rougeL_recall": 0.16842599358464877, "rougeL_recall_stderr": 0.002466298283915131, "rougeLsum_fmeasure": 0.1642585492586059, "rougeLsum_fmeasure_stderr": 0.002151308865930046, "rougeLsum_precision": 0.18997302354862627, "rougeLsum_precision_stderr": 0.003379901693046309, "rougeLsum_recall": 0.20932241363190107, "rougeLsum_recall_stderr": 0.0029630061584631977}}, "4": {"tldr_en": {"bleu": 0.42966794244887624, "bleu_stderr": 0.035917657004646976, "rouge1_fmeasure": 0.053785062512770904, "rouge1_fmeasure_stderr": 0.0019009934531933658, "rouge1_precision": 0.062065451767783136, "rouge1_precision_stderr": 0.0025766540709191484, "rouge1_recall": 0.07325002815770003, "rouge1_recall_stderr": 0.0027088207655545965, "rouge2_fmeasure": 0.014282852961170977, "rouge2_fmeasure_stderr": 0.0007741688780895341, "rouge2_precision": 0.017675628829991, "rouge2_precision_stderr": 0.0012407972320120778, "rouge2_recall": 0.01977636831988382, "rouge2_recall_stderr": 0.0011283949419256306, "rougeL_fmeasure": 0.04164135070814292, "rougeL_fmeasure_stderr": 0.0014736957523667849, "rougeL_precision": 0.049030420193037695, "rougeL_precision_stderr": 0.002131756729760763, "rougeL_recall": 0.05736282405821277, "rougeL_recall_stderr": 0.00216288276194006, "rougeLsum_fmeasure": 0.050035887012515115, "rougeLsum_fmeasure_stderr": 0.0017731426679041462, "rougeLsum_precision": 0.058036942597802434, "rougeLsum_precision_stderr": 0.002430597253785704, "rougeLsum_recall": 0.0679523381710879, "rougeLsum_recall_stderr": 0.002514986188456351}}, "5": {"tldr_en": {"bleu": 3.823406141653412e-08, "bleu_stderr": 2.3572915929393266e-07, "rouge1_fmeasure": 0.008135420542127486, "rouge1_fmeasure_stderr": 0.0008510596013228797, "rouge1_precision": 0.009545503572333743, "rouge1_precision_stderr": 0.0011345249271005433, "rouge1_recall": 0.010911180416057834, "rouge1_recall_stderr": 0.0011344359689942696, "rouge2_fmeasure": 0.002363561101990574, "rouge2_fmeasure_stderr": 0.0003463559402652083, "rouge2_precision": 0.0031516148332706023, "rouge2_precision_stderr": 0.0005738789950728937, "rouge2_recall": 0.003031168084874358, "rouge2_recall_stderr": 0.0004228518413073389, "rougeL_fmeasure": 0.0064498961923167225, "rougeL_fmeasure_stderr": 0.0006794408076426697, "rougeL_precision": 0.007713930656521292, "rougeL_precision_stderr": 0.0009395466555885211, "rougeL_recall": 0.008772010609353077, "rougeL_recall_stderr": 0.0009278010486524886, "rougeLsum_fmeasure": 0.007522191750756639, "rougeLsum_fmeasure_stderr": 0.0007926548281458674, "rougeLsum_precision": 0.008941240950458557, "rougeLsum_precision_stderr": 0.001083475475749176, "rougeLsum_recall": 0.010066280358176229, "rougeLsum_recall_stderr": 0.0010527295772454254}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 0.3208850619163438, "bleu_stderr": 0.027543719581997656, "rouge1_fmeasure": 0.10916751598723827, "rouge1_fmeasure_stderr": 0.0014055907970164387, "rouge1_precision": 0.10193917716251552, "rouge1_precision_stderr": 0.001262181298087086, "rouge1_recall": 0.15601250356121832, "rouge1_recall_stderr": 0.0020891935548174425, "rouge2_fmeasure": 0.009248558480455402, "rouge2_fmeasure_stderr": 0.0004313443991859932, "rouge2_precision": 0.007445964200184842, "rouge2_precision_stderr": 0.0003678087990770306, "rouge2_recall": 0.013249490277614285, "rouge2_recall_stderr": 0.0006050891673880483, "rougeL_fmeasure": 0.10228268189979718, "rougeL_fmeasure_stderr": 0.0012007887693969246, "rougeL_precision": 0.09622582095078518, "rougeL_precision_stderr": 0.0011221806240824383, "rougeL_recall": 0.14676075425466434, "rougeL_recall_stderr": 0.0018588780711754765, "rougeLsum_fmeasure": 0.09392560779905762, "rougeLsum_fmeasure_stderr": 0.0012365163701298068, "rougeLsum_precision": 0.09021551282781398, "rougeLsum_precision_stderr": 0.001196816947994912, "rougeLsum_recall": 0.13314596760706443, "rougeLsum_recall_stderr": 0.0018265117421291898}}, "1": {"generate_text_restaurant": {"bleu": 9.498137857144059, "bleu_stderr": 0.1477483846665993, "rouge1_fmeasure": 0.4119167949001581, "rouge1_fmeasure_stderr": 0.002445937789571047, "rouge1_precision": 0.46201076063949176, "rouge1_precision_stderr": 0.003576401067530048, "rouge1_recall": 0.4249090695108872, "rouge1_recall_stderr": 0.0028802714470119437, "rouge2_fmeasure": 0.18403497667662663, "rouge2_fmeasure_stderr": 0.0019162644583975092, "rouge2_precision": 0.2092047650298544, "rouge2_precision_stderr": 0.0024838168245392305, "rouge2_recall": 0.18917870334257866, "rouge2_recall_stderr": 0.0020759460916259984, "rougeL_fmeasure": 0.30413411528049716, "rougeL_fmeasure_stderr": 0.001945912792128954, "rougeL_precision": 0.3403440164840635, "rougeL_precision_stderr": 0.0028415076843255572, "rougeL_recall": 0.3170055892398947, "rougeL_recall_stderr": 0.002404493195497503, "rougeLsum_fmeasure": 0.33563087396583235, "rougeLsum_fmeasure_stderr": 0.0023149924126427478, "rougeLsum_precision": 0.3775599736681179, "rougeLsum_precision_stderr": 0.0032502114949214756, "rougeLsum_recall": 0.34538906935021624, "rougeLsum_recall_stderr": 0.0026367308341003165}}, "2": {"generate_text_restaurant": {"bleu": 13.178169645381882, "bleu_stderr": 0.14701876949947695, "rouge1_fmeasure": 0.46727420182238266, "rouge1_fmeasure_stderr": 0.0022489064451099916, "rouge1_precision": 0.5485301163149456, "rouge1_precision_stderr": 0.003233977450244202, "rouge1_recall": 0.44657986759919344, "rouge1_recall_stderr": 0.002892969727503868, "rouge2_fmeasure": 0.22659525794755594, "rouge2_fmeasure_stderr": 0.001980574922731356, "rouge2_precision": 0.27008917722754844, "rouge2_precision_stderr": 0.0026539245848408374, "rouge2_recall": 0.21646658883159345, "rouge2_recall_stderr": 0.002153896365279606, "rougeL_fmeasure": 0.3441210120028325, "rougeL_fmeasure_stderr": 0.00204980503397177, "rougeL_precision": 0.40630765997029067, "rougeL_precision_stderr": 0.002951468161215274, "rougeL_recall": 0.328147850195057, "rougeL_recall_stderr": 0.002418356461143628, "rougeLsum_fmeasure": 0.3866960602353657, "rougeLsum_fmeasure_stderr": 0.0022595897436360297, "rougeLsum_precision": 0.45540238483443796, "rougeLsum_precision_stderr": 0.003166546359535319, "rougeLsum_recall": 0.368741941065053, "rougeLsum_recall_stderr": 0.0026700865280267125}}, "3": {"generate_text_restaurant": {"bleu": 14.265105209260534, "bleu_stderr": 0.1893500782984233, "rouge1_fmeasure": 0.4799133777857901, "rouge1_fmeasure_stderr": 0.0022135808666613305, "rouge1_precision": 0.559024314601452, "rouge1_precision_stderr": 0.0031784190876307933, "rouge1_recall": 0.45808203587088997, "rouge1_recall_stderr": 0.0028518099942914533, "rouge2_fmeasure": 0.23933867072765447, "rouge2_fmeasure_stderr": 0.002056446121541092, "rouge2_precision": 0.28156906090939965, "rouge2_precision_stderr": 0.002633452625347187, "rouge2_recall": 0.22885468218951255, "rouge2_recall_stderr": 0.002267467095330921, "rougeL_fmeasure": 0.35296360624903717, "rougeL_fmeasure_stderr": 0.0020967204204817742, "rougeL_precision": 0.4125112452470242, "rougeL_precision_stderr": 0.002904863553764727, "rougeL_recall": 0.33660055867060584, "rougeL_recall_stderr": 0.002472291373452986, "rougeLsum_fmeasure": 0.3984458953846194, "rougeLsum_fmeasure_stderr": 0.002298372273182809, "rougeLsum_precision": 0.4644875443067367, "rougeLsum_precision_stderr": 0.0031234652192854697, "rougeLsum_recall": 0.3800515404807272, "rougeLsum_recall_stderr": 0.002711485448834275}}, "4": {"generate_text_restaurant": {"bleu": 14.311299442145796, "bleu_stderr": 0.2043752470776103, "rouge1_fmeasure": 0.48312751290425876, "rouge1_fmeasure_stderr": 0.00219722786310601, "rouge1_precision": 0.5595243846681779, "rouge1_precision_stderr": 0.003134221189136695, "rouge1_recall": 0.4610455256568642, "rouge1_recall_stderr": 0.002793888016644011, "rouge2_fmeasure": 0.23828760771878502, "rouge2_fmeasure_stderr": 0.002043450588678613, "rouge2_precision": 0.27887090816092297, "rouge2_precision_stderr": 0.0026246554724291865, "rouge2_recall": 0.22793411052086368, "rouge2_recall_stderr": 0.0022423088111720104, "rougeL_fmeasure": 0.3555764901156687, "rougeL_fmeasure_stderr": 0.0020670663945140033, "rougeL_precision": 0.41253108581089387, "rougeL_precision_stderr": 0.00283282528319235, "rougeL_recall": 0.3394690558137249, "rougeL_recall_stderr": 0.0024394133712828357, "rougeLsum_fmeasure": 0.4038760495426285, "rougeLsum_fmeasure_stderr": 0.002305749793250546, "rougeLsum_precision": 0.467697201819798, "rougeLsum_precision_stderr": 0.003094645415240535, "rougeLsum_recall": 0.3854933075172655, "rougeLsum_recall_stderr": 0.002709810392823172}}, "5": {"generate_text_restaurant": {"bleu": 14.402250187802036, "bleu_stderr": 0.1983928889862991, "rouge1_fmeasure": 0.48540929140592903, "rouge1_fmeasure_stderr": 0.0021715483077903346, "rouge1_precision": 0.5583813578424975, "rouge1_precision_stderr": 0.0031344137787681203, "rouge1_recall": 0.4642665683523303, "rouge1_recall_stderr": 0.002731585667992789, "rouge2_fmeasure": 0.2398021041336989, "rouge2_fmeasure_stderr": 0.0020301662097027286, "rouge2_precision": 0.27924813792572967, "rouge2_precision_stderr": 0.002635929222128578, "rouge2_recall": 0.22915068098077981, "rouge2_recall_stderr": 0.002170676781668329, "rougeL_fmeasure": 0.357735601845654, "rougeL_fmeasure_stderr": 0.002076611761684181, "rougeL_precision": 0.41264019927219936, "rougeL_precision_stderr": 0.002874141935635406, "rougeL_recall": 0.34201988731429955, "rougeL_recall_stderr": 0.0024029406608019996, "rougeLsum_fmeasure": 0.40708987645111167, "rougeLsum_fmeasure_stderr": 0.002281570268847696, "rougeLsum_precision": 0.4687058447147468, "rougeLsum_precision_stderr": 0.0031001215033715983, "rougeLsum_recall": 0.38926892052969453, "rougeLsum_recall_stderr": 0.002660572577149138}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 2.082420995996749, "bleu_stderr": 0.08510840681858502, "rouge1_fmeasure": 0.21361320484198185, "rouge1_fmeasure_stderr": 0.002539975403596883, "rouge1_precision": 0.1624663450684432, "rouge1_precision_stderr": 0.0022160293096088234, "rouge1_recall": 0.34744341300319803, "rouge1_recall_stderr": 0.004353721648015942, "rouge2_fmeasure": 0.0486530292947008, "rouge2_fmeasure_stderr": 0.0016139822828471707, "rouge2_precision": 0.03612968077045935, "rouge2_precision_stderr": 0.0012390705828397384, "rouge2_recall": 0.08240926002728291, "rouge2_recall_stderr": 0.0028024469958468482, "rougeL_fmeasure": 0.1614687609383373, "rougeL_fmeasure_stderr": 0.0019520455117725732, "rougeL_precision": 0.12244847188349789, "rougeL_precision_stderr": 0.001679495285671899, "rougeL_recall": 0.2645952209520843, "rougeL_recall_stderr": 0.0035203556610604583, "rougeLsum_fmeasure": 0.16739501050654218, "rougeLsum_fmeasure_stderr": 0.0021485643294003954, "rougeLsum_precision": 0.12662445631555733, "rougeLsum_precision_stderr": 0.0017816880579829913, "rougeLsum_recall": 0.275038473988472, "rougeLsum_recall_stderr": 0.003891933532028957}}, "1": {"article_DOC_summary": {"bleu": 1.563017708107888, "bleu_stderr": 0.06736983578799105, "rouge1_fmeasure": 0.18623035044278274, "rouge1_fmeasure_stderr": 0.002473522166982443, "rouge1_precision": 0.13263242230509506, "rouge1_precision_stderr": 0.0018520825040276166, "rouge1_recall": 0.3254090814037424, "rouge1_recall_stderr": 0.004152382484060741, "rouge2_fmeasure": 0.0402884158203053, "rouge2_fmeasure_stderr": 0.0014356830765523726, "rouge2_precision": 0.028392395062709016, "rouge2_precision_stderr": 0.0010172043872722577, "rouge2_recall": 0.07221536214104553, "rouge2_recall_stderr": 0.0026117766579513814, "rougeL_fmeasure": 0.14521474180810057, "rougeL_fmeasure_stderr": 0.0018533757290429948, "rougeL_precision": 0.10316577690192445, "rougeL_precision_stderr": 0.0013718034489219495, "rougeL_recall": 0.2554918983982777, "rougeL_recall_stderr": 0.003218687837696152, "rougeLsum_fmeasure": 0.14919756084049868, "rougeLsum_fmeasure_stderr": 0.002062513276092944, "rougeLsum_precision": 0.10599521523063213, "rougeLsum_precision_stderr": 0.0015218989277518463, "rougeLsum_recall": 0.2625681470613011, "rougeLsum_recall_stderr": 0.003597030470005279}}, "2": {"article_DOC_summary": {"bleu": 1.6762842895764352, "bleu_stderr": 0.0791926134566303, "rouge1_fmeasure": 0.18953795656968836, "rouge1_fmeasure_stderr": 0.002432292652997283, "rouge1_precision": 0.13538804105400676, "rouge1_precision_stderr": 0.0018293632886803941, "rouge1_recall": 0.3302325861232888, "rouge1_recall_stderr": 0.0042380934010501185, "rouge2_fmeasure": 0.04250905212911774, "rouge2_fmeasure_stderr": 0.001489153203301286, "rouge2_precision": 0.029962800938098572, "rouge2_precision_stderr": 0.0010534096947695541, "rouge2_recall": 0.07683747490684736, "rouge2_recall_stderr": 0.0028124212896749722, "rougeL_fmeasure": 0.150446942473803, "rougeL_fmeasure_stderr": 0.0018477627122504869, "rougeL_precision": 0.1072695052343289, "rougeL_precision_stderr": 0.0013743282170330293, "rougeL_recall": 0.2635615604235294, "rougeL_recall_stderr": 0.0033637530249115495, "rougeLsum_fmeasure": 0.14951703911062328, "rougeLsum_fmeasure_stderr": 0.0020292384708233196, "rougeLsum_precision": 0.10641741696830354, "rougeLsum_precision_stderr": 0.001487583204435948, "rougeLsum_recall": 0.26292280913745725, "rougeLsum_recall_stderr": 0.003726405564135895}}, "3": {"article_DOC_summary": {"bleu": 1.7308630541864396, "bleu_stderr": 0.08778732229137869, "rouge1_fmeasure": 0.18459222002003098, "rouge1_fmeasure_stderr": 0.0027511828148869526, "rouge1_precision": 0.13995034823105182, "rouge1_precision_stderr": 0.0024260078328372124, "rouge1_recall": 0.3040476296806973, "rouge1_recall_stderr": 0.00446777393978941, "rouge2_fmeasure": 0.04273954336339969, "rouge2_fmeasure_stderr": 0.0015070002894092183, "rouge2_precision": 0.031700084263988036, "rouge2_precision_stderr": 0.0011622600202074865, "rouge2_recall": 0.07302117867885434, "rouge2_recall_stderr": 0.0026515753289958746, "rougeL_fmeasure": 0.14848775504028594, "rougeL_fmeasure_stderr": 0.0021627004910264496, "rougeL_precision": 0.11185866851166562, "rougeL_precision_stderr": 0.0018488632017068527, "rougeL_recall": 0.2465359323519087, "rougeL_recall_stderr": 0.0036397000597042954, "rougeLsum_fmeasure": 0.14446258726311614, "rougeLsum_fmeasure_stderr": 0.0022415522283490545, "rougeLsum_precision": 0.10917649093837714, "rougeLsum_precision_stderr": 0.001929790524784196, "rougeLsum_recall": 0.23984547232610806, "rougeLsum_recall_stderr": 0.0037774696922394497}}, "4": {"article_DOC_summary": {"bleu": 0.5738384774948022, "bleu_stderr": 0.05603875019319245, "rouge1_fmeasure": 0.05094176319365546, "rouge1_fmeasure_stderr": 0.002882647234702002, "rouge1_precision": 0.046138251522645654, "rouge1_precision_stderr": 0.0028937716323574583, "rouge1_recall": 0.07367464652619297, "rouge1_recall_stderr": 0.004126545243784722, "rouge2_fmeasure": 0.010775980130208754, "rouge2_fmeasure_stderr": 0.0009408820942311892, "rouge2_precision": 0.009258127688613489, "rouge2_precision_stderr": 0.0008866577886039543, "rouge2_recall": 0.015509633996620949, "rouge2_recall_stderr": 0.0013241742875245073, "rougeL_fmeasure": 0.04049131749896121, "rougeL_fmeasure_stderr": 0.0022591085239586873, "rougeL_precision": 0.03689744588577719, "rougeL_precision_stderr": 0.0023273437354799104, "rougeL_recall": 0.05909059170937521, "rougeL_recall_stderr": 0.0033193012154986838, "rougeLsum_fmeasure": 0.03971916742116221, "rougeLsum_fmeasure_stderr": 0.002257663029431442, "rougeLsum_precision": 0.03639698892402911, "rougeLsum_precision_stderr": 0.0023439318335337477, "rougeLsum_recall": 0.05773883087379689, "rougeLsum_recall_stderr": 0.0032861038296946314}}, "5": {"article_DOC_summary": {"bleu": 4.166211075601866e-37, "bleu_stderr": 1.716028525004054e-32, "rouge1_fmeasure": 0.002731053639815148, "rouge1_fmeasure_stderr": 0.0007782335896411102, "rouge1_precision": 0.0031000607790285925, "rouge1_precision_stderr": 0.0009192158828809469, "rouge1_recall": 0.0025343349377899326, "rouge1_recall_stderr": 0.000716465136061307, "rouge2_fmeasure": 0.0003317630778664413, "rouge2_fmeasure_stderr": 0.00021829498201476416, "rouge2_precision": 0.0004180960548885077, "rouge2_precision_stderr": 0.0002916918368087507, "rouge2_recall": 0.00028444825614636933, "rouge2_recall_stderr": 0.00018182421707992435, "rougeL_fmeasure": 0.002019007248509181, "rougeL_fmeasure_stderr": 0.0005504745008200219, "rougeL_precision": 0.0022354310506363783, "rougeL_precision_stderr": 0.0006041902919239048, "rougeL_recall": 0.0019147454695116499, "rougeL_recall_stderr": 0.0005366627834143417, "rougeLsum_fmeasure": 0.0022517933303518667, "rougeLsum_fmeasure_stderr": 0.0006473059361227687, "rougeLsum_precision": 0.0025381250270262476, "rougeLsum_precision_stderr": 0.0007465918244299208, "rougeLsum_recall": 0.0021073593748461884, "rougeLsum_recall_stderr": 0.000609805170315193}}}}