{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.3463387125507984, "bleu_stderr": 0.03871898741816671, "rouge1_fmeasure": 0.10952539068797028, "rouge1_fmeasure_stderr": 0.0019907747077539725, "rouge1_precision": 0.07211255715607569, "rouge1_precision_stderr": 0.001551406165163628, "rouge1_recall": 0.2996849092736172, "rouge1_recall_stderr": 0.004583023786340968, "rouge2_fmeasure": 0.05201678241725894, "rouge2_fmeasure_stderr": 0.0012570598168046025, "rouge2_precision": 0.03381420888180137, "rouge2_precision_stderr": 0.0008950985117036589, "rouge2_recall": 0.14844147775806338, "rouge2_recall_stderr": 0.0032200950902031658, "rougeL_fmeasure": 0.10599044553263734, "rougeL_fmeasure_stderr": 0.001858626781810144, "rougeL_precision": 0.06953968025004763, "rougeL_precision_stderr": 0.0014395600092792235, "rougeL_recall": 0.2927861422575508, "rougeL_recall_stderr": 0.004486869628532065, "rougeLsum_fmeasure": 0.10494341774143819, "rougeLsum_fmeasure_stderr": 0.0018712967363079748, "rougeLsum_precision": 0.06905492701097961, "rougeLsum_precision_stderr": 0.0014675622764115906, "rougeLsum_recall": 0.28799521128404415, "rougeLsum_recall_stderr": 0.004338230779660113}}, "1": {"PALM_prompt": {"bleu": 0.49152208622242877, "bleu_stderr": 0.04139408950745415, "rouge1_fmeasure": 0.11542248804126877, "rouge1_fmeasure_stderr": 0.001852315570556662, "rouge1_precision": 0.07373625415642708, "rouge1_precision_stderr": 0.0013444564112333292, "rouge1_recall": 0.3753665468025263, "rouge1_recall_stderr": 0.00536016010380475, "rouge2_fmeasure": 0.05396039097370975, "rouge2_fmeasure_stderr": 0.0011621890988087783, "rouge2_precision": 0.03437112478262944, "rouge2_precision_stderr": 0.0008158271460114628, "rouge2_recall": 0.1839462343866126, "rouge2_recall_stderr": 0.003709671721946962, "rougeL_fmeasure": 0.1080526825836882, "rougeL_fmeasure_stderr": 0.0016391879678756425, "rougeL_precision": 0.06891381858838289, "rougeL_precision_stderr": 0.00117848640155061, "rougeL_recall": 0.3513896637107432, "rougeL_recall_stderr": 0.004856217872136033, "rougeLsum_fmeasure": 0.10983109806282532, "rougeLsum_fmeasure_stderr": 0.0017465824716290605, "rougeLsum_precision": 0.07022268782208652, "rougeLsum_precision_stderr": 0.0012677785220343175, "rougeLsum_recall": 0.3548574219712635, "rougeLsum_recall_stderr": 0.004914558194954389}}, "2": {"PALM_prompt": {"bleu": 0.5036165898830023, "bleu_stderr": 0.03163382931247645, "rouge1_fmeasure": 0.11611735091169018, "rouge1_fmeasure_stderr": 0.0016856649398913782, "rouge1_precision": 0.07345117313274237, "rouge1_precision_stderr": 0.0012208182117261878, "rouge1_recall": 0.3941081050839388, "rouge1_recall_stderr": 0.005139991780948632, "rouge2_fmeasure": 0.0542677230188957, "rouge2_fmeasure_stderr": 0.001076889081745943, "rouge2_precision": 0.03416030472845622, "rouge2_precision_stderr": 0.0007497324529078045, "rouge2_recall": 0.1960695205229479, "rouge2_recall_stderr": 0.00374456566803786, "rougeL_fmeasure": 0.10822818662084129, "rougeL_fmeasure_stderr": 0.0015080010309372358, "rougeL_precision": 0.06848596200566257, "rougeL_precision_stderr": 0.001088456262302762, "rougeL_recall": 0.3641445841455221, "rougeL_recall_stderr": 0.004555374452263096, "rougeLsum_fmeasure": 0.11045227449849929, "rougeLsum_fmeasure_stderr": 0.0015880076943480838, "rougeLsum_precision": 0.06991710191369618, "rougeLsum_precision_stderr": 0.00115124520295404, "rougeLsum_recall": 0.37308280267746685, "rougeLsum_recall_stderr": 0.004752608689239747}}, "3": {"PALM_prompt": {"bleu": 0.6498113531541159, "bleu_stderr": 0.044359939496823625, "rouge1_fmeasure": 0.11670639827568505, "rouge1_fmeasure_stderr": 0.0017228506693859023, "rouge1_precision": 0.07362728433969368, "rouge1_precision_stderr": 0.0012506969519923664, "rouge1_recall": 0.40433747874257164, "rouge1_recall_stderr": 0.00532349382454595, "rouge2_fmeasure": 0.055174784608656414, "rouge2_fmeasure_stderr": 0.001103480731304987, "rouge2_precision": 0.03462285279213432, "rouge2_precision_stderr": 0.0007700688556812641, "rouge2_recall": 0.20446580518938245, "rouge2_recall_stderr": 0.0038704073812126957, "rougeL_fmeasure": 0.10780699471813608, "rougeL_fmeasure_stderr": 0.0015196469475095016, "rougeL_precision": 0.06807883372554288, "rougeL_precision_stderr": 0.0011054577780329877, "rougeL_recall": 0.369498755496309, "rougeL_recall_stderr": 0.004606643368535042, "rougeLsum_fmeasure": 0.11062957727513113, "rougeLsum_fmeasure_stderr": 0.0016229376323127634, "rougeLsum_precision": 0.06987690204692998, "rougeLsum_precision_stderr": 0.001181829372472824, "rougeLsum_recall": 0.38020527679899335, "rougeLsum_recall_stderr": 0.004841997364585111}}, "4": {"PALM_prompt": {"bleu": 0.6676812083161542, "bleu_stderr": 0.04984003951128037, "rouge1_fmeasure": 0.11795519287394977, "rouge1_fmeasure_stderr": 0.001663656872341927, "rouge1_precision": 0.07419859091894718, "rouge1_precision_stderr": 0.0012073720133260548, "rouge1_recall": 0.4115156265704582, "rouge1_recall_stderr": 0.005279248235847037, "rouge2_fmeasure": 0.05617955897318711, "rouge2_fmeasure_stderr": 0.001072962808033341, "rouge2_precision": 0.03509931891578484, "rouge2_precision_stderr": 0.0007461921191218064, "rouge2_recall": 0.21194614881093146, "rouge2_recall_stderr": 0.003942396709196514, "rougeL_fmeasure": 0.10867138834194551, "rougeL_fmeasure_stderr": 0.0014576101979114201, "rougeL_precision": 0.0683956812460672, "rougeL_precision_stderr": 0.0010554662078452836, "rougeL_recall": 0.37604842524473375, "rougeL_recall_stderr": 0.004602132355576208, "rougeLsum_fmeasure": 0.11206081323499055, "rougeLsum_fmeasure_stderr": 0.001572212563142291, "rougeLsum_precision": 0.07053184039179991, "rougeLsum_precision_stderr": 0.0011422521869853676, "rougeLsum_recall": 0.3893450058485989, "rougeLsum_recall_stderr": 0.004865697961495776}}, "5": {"PALM_prompt": {"bleu": 0.7710974467285127, "bleu_stderr": 0.05203704839844347, "rouge1_fmeasure": 0.11877703066041605, "rouge1_fmeasure_stderr": 0.0016491364267747024, "rouge1_precision": 0.07425806182657936, "rouge1_precision_stderr": 0.0011956495019689597, "rouge1_recall": 0.42780274108203253, "rouge1_recall_stderr": 0.005406944243614746, "rouge2_fmeasure": 0.05625150089671772, "rouge2_fmeasure_stderr": 0.0010511709925049085, "rouge2_precision": 0.03492035728514057, "rouge2_precision_stderr": 0.000728989115137721, "rouge2_recall": 0.22003827942872525, "rouge2_recall_stderr": 0.004025013823319427, "rougeL_fmeasure": 0.10772149028740496, "rougeL_fmeasure_stderr": 0.0014157977593889726, "rougeL_precision": 0.06747232289163295, "rougeL_precision_stderr": 0.001034208622107367, "rougeL_recall": 0.3846963659749557, "rougeL_recall_stderr": 0.004603801517001138, "rougeLsum_fmeasure": 0.11204458204469926, "rougeLsum_fmeasure_stderr": 0.0015584717483504628, "rougeLsum_precision": 0.07017346453232838, "rougeLsum_precision_stderr": 0.001136713184580948, "rougeLsum_recall": 0.40087756811378206, "rougeLsum_recall_stderr": 0.004939981502609751}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.7317879218324492, "bleu_stderr": 0.06258434310865753, "rouge1_fmeasure": 0.18179483366438334, "rouge1_fmeasure_stderr": 0.001918528213130623, "rouge1_precision": 0.15426863660325024, "rouge1_precision_stderr": 0.0019390767016899475, "rouge1_recall": 0.26616584906943935, "rouge1_recall_stderr": 0.002800247123213755, "rouge2_fmeasure": 0.03857873002486118, "rouge2_fmeasure_stderr": 0.0008912625012118423, "rouge2_precision": 0.032398604164030766, "rouge2_precision_stderr": 0.0007853568426710733, "rouge2_recall": 0.059178979799423694, "rouge2_recall_stderr": 0.0015378959605561995, "rougeL_fmeasure": 0.14062571654868716, "rougeL_fmeasure_stderr": 0.0013664451991987955, "rougeL_precision": 0.1178409029648999, "rougeL_precision_stderr": 0.00134426120796486, "rougeL_recall": 0.21156320512029583, "rougeL_recall_stderr": 0.002302858626762558, "rougeLsum_fmeasure": 0.1667428911480839, "rougeLsum_fmeasure_stderr": 0.0017491099585958065, "rougeLsum_precision": 0.14121341341165533, "rougeLsum_precision_stderr": 0.0017607776877685353, "rougeLsum_recall": 0.24535304568196398, "rougeLsum_recall_stderr": 0.0026196185425979572}}, "1": {"tldr_en": {"bleu": 3.078946318578733, "bleu_stderr": 0.037508376634953426, "rouge1_fmeasure": 0.22615743170046998, "rouge1_fmeasure_stderr": 0.0019675759971617946, "rouge1_precision": 0.2097374056236598, "rouge1_precision_stderr": 0.002558792591642619, "rouge1_recall": 0.31993230192333455, "rouge1_recall_stderr": 0.002912578847069188, "rouge2_fmeasure": 0.05788753426578909, "rouge2_fmeasure_stderr": 0.0011036642735696503, "rouge2_precision": 0.05460829335196789, "rouge2_precision_stderr": 0.0013104520035504465, "rouge2_recall": 0.08436597375871419, "rouge2_recall_stderr": 0.0018136264810112849, "rougeL_fmeasure": 0.16096845678834487, "rougeL_fmeasure_stderr": 0.0013344427734486718, "rougeL_precision": 0.14966153212559197, "rougeL_precision_stderr": 0.0019100435840523184, "rougeL_recall": 0.23314632888007986, "rougeL_recall_stderr": 0.002308314606066584, "rougeLsum_fmeasure": 0.21248946284679468, "rougeLsum_fmeasure_stderr": 0.001850444919705845, "rougeLsum_precision": 0.1969300454898004, "rougeLsum_precision_stderr": 0.002419281823679596, "rougeLsum_recall": 0.3015516742807266, "rougeLsum_recall_stderr": 0.0027852344656345953}}, "2": {"tldr_en": {"bleu": 3.331365912474371, "bleu_stderr": 0.03901431585240638, "rouge1_fmeasure": 0.22500809081344597, "rouge1_fmeasure_stderr": 0.0019395777660833832, "rouge1_precision": 0.2249179940170448, "rouge1_precision_stderr": 0.002953091033379103, "rouge1_recall": 0.30791265980488064, "rouge1_recall_stderr": 0.0028052680018540153, "rouge2_fmeasure": 0.058940718015282535, "rouge2_fmeasure_stderr": 0.0011427794692985003, "rouge2_precision": 0.06082816124882105, "rouge2_precision_stderr": 0.0015517487698999066, "rouge2_recall": 0.08191649217784704, "rouge2_recall_stderr": 0.0017207233219242591, "rougeL_fmeasure": 0.1629946491305722, "rougeL_fmeasure_stderr": 0.001412842903446524, "rougeL_precision": 0.1651950475417842, "rougeL_precision_stderr": 0.0023849745375518774, "rougeL_recall": 0.22637843422800283, "rougeL_recall_stderr": 0.002257218203318618, "rougeLsum_fmeasure": 0.21287275166909125, "rougeLsum_fmeasure_stderr": 0.001828524451639913, "rougeLsum_precision": 0.21271781118896244, "rougeLsum_precision_stderr": 0.0027972927699949795, "rougeLsum_recall": 0.29203959550294045, "rougeLsum_recall_stderr": 0.002679740707668158}}, "3": {"tldr_en": {"bleu": 3.4654459013677066, "bleu_stderr": 0.09533106520935124, "rouge1_fmeasure": 0.1828984280612045, "rouge1_fmeasure_stderr": 0.00233789023320496, "rouge1_precision": 0.1984883398198494, "rouge1_precision_stderr": 0.003387900153458854, "rouge1_recall": 0.2444675402553931, "rouge1_recall_stderr": 0.003332060879697036, "rouge2_fmeasure": 0.048423081518600516, "rouge2_fmeasure_stderr": 0.0011278965656492843, "rouge2_precision": 0.05494653639366956, "rouge2_precision_stderr": 0.00172026049377679, "rouge2_recall": 0.06573981524186268, "rouge2_recall_stderr": 0.001646361012922936, "rougeL_fmeasure": 0.13482403873394622, "rougeL_fmeasure_stderr": 0.0017315326993232382, "rougeL_precision": 0.14973545109772782, "rougeL_precision_stderr": 0.002771115067407858, "rougeL_recall": 0.1820828761022503, "rougeL_recall_stderr": 0.002594908370622835, "rougeLsum_fmeasure": 0.1727178547993039, "rougeLsum_fmeasure_stderr": 0.0022030460306759693, "rougeLsum_precision": 0.1876688685476534, "rougeLsum_precision_stderr": 0.003222108012150837, "rougeLsum_recall": 0.23146444735253652, "rougeLsum_recall_stderr": 0.003170383006624478}}, "4": {"tldr_en": {"bleu": 0.5096514625512257, "bleu_stderr": 0.04746911438860582, "rouge1_fmeasure": 0.057249298351433005, "rouge1_fmeasure_stderr": 0.001981710879314234, "rouge1_precision": 0.06373323883393266, "rouge1_precision_stderr": 0.0025948109156841556, "rouge1_recall": 0.07974114305386926, "rouge1_recall_stderr": 0.002852169393376925, "rouge2_fmeasure": 0.014679683423748945, "rouge2_fmeasure_stderr": 0.0007250006064285315, "rouge2_precision": 0.017183606562936146, "rouge2_precision_stderr": 0.001165303674699654, "rouge2_recall": 0.021451383479229473, "rouge2_recall_stderr": 0.00115814797861179, "rougeL_fmeasure": 0.04339902158323832, "rougeL_fmeasure_stderr": 0.0014931210623861644, "rougeL_precision": 0.049676263167134256, "rougeL_precision_stderr": 0.0021317796688731104, "rougeL_recall": 0.061127221909033094, "rougeL_recall_stderr": 0.0022295833532602533, "rougeLsum_fmeasure": 0.05356492994210666, "rougeLsum_fmeasure_stderr": 0.0018539473478258858, "rougeLsum_precision": 0.059918160107108445, "rougeLsum_precision_stderr": 0.002458251392796141, "rougeLsum_recall": 0.07475299437390277, "rougeLsum_recall_stderr": 0.0026852062028548873}}, "5": {"tldr_en": {"bleu": 2.4367817796838913e-07, "bleu_stderr": 5.931740679366216e-07, "rouge1_fmeasure": 0.009381663500620675, "rouge1_fmeasure_stderr": 0.0009033228148794374, "rouge1_precision": 0.00974635222327858, "rouge1_precision_stderr": 0.0010426157804008867, "rouge1_recall": 0.013305767376845547, "rouge1_recall_stderr": 0.001294486365694067, "rouge2_fmeasure": 0.002426218955168773, "rouge2_fmeasure_stderr": 0.00032099513562133, "rouge2_precision": 0.0027541706176161013, "rouge2_precision_stderr": 0.0004991531053543725, "rouge2_recall": 0.0034881657779112446, "rouge2_recall_stderr": 0.0004828260114230198, "rougeL_fmeasure": 0.007132684824681642, "rougeL_fmeasure_stderr": 0.0006849988631397933, "rougeL_precision": 0.007558937884226414, "rougeL_precision_stderr": 0.0008514792129217634, "rougeL_recall": 0.010297022985567691, "rougeL_recall_stderr": 0.0010209752122782392, "rougeLsum_fmeasure": 0.008824412648201954, "rougeLsum_fmeasure_stderr": 0.0008523533756253951, "rougeLsum_precision": 0.00925164902439946, "rougeLsum_precision_stderr": 0.001003429166331945, "rougeLsum_recall": 0.012522528933544396, "rougeLsum_recall_stderr": 0.0012265948088620682}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 1.4674593008700727, "bleu_stderr": 0.07690373053792376, "rouge1_fmeasure": 0.06377803506212068, "rouge1_fmeasure_stderr": 0.001672122677396593, "rouge1_precision": 0.05683753991737235, "rouge1_precision_stderr": 0.0014560506575201325, "rouge1_recall": 0.08937391024861521, "rouge1_recall_stderr": 0.002366915901253559, "rouge2_fmeasure": 0.015238638354519577, "rouge2_fmeasure_stderr": 0.0007071169872858592, "rouge2_precision": 0.012214590726895359, "rouge2_precision_stderr": 0.0005743247716736654, "rouge2_recall": 0.021379218732414145, "rouge2_recall_stderr": 0.0009966104546792834, "rougeL_fmeasure": 0.059880641876164487, "rougeL_fmeasure_stderr": 0.0014895688210922907, "rougeL_precision": 0.05347894988195794, "rougeL_precision_stderr": 0.0013049823564136975, "rougeL_recall": 0.08437384990508254, "rougeL_recall_stderr": 0.0021538312776559535, "rougeLsum_fmeasure": 0.057561121270217515, "rougeLsum_fmeasure_stderr": 0.0014995174600948955, "rougeLsum_precision": 0.05199652967109443, "rougeLsum_precision_stderr": 0.001336335232731129, "rougeLsum_recall": 0.08011650518165435, "rougeLsum_recall_stderr": 0.0021036901960562}}, "1": {"generate_text_restaurant": {"bleu": 11.256639255609565, "bleu_stderr": 0.13909119146023038, "rouge1_fmeasure": 0.43826153885312474, "rouge1_fmeasure_stderr": 0.0023680361634807615, "rouge1_precision": 0.5241369762469382, "rouge1_precision_stderr": 0.0032402613188758484, "rouge1_recall": 0.4154073794853628, "rouge1_recall_stderr": 0.0029811452241909936, "rouge2_fmeasure": 0.20120573159323082, "rouge2_fmeasure_stderr": 0.0019466830589320579, "rouge2_precision": 0.24440729108549972, "rouge2_precision_stderr": 0.0025713353876726987, "rouge2_recall": 0.1903569141394937, "rouge2_recall_stderr": 0.002085369890907639, "rougeL_fmeasure": 0.31512942959617346, "rougeL_fmeasure_stderr": 0.0020245073951865498, "rougeL_precision": 0.3797441094381383, "rougeL_precision_stderr": 0.002849422577384458, "rougeL_recall": 0.2977661478395331, "rougeL_recall_stderr": 0.0023832352149522175, "rougeLsum_fmeasure": 0.35586936216582027, "rougeLsum_fmeasure_stderr": 0.002288936359442796, "rougeLsum_precision": 0.4269573872984081, "rougeLsum_precision_stderr": 0.003094947485413177, "rougeLsum_recall": 0.33674441043750625, "rougeLsum_recall_stderr": 0.00269773822444997}}, "2": {"generate_text_restaurant": {"bleu": 13.376126264980714, "bleu_stderr": 0.2423138700015996, "rouge1_fmeasure": 0.47582339525157197, "rouge1_fmeasure_stderr": 0.0022765247887398116, "rouge1_precision": 0.5586896631262273, "rouge1_precision_stderr": 0.0032542273894082263, "rouge1_recall": 0.4534492320208494, "rouge1_recall_stderr": 0.0029116157123098745, "rouge2_fmeasure": 0.23204546503817813, "rouge2_fmeasure_stderr": 0.002046713809774589, "rouge2_precision": 0.27694841097623996, "rouge2_precision_stderr": 0.002758389324353955, "rouge2_recall": 0.2206909261465891, "rouge2_recall_stderr": 0.0021891415728379693, "rougeL_fmeasure": 0.34446258237680916, "rougeL_fmeasure_stderr": 0.0020760578430186376, "rougeL_precision": 0.40753042690914904, "rougeL_precision_stderr": 0.002988569615037221, "rougeL_recall": 0.3271426648953936, "rougeL_recall_stderr": 0.002412434421850288, "rougeLsum_fmeasure": 0.39054726501758946, "rougeLsum_fmeasure_stderr": 0.002301771792227363, "rougeLsum_precision": 0.4602485572678633, "rougeLsum_precision_stderr": 0.003204122515744201, "rougeLsum_recall": 0.3712619134780482, "rougeLsum_recall_stderr": 0.0026876195742092054}}, "3": {"generate_text_restaurant": {"bleu": 14.093165522897872, "bleu_stderr": 0.21216386354546166, "rouge1_fmeasure": 0.4785676515677228, "rouge1_fmeasure_stderr": 0.0022234504082830633, "rouge1_precision": 0.5387233761250629, "rouge1_precision_stderr": 0.0031864759527455624, "rouge1_recall": 0.4726895100996329, "rouge1_recall_stderr": 0.002899854544961585, "rouge2_fmeasure": 0.23558342825678338, "rouge2_fmeasure_stderr": 0.002030621156209231, "rouge2_precision": 0.2685393636176561, "rouge2_precision_stderr": 0.0026170967343239477, "rouge2_recall": 0.23277587897646693, "rouge2_recall_stderr": 0.0022527763377626336, "rougeL_fmeasure": 0.34641516486003826, "rougeL_fmeasure_stderr": 0.0020831944107613303, "rougeL_precision": 0.39161805848668024, "rougeL_precision_stderr": 0.002876699759638117, "rougeL_recall": 0.34175514874890695, "rougeL_recall_stderr": 0.0024862399492205957, "rougeLsum_fmeasure": 0.3965640250353348, "rougeLsum_fmeasure_stderr": 0.0022751928578861502, "rougeLsum_precision": 0.44704833712523245, "rougeLsum_precision_stderr": 0.003092169155791799, "rougeLsum_recall": 0.3913487563855888, "rougeLsum_recall_stderr": 0.0027430209943532587}}, "4": {"generate_text_restaurant": {"bleu": 13.01877522701202, "bleu_stderr": 0.1634606411416184, "rouge1_fmeasure": 0.47017887879088466, "rouge1_fmeasure_stderr": 0.00215775715520141, "rouge1_precision": 0.4967367435501768, "rouge1_precision_stderr": 0.002997180519517344, "rouge1_recall": 0.48986433299719573, "rouge1_recall_stderr": 0.0028919527625229664, "rouge2_fmeasure": 0.2285190900484798, "rouge2_fmeasure_stderr": 0.001968236514909628, "rouge2_precision": 0.24350630882815852, "rouge2_precision_stderr": 0.002422719426969184, "rouge2_recall": 0.2387594057692899, "rouge2_recall_stderr": 0.0022672859667634986, "rougeL_fmeasure": 0.3311043111563345, "rougeL_fmeasure_stderr": 0.001975651372330419, "rougeL_precision": 0.3508199102140834, "rougeL_precision_stderr": 0.002597964369996749, "rougeL_recall": 0.34517696947416515, "rougeL_recall_stderr": 0.0024767421656897485, "rougeLsum_fmeasure": 0.3879654204025311, "rougeLsum_fmeasure_stderr": 0.00222102600090257, "rougeLsum_precision": 0.4096834114721446, "rougeLsum_precision_stderr": 0.0028584575443569072, "rougeLsum_recall": 0.4045460483730194, "rougeLsum_recall_stderr": 0.002787010565242438}}, "5": {"generate_text_restaurant": {"bleu": 11.738533814250154, "bleu_stderr": 0.20692029359403782, "rouge1_fmeasure": 0.4579176439966838, "rouge1_fmeasure_stderr": 0.0019838649103218315, "rouge1_precision": 0.4557324007548413, "rouge1_precision_stderr": 0.0026141133736043063, "rouge1_recall": 0.5008190200746241, "rouge1_recall_stderr": 0.0027912701451645113, "rouge2_fmeasure": 0.21699681614941907, "rouge2_fmeasure_stderr": 0.0018260134934355917, "rouge2_precision": 0.21649241809836905, "rouge2_precision_stderr": 0.0020808047468387015, "rouge2_recall": 0.23946332773224333, "rouge2_recall_stderr": 0.0022622492821207474, "rougeL_fmeasure": 0.3204737144833669, "rougeL_fmeasure_stderr": 0.0018416039122686005, "rougeL_precision": 0.31896738977233224, "rougeL_precision_stderr": 0.002249879972490852, "rougeL_recall": 0.3516931047967278, "rougeL_recall_stderr": 0.0024669281840779384, "rougeLsum_fmeasure": 0.38110492282903374, "rougeLsum_fmeasure_stderr": 0.0020518013347156708, "rougeLsum_precision": 0.3790705627204969, "rougeLsum_precision_stderr": 0.0024962460456464603, "rougeLsum_recall": 0.4171792042608784, "rougeLsum_recall_stderr": 0.0027157128707540365}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 2.2151365071026334, "bleu_stderr": 0.10551243625041298, "rouge1_fmeasure": 0.2173222672616331, "rouge1_fmeasure_stderr": 0.0026735963951633086, "rouge1_precision": 0.17320559498489507, "rouge1_precision_stderr": 0.0025525024097035748, "rouge1_recall": 0.33568511811329627, "rouge1_recall_stderr": 0.004457272030335943, "rouge2_fmeasure": 0.05119317937818865, "rouge2_fmeasure_stderr": 0.0016915277669349944, "rouge2_precision": 0.03984347722138949, "rouge2_precision_stderr": 0.0014498730660041778, "rouge2_recall": 0.08293611853648174, "rouge2_recall_stderr": 0.0027922604769135967, "rougeL_fmeasure": 0.16413944160730887, "rougeL_fmeasure_stderr": 0.0020492207241516436, "rougeL_precision": 0.1306308027797899, "rougeL_precision_stderr": 0.001979750535716133, "rougeL_recall": 0.25481924486600754, "rougeL_recall_stderr": 0.0034477504419509046, "rougeLsum_fmeasure": 0.17170031392993537, "rougeLsum_fmeasure_stderr": 0.002265881556419863, "rougeLsum_precision": 0.13618964667417757, "rougeLsum_precision_stderr": 0.0020883754136888665, "rougeLsum_recall": 0.2671983620973551, "rougeLsum_recall_stderr": 0.0038518682770408703}}, "1": {"article_DOC_summary": {"bleu": 1.5874448429909755, "bleu_stderr": 0.07657449929611179, "rouge1_fmeasure": 0.18543200867192464, "rouge1_fmeasure_stderr": 0.0024553301715842025, "rouge1_precision": 0.13193321373947423, "rouge1_precision_stderr": 0.0018249214408045705, "rouge1_recall": 0.32491663088067385, "rouge1_recall_stderr": 0.004280533648795701, "rouge2_fmeasure": 0.04099230088578755, "rouge2_fmeasure_stderr": 0.0014846354986486204, "rouge2_precision": 0.02885078338766851, "rouge2_precision_stderr": 0.0010494871344340587, "rouge2_recall": 0.07423283049608298, "rouge2_recall_stderr": 0.0027810291758957346, "rougeL_fmeasure": 0.14626844109613504, "rougeL_fmeasure_stderr": 0.0018773361178004498, "rougeL_precision": 0.10387006177524372, "rougeL_precision_stderr": 0.0013802990359211345, "rougeL_recall": 0.2578619666146113, "rougeL_recall_stderr": 0.003428735324171146, "rougeLsum_fmeasure": 0.1472004999527075, "rougeLsum_fmeasure_stderr": 0.0020688083081768726, "rougeLsum_precision": 0.10445447840702451, "rougeLsum_precision_stderr": 0.001509990224349501, "rougeLsum_recall": 0.2598290086664842, "rougeLsum_recall_stderr": 0.0037495698358454184}}, "2": {"article_DOC_summary": {"bleu": 1.620400084032387, "bleu_stderr": 0.1036187597036037, "rouge1_fmeasure": 0.18753394533546663, "rouge1_fmeasure_stderr": 0.0024632687591213827, "rouge1_precision": 0.13378369552141486, "rouge1_precision_stderr": 0.001828879330748606, "rouge1_recall": 0.32737811206091777, "rouge1_recall_stderr": 0.004306408194620798, "rouge2_fmeasure": 0.04246731521010523, "rouge2_fmeasure_stderr": 0.0014710047875479853, "rouge2_precision": 0.0299925935097244, "rouge2_precision_stderr": 0.0010381433997656876, "rouge2_recall": 0.07593086345843493, "rouge2_recall_stderr": 0.0027442526221015794, "rougeL_fmeasure": 0.14937612301640457, "rougeL_fmeasure_stderr": 0.0018862901936057773, "rougeL_precision": 0.10643964494355733, "rougeL_precision_stderr": 0.0013938532111114862, "rougeL_recall": 0.26198866539949395, "rougeL_recall_stderr": 0.0034185812335638674, "rougeLsum_fmeasure": 0.14706588908674015, "rougeLsum_fmeasure_stderr": 0.0020537944843788485, "rougeLsum_precision": 0.10465900735165316, "rougeLsum_precision_stderr": 0.0014985247658685268, "rougeLsum_recall": 0.25870432987334707, "rougeLsum_recall_stderr": 0.0037543234582558148}}, "3": {"article_DOC_summary": {"bleu": 1.6556986327135799, "bleu_stderr": 0.09408085446538644, "rouge1_fmeasure": 0.181742673631377, "rouge1_fmeasure_stderr": 0.0026996346996907114, "rouge1_precision": 0.1325857147512653, "rouge1_precision_stderr": 0.002104582538451698, "rouge1_recall": 0.310270163693354, "rouge1_recall_stderr": 0.004622235270535744, "rouge2_fmeasure": 0.041996639319967895, "rouge2_fmeasure_stderr": 0.0014924431333982891, "rouge2_precision": 0.030071518934551324, "rouge2_precision_stderr": 0.0010760225740262315, "rouge2_recall": 0.07399993568063115, "rouge2_recall_stderr": 0.0027512935104685335, "rougeL_fmeasure": 0.1455139114170652, "rougeL_fmeasure_stderr": 0.002103135242813012, "rougeL_precision": 0.10572519383258887, "rougeL_precision_stderr": 0.001594887821630211, "rougeL_recall": 0.24999311515441475, "rougeL_recall_stderr": 0.0037295235353239403, "rougeLsum_fmeasure": 0.1443734491656482, "rougeLsum_fmeasure_stderr": 0.002242271836640455, "rougeLsum_precision": 0.10501603221104056, "rougeLsum_precision_stderr": 0.0017119294258030526, "rougeLsum_recall": 0.24836824871710267, "rougeLsum_recall_stderr": 0.003968401031348439}}, "4": {"article_DOC_summary": {"bleu": 0.8787323538547989, "bleu_stderr": 0.09806037997681721, "rouge1_fmeasure": 0.051203664083526064, "rouge1_fmeasure_stderr": 0.002916215578123627, "rouge1_precision": 0.04185793101612411, "rouge1_precision_stderr": 0.0025354871639657332, "rouge1_recall": 0.07960189442566881, "rouge1_recall_stderr": 0.004594099676529609, "rouge2_fmeasure": 0.012145091480254444, "rouge2_fmeasure_stderr": 0.001038605071999789, "rouge2_precision": 0.009545271254314988, "rouge2_precision_stderr": 0.0009027168872299666, "rouge2_recall": 0.019489192736000506, "rouge2_recall_stderr": 0.0016525733661952122, "rougeL_fmeasure": 0.040479741202891835, "rougeL_fmeasure_stderr": 0.0022777830898179745, "rougeL_precision": 0.03331696824804232, "rougeL_precision_stderr": 0.002048247078605598, "rougeL_recall": 0.06320111546579645, "rougeL_recall_stderr": 0.0036120398264049094, "rougeLsum_fmeasure": 0.041001723419299384, "rougeLsum_fmeasure_stderr": 0.0023481586557545764, "rougeLsum_precision": 0.033884182850020796, "rougeLsum_precision_stderr": 0.0021113829994884406, "rougeLsum_recall": 0.0637408678817515, "rougeLsum_recall_stderr": 0.003715585442877857}}, "5": {"article_DOC_summary": {"bleu": 6.480764426251045e-36, "bleu_stderr": 1.6529080147588964e-30, "rouge1_fmeasure": 0.003279934928320664, "rouge1_fmeasure_stderr": 0.0009428534366320934, "rouge1_precision": 0.003661405957465891, "rouge1_precision_stderr": 0.0010410174134967514, "rouge1_recall": 0.003073378808572809, "rouge1_recall_stderr": 0.0008998604189966408, "rouge2_fmeasure": 0.0007405035248494208, "rouge2_fmeasure_stderr": 0.00038311030521319677, "rouge2_precision": 0.0007725002522449804, "rouge2_precision_stderr": 0.0003775496435431225, "rouge2_recall": 0.0007322912012146197, "rouge2_recall_stderr": 0.0003972475356359937, "rougeL_fmeasure": 0.0021896510504014074, "rougeL_fmeasure_stderr": 0.0006251341441438973, "rougeL_precision": 0.002439909640242604, "rougeL_precision_stderr": 0.0006917842321148266, "rougeL_recall": 0.0020657262287064482, "rougeL_recall_stderr": 0.000601437175466453, "rougeLsum_fmeasure": 0.0026863003460885, "rougeLsum_fmeasure_stderr": 0.0007784026207598828, "rougeLsum_precision": 0.0030026261505173824, "rougeLsum_precision_stderr": 0.0008643214712623419, "rougeLsum_recall": 0.002523952641616138, "rougeLsum_recall_stderr": 0.0007458033281437961}}}}