Muennighoff's picture
Add
046a6f8
raw
history blame contribute delete
No virus
28 kB
{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.3467629462258173, "bleu_stderr": 0.02970357160289475, "rouge1_fmeasure": 0.10168995757313223, "rouge1_fmeasure_stderr": 0.002205136296377914, "rouge1_precision": 0.06878822022347678, "rouge1_precision_stderr": 0.0018402243911493595, "rouge1_recall": 0.27232967386093304, "rouge1_recall_stderr": 0.004788240547260121, "rouge2_fmeasure": 0.047987557752268435, "rouge2_fmeasure_stderr": 0.0013365935083590927, "rouge2_precision": 0.032157818821665254, "rouge2_precision_stderr": 0.0010577093145147903, "rouge2_recall": 0.13056520217921638, "rouge2_recall_stderr": 0.003115822594052185, "rougeL_fmeasure": 0.09753239224447119, "rougeL_fmeasure_stderr": 0.002045677987971358, "rougeL_precision": 0.06577945729496877, "rougeL_precision_stderr": 0.0017155698460292435, "rougeL_recall": 0.26369146928376647, "rougeL_recall_stderr": 0.004637827662279574, "rougeLsum_fmeasure": 0.09759642084616944, "rougeLsum_fmeasure_stderr": 0.002085598873406324, "rougeLsum_precision": 0.0660369144272614, "rougeLsum_precision_stderr": 0.0017577996789584932, "rougeLsum_recall": 0.2618058785302665, "rougeLsum_recall_stderr": 0.004567480767611532}}, "1": {"PALM_prompt": {"bleu": 0.5417393419395882, "bleu_stderr": 0.044815454507757216, "rouge1_fmeasure": 0.12113784115181007, "rouge1_fmeasure_stderr": 0.00204351472161063, "rouge1_precision": 0.07838021666667039, "rouge1_precision_stderr": 0.001559180299177493, "rouge1_recall": 0.3755850605619716, "rouge1_recall_stderr": 0.005524724736554615, "rouge2_fmeasure": 0.0570198899318319, "rouge2_fmeasure_stderr": 0.001278985747994651, "rouge2_precision": 0.03690042031780109, "rouge2_precision_stderr": 0.0009597755725437089, "rouge2_recall": 0.18447574372209172, "rouge2_recall_stderr": 0.003749625715974277, "rougeL_fmeasure": 0.11413083233833846, "rougeL_fmeasure_stderr": 0.00182579199474273, "rougeL_precision": 0.07360709733960606, "rougeL_precision_stderr": 0.0013864930506007718, "rougeL_recall": 0.35714638889794165, "rougeL_recall_stderr": 0.005177897601280693, "rougeLsum_fmeasure": 0.11517017027086042, "rougeLsum_fmeasure_stderr": 0.0019117167496261315, "rougeLsum_precision": 0.07455301066982571, "rougeLsum_precision_stderr": 0.0014702009508263548, "rougeLsum_recall": 0.35705351591203466, "rougeLsum_recall_stderr": 0.005124748725370867}}, "2": {"PALM_prompt": {"bleu": 0.6195362524152161, "bleu_stderr": 0.0433066997903282, "rouge1_fmeasure": 0.12722099841869644, "rouge1_fmeasure_stderr": 0.0020051304009439364, "rouge1_precision": 0.08150779213996648, "rouge1_precision_stderr": 0.0014788918897118996, "rouge1_recall": 0.39438157472425567, "rouge1_recall_stderr": 0.0054341417243741336, "rouge2_fmeasure": 0.06064856236396107, "rouge2_fmeasure_stderr": 0.0012642203603085826, "rouge2_precision": 0.038682782799535693, "rouge2_precision_stderr": 0.0009057286857801548, "rouge2_recall": 0.1990947924647244, "rouge2_recall_stderr": 0.00383449080505824, "rougeL_fmeasure": 0.11906444968750551, "rougeL_fmeasure_stderr": 0.0017672699572919628, "rougeL_precision": 0.07608859632960721, "rougeL_precision_stderr": 0.0012909622078597883, "rougeL_recall": 0.37140486765608993, "rougeL_recall_stderr": 0.0049913485027498535, "rougeLsum_fmeasure": 0.12069299340732352, "rougeLsum_fmeasure_stderr": 0.0018626803556984809, "rougeLsum_precision": 0.07730775091885286, "rougeLsum_precision_stderr": 0.001374674060600659, "rougeLsum_recall": 0.3741568135976793, "rougeLsum_recall_stderr": 0.005028121786060987}}, "3": {"PALM_prompt": {"bleu": 0.6651492106144187, "bleu_stderr": 0.03992762768292497, "rouge1_fmeasure": 0.13042770795969455, "rouge1_fmeasure_stderr": 0.0019693711185330702, "rouge1_precision": 0.08305197408599092, "rouge1_precision_stderr": 0.0014375464331781317, "rouge1_recall": 0.41344530788870276, "rouge1_recall_stderr": 0.0054959874852452345, "rouge2_fmeasure": 0.06210979827800543, "rouge2_fmeasure_stderr": 0.001238202910442987, "rouge2_precision": 0.03935700634635547, "rouge2_precision_stderr": 0.0008788463963429873, "rouge2_recall": 0.20918456834004137, "rouge2_recall_stderr": 0.0038122513646778704, "rougeL_fmeasure": 0.12177286572068512, "rougeL_fmeasure_stderr": 0.001731588340217775, "rougeL_precision": 0.07737768321205232, "rougeL_precision_stderr": 0.0012566340597038746, "rougeL_recall": 0.3880088138045564, "rougeL_recall_stderr": 0.005024656689740799, "rougeLsum_fmeasure": 0.1229421986392733, "rougeLsum_fmeasure_stderr": 0.0018122045178229098, "rougeLsum_precision": 0.07831413935386002, "rougeLsum_precision_stderr": 0.0013273507638749266, "rougeLsum_recall": 0.3891854551198864, "rougeLsum_recall_stderr": 0.004973306456143662}}, "4": {"PALM_prompt": {"bleu": 0.6912927008104243, "bleu_stderr": 0.04708951610676302, "rouge1_fmeasure": 0.1320847120906677, "rouge1_fmeasure_stderr": 0.0019403317559554816, "rouge1_precision": 0.0842695948148098, "rouge1_precision_stderr": 0.0014410127187428725, "rouge1_recall": 0.4150737056078972, "rouge1_recall_stderr": 0.005329280847677363, "rouge2_fmeasure": 0.06309490039873673, "rouge2_fmeasure_stderr": 0.0012285556191215666, "rouge2_precision": 0.04005469000020114, "rouge2_precision_stderr": 0.0008847321997082807, "rouge2_recall": 0.2125055267910503, "rouge2_recall_stderr": 0.00386501230544102, "rougeL_fmeasure": 0.1226339582280795, "rougeL_fmeasure_stderr": 0.0016942210740045196, "rougeL_precision": 0.07804896946431904, "rougeL_precision_stderr": 0.001251675917738052, "rougeL_recall": 0.38803923342395225, "rougeL_recall_stderr": 0.0048632521563710535, "rougeLsum_fmeasure": 0.12483654375531031, "rougeLsum_fmeasure_stderr": 0.0017905619741641855, "rougeLsum_precision": 0.07963023585233621, "rougeLsum_precision_stderr": 0.0013354958204871354, "rougeLsum_recall": 0.39318103373651475, "rougeLsum_recall_stderr": 0.004902375078327026}}, "5": {"PALM_prompt": {"bleu": 0.7164241433415443, "bleu_stderr": 0.03468898038675718, "rouge1_fmeasure": 0.13233671042567177, "rouge1_fmeasure_stderr": 0.0019126994396419705, "rouge1_precision": 0.08401315872109257, "rouge1_precision_stderr": 0.0014023651252151289, "rouge1_recall": 0.4237987628433736, "rouge1_recall_stderr": 0.005319284520415636, "rouge2_fmeasure": 0.06277842285044863, "rouge2_fmeasure_stderr": 0.0012115695346373973, "rouge2_precision": 0.0395877176495914, "rouge2_precision_stderr": 0.0008578936363749117, "rouge2_recall": 0.21586520421581895, "rouge2_recall_stderr": 0.0038714581739094592, "rougeL_fmeasure": 0.1219588053350218, "rougeL_fmeasure_stderr": 0.001644273360150485, "rougeL_precision": 0.07729277177448167, "rougeL_precision_stderr": 0.0012081151013118559, "rougeL_recall": 0.39392380455148956, "rougeL_recall_stderr": 0.0048182862776320525, "rougeLsum_fmeasure": 0.12486327130932445, "rougeLsum_fmeasure_stderr": 0.0017601066987214956, "rougeLsum_precision": 0.07928144489756499, "rougeLsum_precision_stderr": 0.0012981371342668502, "rougeLsum_recall": 0.40087962084922146, "rougeLsum_recall_stderr": 0.004904552367490611}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.4210312656847472, "bleu_stderr": 0.060270643720608696, "rouge1_fmeasure": 0.17653069728735207, "rouge1_fmeasure_stderr": 0.0017819912726454782, "rouge1_precision": 0.15061252743056497, "rouge1_precision_stderr": 0.0018348650687593155, "rouge1_recall": 0.256454503266184, "rouge1_recall_stderr": 0.0025452463169892557, "rouge2_fmeasure": 0.03354589374526059, "rouge2_fmeasure_stderr": 0.0008087056282946077, "rouge2_precision": 0.028369222882273205, "rouge2_precision_stderr": 0.0007066540587211176, "rouge2_recall": 0.05008641307901103, "rouge2_recall_stderr": 0.00134215691396269, "rougeL_fmeasure": 0.1377911140506496, "rougeL_fmeasure_stderr": 0.0012669830058260783, "rougeL_precision": 0.11608797101294863, "rougeL_precision_stderr": 0.0012705078508947738, "rougeL_recall": 0.20490213048658962, "rougeL_recall_stderr": 0.0020399289498688185, "rougeLsum_fmeasure": 0.16190034239297366, "rougeLsum_fmeasure_stderr": 0.0016143560219178483, "rougeLsum_precision": 0.13795098287356825, "rougeLsum_precision_stderr": 0.0016647360532169207, "rougeLsum_recall": 0.23598099685826873, "rougeLsum_recall_stderr": 0.002335452933383992}}, "1": {"tldr_en": {"bleu": 2.5844259677574737, "bleu_stderr": 0.060938127857024925, "rouge1_fmeasure": 0.22237786427514242, "rouge1_fmeasure_stderr": 0.0019482055053236735, "rouge1_precision": 0.19156214602392785, "rouge1_precision_stderr": 0.0021369510379202743, "rouge1_recall": 0.32241362924149136, "rouge1_recall_stderr": 0.0028124884724620492, "rouge2_fmeasure": 0.05440677143664293, "rouge2_fmeasure_stderr": 0.0010246128614251008, "rouge2_precision": 0.04682145837635855, "rouge2_precision_stderr": 0.0009902476215161073, "rouge2_recall": 0.08160157667413973, "rouge2_recall_stderr": 0.0017499912589990709, "rougeL_fmeasure": 0.155878968269544, "rougeL_fmeasure_stderr": 0.0012777679642915526, "rougeL_precision": 0.13283623589550608, "rougeL_precision_stderr": 0.0013929466849964527, "rougeL_recall": 0.2320852430342068, "rougeL_recall_stderr": 0.002191740016789271, "rougeLsum_fmeasure": 0.207642407950538, "rougeLsum_fmeasure_stderr": 0.0018053014603110992, "rougeLsum_precision": 0.17867424980926405, "rougeLsum_precision_stderr": 0.0019827351033431455, "rougeLsum_recall": 0.3020497324959359, "rougeLsum_recall_stderr": 0.0026583190853660004}}, "2": {"tldr_en": {"bleu": 2.7330421823571975, "bleu_stderr": 0.05994884184811053, "rouge1_fmeasure": 0.22383767677096728, "rouge1_fmeasure_stderr": 0.0018512996402949512, "rouge1_precision": 0.19849396333378058, "rouge1_precision_stderr": 0.00217880930473335, "rouge1_recall": 0.3198528101524774, "rouge1_recall_stderr": 0.0027518708376480633, "rouge2_fmeasure": 0.05524886451119943, "rouge2_fmeasure_stderr": 0.0010126638954711643, "rouge2_precision": 0.04934256998523157, "rouge2_precision_stderr": 0.0010451599371028265, "rouge2_recall": 0.08127176283096699, "rouge2_recall_stderr": 0.0017102813824312235, "rougeL_fmeasure": 0.15745470072630446, "rougeL_fmeasure_stderr": 0.001253574049933065, "rougeL_precision": 0.138887604964176, "rougeL_precision_stderr": 0.0015142419484140983, "rougeL_recall": 0.23030068542441662, "rougeL_recall_stderr": 0.002186692355755909, "rougeLsum_fmeasure": 0.21015985227741332, "rougeLsum_fmeasure_stderr": 0.00172463768243361, "rougeLsum_precision": 0.18624703148940888, "rougeLsum_precision_stderr": 0.0020468421192427477, "rougeLsum_recall": 0.3013114439049721, "rougeLsum_recall_stderr": 0.002616357765698253}}, "3": {"tldr_en": {"bleu": 2.8290112012146706, "bleu_stderr": 0.05951839122489339, "rouge1_fmeasure": 0.1852182555649124, "rouge1_fmeasure_stderr": 0.002287271359986313, "rouge1_precision": 0.17248122219408474, "rouge1_precision_stderr": 0.002628198982060811, "rouge1_recall": 0.2638796471875207, "rouge1_recall_stderr": 0.0034027530893483465, "rouge2_fmeasure": 0.04567763446412075, "rouge2_fmeasure_stderr": 0.0010289915108698396, "rouge2_precision": 0.04218748111521178, "rouge2_precision_stderr": 0.0011031465249406545, "rouge2_recall": 0.0670929954668809, "rouge2_recall_stderr": 0.0017026172079320436, "rougeL_fmeasure": 0.13133010966101086, "rougeL_fmeasure_stderr": 0.0015897764193778007, "rougeL_precision": 0.12295346030090092, "rougeL_precision_stderr": 0.0019567592451512905, "rougeL_recall": 0.19076774529285573, "rougeL_recall_stderr": 0.002589979675308181, "rougeLsum_fmeasure": 0.17421064673691836, "rougeLsum_fmeasure_stderr": 0.002151537032475058, "rougeLsum_precision": 0.1620648856258479, "rougeLsum_precision_stderr": 0.0024771812577127515, "rougeLsum_recall": 0.24873657023544105, "rougeLsum_recall_stderr": 0.0032321806677604713}}, "4": {"tldr_en": {"bleu": 0.6132507015376946, "bleu_stderr": 0.05397498618101934, "rouge1_fmeasure": 0.05928113069738738, "rouge1_fmeasure_stderr": 0.0019814030720861505, "rouge1_precision": 0.05687980992466601, "rouge1_precision_stderr": 0.002135399553380944, "rouge1_recall": 0.08817602363470518, "rouge1_recall_stderr": 0.0030338376299604442, "rouge2_fmeasure": 0.014105994773694855, "rouge2_fmeasure_stderr": 0.0006690326869559216, "rouge2_precision": 0.012772621686539164, "rouge2_precision_stderr": 0.0006603560652934723, "rouge2_recall": 0.02236367739681952, "rouge2_recall_stderr": 0.0011837465631426769, "rougeL_fmeasure": 0.04316919203763769, "rougeL_fmeasure_stderr": 0.0014271969073492822, "rougeL_precision": 0.04187422720293646, "rougeL_precision_stderr": 0.001622780833042087, "rougeL_recall": 0.06552142962785648, "rougeL_recall_stderr": 0.002313135493815312, "rougeLsum_fmeasure": 0.055629619710077606, "rougeLsum_fmeasure_stderr": 0.0018557175801784927, "rougeLsum_precision": 0.053197083436625686, "rougeLsum_precision_stderr": 0.0019860916804782702, "rougeLsum_recall": 0.08309251098591129, "rougeLsum_recall_stderr": 0.0028748941628762583}}, "5": {"tldr_en": {"bleu": 1.774349780922794e-06, "bleu_stderr": 2.6185834564883983e-06, "rouge1_fmeasure": 0.01019849090383851, "rouge1_fmeasure_stderr": 0.0009502392973365573, "rouge1_precision": 0.009944006650658749, "rouge1_precision_stderr": 0.0010025455254208035, "rouge1_recall": 0.014539537304699115, "rouge1_recall_stderr": 0.0013678920537217771, "rouge2_fmeasure": 0.0027920581048711053, "rouge2_fmeasure_stderr": 0.0003262526064746703, "rouge2_precision": 0.002755589189971845, "rouge2_precision_stderr": 0.0004379750152181389, "rouge2_recall": 0.004253966152589437, "rouge2_recall_stderr": 0.0005366488784059504, "rougeL_fmeasure": 0.007455220141107615, "rougeL_fmeasure_stderr": 0.0006935679633605328, "rougeL_precision": 0.007311450396075794, "rougeL_precision_stderr": 0.0007625817436989474, "rougeL_recall": 0.010903740963770921, "rougeL_recall_stderr": 0.0010467455072106112, "rougeLsum_fmeasure": 0.009635314110130312, "rougeLsum_fmeasure_stderr": 0.0008939064145876629, "rougeLsum_precision": 0.009418418074912453, "rougeLsum_precision_stderr": 0.0009507068948382848, "rougeLsum_recall": 0.013851363629870408, "rougeLsum_recall_stderr": 0.0013115124395592303}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 1.3562210829072388, "bleu_stderr": 0.06363294711119734, "rouge1_fmeasure": 0.12013040778127415, "rouge1_fmeasure_stderr": 0.0017746386859163203, "rouge1_precision": 0.11009512311383156, "rouge1_precision_stderr": 0.0020727913604168193, "rouge1_recall": 0.16243977504759669, "rouge1_recall_stderr": 0.002228768903465126, "rouge2_fmeasure": 0.01952192502751282, "rouge2_fmeasure_stderr": 0.0007045263606140751, "rouge2_precision": 0.016237573503050346, "rouge2_precision_stderr": 0.0005791686929917277, "rouge2_recall": 0.027893395046500822, "rouge2_recall_stderr": 0.001039576769487543, "rougeL_fmeasure": 0.1164630301972042, "rougeL_fmeasure_stderr": 0.0016922702496737136, "rougeL_precision": 0.10534269523932902, "rougeL_precision_stderr": 0.0018942650621943632, "rougeL_recall": 0.1589275088375994, "rougeL_recall_stderr": 0.0021856832752487143, "rougeLsum_fmeasure": 0.1010326136243227, "rougeLsum_fmeasure_stderr": 0.0015162989057978518, "rougeLsum_precision": 0.09138176673759738, "rougeLsum_precision_stderr": 0.0016976459528528838, "rougeLsum_recall": 0.13851750677859065, "rougeLsum_recall_stderr": 0.001981721576730165}}, "1": {"generate_text_restaurant": {"bleu": 10.908750419467065, "bleu_stderr": 0.1153875315765743, "rouge1_fmeasure": 0.4318510329737581, "rouge1_fmeasure_stderr": 0.002423250819689724, "rouge1_precision": 0.5144363803211901, "rouge1_precision_stderr": 0.003364029946676966, "rouge1_recall": 0.4137228068795505, "rouge1_recall_stderr": 0.0030035953453339268, "rouge2_fmeasure": 0.1949067304345254, "rouge2_fmeasure_stderr": 0.001891675195297321, "rouge2_precision": 0.23527684115197875, "rouge2_precision_stderr": 0.0024569912549073252, "rouge2_recall": 0.18651128554977991, "rouge2_recall_stderr": 0.002042569449007174, "rougeL_fmeasure": 0.3076421628030137, "rougeL_fmeasure_stderr": 0.0020211262460051935, "rougeL_precision": 0.36920804381770184, "rougeL_precision_stderr": 0.0028723757205354077, "rougeL_recall": 0.29425760131507245, "rougeL_recall_stderr": 0.002383672145953424, "rougeLsum_fmeasure": 0.34713651369676346, "rougeLsum_fmeasure_stderr": 0.0022926393764313565, "rougeLsum_precision": 0.414855533795446, "rougeLsum_precision_stderr": 0.003125185132516662, "rougeLsum_recall": 0.3320236369114425, "rougeLsum_recall_stderr": 0.002686308288138277}}, "2": {"generate_text_restaurant": {"bleu": 12.425560961298928, "bleu_stderr": 0.16843145386704422, "rouge1_fmeasure": 0.45921716599492257, "rouge1_fmeasure_stderr": 0.002284361054039901, "rouge1_precision": 0.5435495761199652, "rouge1_precision_stderr": 0.0033633572533129526, "rouge1_recall": 0.44219185708552616, "rouge1_recall_stderr": 0.00292267717822634, "rouge2_fmeasure": 0.22033369538829456, "rouge2_fmeasure_stderr": 0.0018920736545353272, "rouge2_precision": 0.2653358395725804, "rouge2_precision_stderr": 0.0025850234460909963, "rouge2_recall": 0.21206583671651486, "rouge2_recall_stderr": 0.002085373413054097, "rougeL_fmeasure": 0.3231355705500899, "rougeL_fmeasure_stderr": 0.001978955011971195, "rougeL_precision": 0.3843321993416038, "rougeL_precision_stderr": 0.002878039104074086, "rougeL_recall": 0.31120337816430665, "rougeL_recall_stderr": 0.0023877325589714915, "rougeLsum_fmeasure": 0.3679358851605252, "rougeLsum_fmeasure_stderr": 0.0022120825656228383, "rougeLsum_precision": 0.4362291530818777, "rougeLsum_precision_stderr": 0.0031299309485586665, "rougeLsum_recall": 0.35428245787963414, "rougeLsum_recall_stderr": 0.0026612537289267993}}, "3": {"generate_text_restaurant": {"bleu": 12.221288385114814, "bleu_stderr": 0.19082268895380647, "rouge1_fmeasure": 0.455166206022795, "rouge1_fmeasure_stderr": 0.002223244735102527, "rouge1_precision": 0.5214139268556559, "rouge1_precision_stderr": 0.0034175211851896997, "rouge1_recall": 0.4572305092055359, "rouge1_recall_stderr": 0.0029026293132885382, "rouge2_fmeasure": 0.22104435685182108, "rouge2_fmeasure_stderr": 0.001862760899413114, "rouge2_precision": 0.25743143640704197, "rouge2_precision_stderr": 0.002555258701398823, "rouge2_recall": 0.22245222231941147, "rouge2_recall_stderr": 0.0021467153010892278, "rougeL_fmeasure": 0.3180868476673524, "rougeL_fmeasure_stderr": 0.001990706335801619, "rougeL_precision": 0.36543621857412, "rougeL_precision_stderr": 0.002896309387223668, "rougeL_recall": 0.32086576136811035, "rougeL_recall_stderr": 0.002496102233183468, "rougeLsum_fmeasure": 0.36359919692230264, "rougeLsum_fmeasure_stderr": 0.0021840977848229704, "rougeLsum_precision": 0.41670685142961694, "rougeLsum_precision_stderr": 0.0031268624160023773, "rougeLsum_recall": 0.36576515899261053, "rougeLsum_recall_stderr": 0.0027165252275173565}}, "4": {"generate_text_restaurant": {"bleu": 11.904071947513604, "bleu_stderr": 0.15041975256207835, "rouge1_fmeasure": 0.44883724359759763, "rouge1_fmeasure_stderr": 0.0021474205192137984, "rouge1_precision": 0.5108040030722113, "rouge1_precision_stderr": 0.0034305316404786837, "rouge1_recall": 0.45509983428195105, "rouge1_recall_stderr": 0.0028400978670404054, "rouge2_fmeasure": 0.21940517221276123, "rouge2_fmeasure_stderr": 0.001839987625193181, "rouge2_precision": 0.25452186027600054, "rouge2_precision_stderr": 0.002593019861818015, "rouge2_recall": 0.2223684457329366, "rouge2_recall_stderr": 0.0020931795571949214, "rougeL_fmeasure": 0.31318384946030303, "rougeL_fmeasure_stderr": 0.001958394522848982, "rougeL_precision": 0.35641993842979697, "rougeL_precision_stderr": 0.002858311870167588, "rougeL_recall": 0.31918812987193673, "rougeL_recall_stderr": 0.002462359664481415, "rougeLsum_fmeasure": 0.3596273970546791, "rougeLsum_fmeasure_stderr": 0.002138488051834353, "rougeLsum_precision": 0.4091932721797993, "rougeLsum_precision_stderr": 0.0031234438953318695, "rougeLsum_recall": 0.3650198785228199, "rougeLsum_recall_stderr": 0.0026634554137160474}}, "5": {"generate_text_restaurant": {"bleu": 11.477221691171614, "bleu_stderr": 0.17452231964837656, "rouge1_fmeasure": 0.44490742452457227, "rouge1_fmeasure_stderr": 0.0020181658108621714, "rouge1_precision": 0.48062887592759473, "rouge1_precision_stderr": 0.003115584089249707, "rouge1_recall": 0.46458395842191347, "rouge1_recall_stderr": 0.0027243347719385098, "rouge2_fmeasure": 0.21402408036134005, "rouge2_fmeasure_stderr": 0.0017335777517730798, "rouge2_precision": 0.2342559795744666, "rouge2_precision_stderr": 0.0023001280246662233, "rouge2_recall": 0.22414454145192106, "rouge2_recall_stderr": 0.002057301424201448, "rougeL_fmeasure": 0.30844290377202477, "rougeL_fmeasure_stderr": 0.001825487934292388, "rougeL_precision": 0.332844249120604, "rougeL_precision_stderr": 0.0025414395166544717, "rougeL_recall": 0.3239788679633895, "rougeL_recall_stderr": 0.002397374612400007, "rougeLsum_fmeasure": 0.360656182266104, "rougeLsum_fmeasure_stderr": 0.0020257067176805616, "rougeLsum_precision": 0.38938087151639184, "rougeLsum_precision_stderr": 0.0028412019801890083, "rougeLsum_recall": 0.3769961983819593, "rougeLsum_recall_stderr": 0.0025939559956521933}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 2.036660647928376, "bleu_stderr": 0.0886671989991428, "rouge1_fmeasure": 0.20872501710774183, "rouge1_fmeasure_stderr": 0.0025765264814385574, "rouge1_precision": 0.16625735855106855, "rouge1_precision_stderr": 0.0024463651813182914, "rouge1_recall": 0.3230884270864929, "rouge1_recall_stderr": 0.004359311826645138, "rouge2_fmeasure": 0.04541415352191168, "rouge2_fmeasure_stderr": 0.0016019047132235528, "rouge2_precision": 0.03520681144190837, "rouge2_precision_stderr": 0.0013363705236252219, "rouge2_recall": 0.07441126206565717, "rouge2_recall_stderr": 0.0027685648685041907, "rougeL_fmeasure": 0.15771639364031548, "rougeL_fmeasure_stderr": 0.001968467651802171, "rougeL_precision": 0.12527352638980324, "rougeL_precision_stderr": 0.0018832520008059408, "rougeL_recall": 0.24649639309519972, "rougeL_recall_stderr": 0.0035131508278542895, "rougeLsum_fmeasure": 0.16106544122061872, "rougeLsum_fmeasure_stderr": 0.002144088469758669, "rougeLsum_precision": 0.12771639136222968, "rougeLsum_precision_stderr": 0.001971864037023057, "rougeLsum_recall": 0.2517880179492348, "rougeLsum_recall_stderr": 0.003783114418327505}}, "1": {"article_DOC_summary": {"bleu": 1.6913128558245667, "bleu_stderr": 0.09521771990115542, "rouge1_fmeasure": 0.18955906449065837, "rouge1_fmeasure_stderr": 0.0025437030392446553, "rouge1_precision": 0.13473651953646212, "rouge1_precision_stderr": 0.0018830579225946448, "rouge1_recall": 0.33263109371075555, "rouge1_recall_stderr": 0.0043737298284748935, "rouge2_fmeasure": 0.04240941625507146, "rouge2_fmeasure_stderr": 0.0015134151293483083, "rouge2_precision": 0.02979980903695056, "rouge2_precision_stderr": 0.0010699057640840117, "rouge2_recall": 0.07661622521673665, "rouge2_recall_stderr": 0.00277147224226074, "rougeL_fmeasure": 0.14860417887228614, "rougeL_fmeasure_stderr": 0.0019427079439186818, "rougeL_precision": 0.10545507286869261, "rougeL_precision_stderr": 0.0014282925798028265, "rougeL_recall": 0.2622174946749768, "rougeL_recall_stderr": 0.0034532690725241335, "rougeLsum_fmeasure": 0.1502154921172796, "rougeLsum_fmeasure_stderr": 0.0021382854049990575, "rougeLsum_precision": 0.10644896438074114, "rougeLsum_precision_stderr": 0.0015535641404371687, "rougeLsum_recall": 0.26570822729983273, "rougeLsum_recall_stderr": 0.003832781853814249}}, "2": {"article_DOC_summary": {"bleu": 1.786388858790864, "bleu_stderr": 0.09393324735285516, "rouge1_fmeasure": 0.18998879543596028, "rouge1_fmeasure_stderr": 0.002435102538796071, "rouge1_precision": 0.13513168211881918, "rouge1_precision_stderr": 0.0018134843059910172, "rouge1_recall": 0.33296777114951603, "rouge1_recall_stderr": 0.004186110631264128, "rouge2_fmeasure": 0.043714937888104634, "rouge2_fmeasure_stderr": 0.0014970464888779478, "rouge2_precision": 0.030769398298986696, "rouge2_precision_stderr": 0.0010540577559318123, "rouge2_recall": 0.07868075969570267, "rouge2_recall_stderr": 0.0027818491235428898, "rougeL_fmeasure": 0.15208229332764386, "rougeL_fmeasure_stderr": 0.0018630213365044542, "rougeL_precision": 0.10802075057180306, "rougeL_precision_stderr": 0.0013747641806187527, "rougeL_recall": 0.2676676120777271, "rougeL_recall_stderr": 0.0033391627876980176, "rougeLsum_fmeasure": 0.14924955467827622, "rougeLsum_fmeasure_stderr": 0.0020506164724061102, "rougeLsum_precision": 0.10589092864182613, "rougeLsum_precision_stderr": 0.0014978471864364863, "rougeLsum_recall": 0.2634124678259771, "rougeLsum_recall_stderr": 0.003693726279677115}}, "3": {"article_DOC_summary": {"bleu": 1.7371936749495764, "bleu_stderr": 0.0800692258778186, "rouge1_fmeasure": 0.17964198401124917, "rouge1_fmeasure_stderr": 0.0026512597801644534, "rouge1_precision": 0.13084178809054492, "rouge1_precision_stderr": 0.0020828469963336364, "rouge1_recall": 0.30899923256216205, "rouge1_recall_stderr": 0.004574129254455469, "rouge2_fmeasure": 0.04121311126855391, "rouge2_fmeasure_stderr": 0.0014973096942535052, "rouge2_precision": 0.02936527020725493, "rouge2_precision_stderr": 0.001079925611326834, "rouge2_recall": 0.07307776507135433, "rouge2_recall_stderr": 0.0026918989216865676, "rougeL_fmeasure": 0.14521702310499732, "rougeL_fmeasure_stderr": 0.0021073439893499503, "rougeL_precision": 0.1055743501639221, "rougeL_precision_stderr": 0.001633721783184567, "rougeL_recall": 0.2507523912037128, "rougeL_recall_stderr": 0.003705785363246703, "rougeLsum_fmeasure": 0.14109185456998372, "rougeLsum_fmeasure_stderr": 0.002171446458317829, "rougeLsum_precision": 0.1025352295269978, "rougeLsum_precision_stderr": 0.001681219289412153, "rougeLsum_recall": 0.2444514281084609, "rougeLsum_recall_stderr": 0.0038788277037342775}}, "4": {"article_DOC_summary": {"bleu": 0.9036502659890296, "bleu_stderr": 0.13304107651014188, "rouge1_fmeasure": 0.05079255171386247, "rouge1_fmeasure_stderr": 0.0028639389763559352, "rouge1_precision": 0.043176373260258055, "rouge1_precision_stderr": 0.002661125304761837, "rouge1_recall": 0.07899107026617866, "rouge1_recall_stderr": 0.0045433837896930425, "rouge2_fmeasure": 0.012001869600776842, "rouge2_fmeasure_stderr": 0.0010805883272440714, "rouge2_precision": 0.009995007816000899, "rouge2_precision_stderr": 0.001094403515604492, "rouge2_recall": 0.019092183041857662, "rouge2_recall_stderr": 0.001704529550998399, "rougeL_fmeasure": 0.04075656651442719, "rougeL_fmeasure_stderr": 0.0022855328944283828, "rougeL_precision": 0.03509939833846206, "rougeL_precision_stderr": 0.002223074118925427, "rougeL_recall": 0.06366276411618525, "rougeL_recall_stderr": 0.0036829472841961148, "rougeLsum_fmeasure": 0.04091436573223043, "rougeLsum_fmeasure_stderr": 0.0023447923738265015, "rougeLsum_precision": 0.03533662342173648, "rougeLsum_precision_stderr": 0.002272411501142255, "rougeLsum_recall": 0.06371192890842961, "rougeLsum_recall_stderr": 0.003761149006539089}}, "5": {"article_DOC_summary": {"bleu": 2.161302022390058e-37, "bleu_stderr": 2.5426897518998265e-31, "rouge1_fmeasure": 0.002574370231366262, "rouge1_fmeasure_stderr": 0.0007438016527671989, "rouge1_precision": 0.0029134193104051152, "rouge1_precision_stderr": 0.0008486189609407175, "rouge1_recall": 0.0023861903048892907, "rouge1_recall_stderr": 0.0006880915596145494, "rouge2_fmeasure": 0.0005503568321367666, "rouge2_fmeasure_stderr": 0.0002924003153007301, "rouge2_precision": 0.0005833165170013117, "rouge2_precision_stderr": 0.00029806571308675146, "rouge2_recall": 0.0005320544235638574, "rouge2_recall_stderr": 0.00029204583936938926, "rougeL_fmeasure": 0.0020714173477565474, "rougeL_fmeasure_stderr": 0.0005851331121811386, "rougeL_precision": 0.002308787355007928, "rougeL_precision_stderr": 0.000647522012460148, "rougeL_recall": 0.0019494348168833185, "rougeL_recall_stderr": 0.0005577239393157619, "rougeLsum_fmeasure": 0.0022014683901710455, "rougeLsum_fmeasure_stderr": 0.0006370228443054409, "rougeLsum_precision": 0.0024689481663457947, "rougeLsum_precision_stderr": 0.0007147035241284636, "rougeLsum_recall": 0.0020576406943102633, "rougeLsum_recall_stderr": 0.0005976152809311452}}}}