File size: 27,966 Bytes
763a8f1 |
1 |
{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.4214863735405607, "bleu_stderr": 0.029154609162010323, "rouge1_fmeasure": 0.10879688033992795, "rouge1_fmeasure_stderr": 0.0021627779616647516, "rouge1_precision": 0.08388349369737222, "rouge1_precision_stderr": 0.0028741362760589364, "rouge1_recall": 0.2839223617284565, "rouge1_recall_stderr": 0.005264418568471245, "rouge2_fmeasure": 0.05055369077754123, "rouge2_fmeasure_stderr": 0.0012930809657985872, "rouge2_precision": 0.04057930751764507, "rouge2_precision_stderr": 0.002047816625134428, "rouge2_recall": 0.13506279227711254, "rouge2_recall_stderr": 0.0032130647312794175, "rougeL_fmeasure": 0.10393401018258999, "rougeL_fmeasure_stderr": 0.002007764403266908, "rougeL_precision": 0.08041455507307416, "rougeL_precision_stderr": 0.002796739709192279, "rougeL_recall": 0.2738666536323073, "rougeL_recall_stderr": 0.005085678508176572, "rougeLsum_fmeasure": 0.10270283885145984, "rougeLsum_fmeasure_stderr": 0.002020111493088052, "rougeLsum_precision": 0.07977634567972974, "rougeLsum_precision_stderr": 0.002805961856125458, "rougeLsum_recall": 0.26749167398935675, "rougeLsum_recall_stderr": 0.004882015301399527}}, "1": {"PALM_prompt": {"bleu": 0.5958530874585899, "bleu_stderr": 0.03649262475380295, "rouge1_fmeasure": 0.16359576779434043, "rouge1_fmeasure_stderr": 0.003809967310568941, "rouge1_precision": 0.13749267610186958, "rouge1_precision_stderr": 0.004325878829249963, "rouge1_recall": 0.3241716808952326, "rouge1_recall_stderr": 0.005125119098986173, "rouge2_fmeasure": 0.08433674778206289, "rouge2_fmeasure_stderr": 0.002591174609210514, "rouge2_precision": 0.07246358161159391, "rouge2_precision_stderr": 0.0029673895627135506, "rouge2_recall": 0.16876397664351184, "rouge2_recall_stderr": 0.00367859006299185, "rougeL_fmeasure": 0.14881701677232517, "rougeL_fmeasure_stderr": 0.003277859581563782, "rougeL_precision": 0.12393180075905823, "rougeL_precision_stderr": 0.0037992843733980434, "rougeL_recall": 0.30308740481864604, "rougeL_recall_stderr": 0.004697897076217226, "rougeLsum_fmeasure": 0.15170700107447863, "rougeLsum_fmeasure_stderr": 0.0033575398797432874, "rougeLsum_precision": 0.12662324522811608, "rougeLsum_precision_stderr": 0.00387820514144903, "rougeLsum_recall": 0.3067988164213401, "rougeLsum_recall_stderr": 0.004754578958904846}}, "2": {"PALM_prompt": {"bleu": 0.7632123296691333, "bleu_stderr": 0.038667647524407975, "rouge1_fmeasure": 0.2022385311781214, "rouge1_fmeasure_stderr": 0.004271916206549367, "rouge1_precision": 0.17619531326285107, "rouge1_precision_stderr": 0.005080542288823818, "rouge1_recall": 0.3742085058586801, "rouge1_recall_stderr": 0.004920653945655996, "rouge2_fmeasure": 0.10803467148430693, "rouge2_fmeasure_stderr": 0.0030612514779265803, "rouge2_precision": 0.09658792599721289, "rouge2_precision_stderr": 0.003611262853993622, "rouge2_recall": 0.20162933402440936, "rouge2_recall_stderr": 0.0038801577073926965, "rougeL_fmeasure": 0.18252899170611903, "rougeL_fmeasure_stderr": 0.0037263532749030616, "rougeL_precision": 0.15692981536908263, "rougeL_precision_stderr": 0.004446297762122498, "rougeL_recall": 0.3484780480719596, "rougeL_recall_stderr": 0.0045553445266088635, "rougeLsum_fmeasure": 0.18711611785244323, "rougeLsum_fmeasure_stderr": 0.003848891104616288, "rougeLsum_precision": 0.16217269474751653, "rougeLsum_precision_stderr": 0.004631557820535045, "rougeLsum_recall": 0.35330840347834674, "rougeLsum_recall_stderr": 0.004610857396095154}}, "3": {"PALM_prompt": {"bleu": 0.9207133879279265, "bleu_stderr": 0.03255931768193071, "rouge1_fmeasure": 0.20867536510345913, "rouge1_fmeasure_stderr": 0.004354382473584997, "rouge1_precision": 0.18377058302813723, "rouge1_precision_stderr": 0.005253580997340217, "rouge1_recall": 0.381271206422023, "rouge1_recall_stderr": 0.004890766475780684, "rouge2_fmeasure": 0.11272429502619766, "rouge2_fmeasure_stderr": 0.0031312620749979446, "rouge2_precision": 0.10294612127680682, "rouge2_precision_stderr": 0.0037309770662019557, "rouge2_recall": 0.2060814488662053, "rouge2_recall_stderr": 0.0038997213229875847, "rougeL_fmeasure": 0.18616032806880206, "rougeL_fmeasure_stderr": 0.003714239240740623, "rougeL_precision": 0.16232375389423376, "rougeL_precision_stderr": 0.0045761676741338285, "rougeL_recall": 0.35147344800261143, "rougeL_recall_stderr": 0.004418957418369871, "rougeLsum_fmeasure": 0.19151809123693445, "rougeLsum_fmeasure_stderr": 0.003873742236641197, "rougeLsum_precision": 0.16801891503402527, "rougeLsum_precision_stderr": 0.004781137280246318, "rougeLsum_recall": 0.3573456612646077, "rougeLsum_recall_stderr": 0.004500705918880425}}, "4": {"PALM_prompt": {"bleu": 0.9902518578876233, "bleu_stderr": 0.040737732761129415, "rouge1_fmeasure": 0.21290146130579965, "rouge1_fmeasure_stderr": 0.0043700834724458276, "rouge1_precision": 0.18789368573901274, "rouge1_precision_stderr": 0.005285851879717852, "rouge1_recall": 0.3899093270922249, "rouge1_recall_stderr": 0.004962887842702003, "rouge2_fmeasure": 0.11683410537192468, "rouge2_fmeasure_stderr": 0.0031833984768610346, "rouge2_precision": 0.10560975558011194, "rouge2_precision_stderr": 0.003731700714381224, "rouge2_recall": 0.2145796483953565, "rouge2_recall_stderr": 0.004035868026365014, "rougeL_fmeasure": 0.1890303353482411, "rougeL_fmeasure_stderr": 0.003700023042470156, "rougeL_precision": 0.16382625310518403, "rougeL_precision_stderr": 0.004486884267673038, "rougeL_recall": 0.3597071518828505, "rougeL_recall_stderr": 0.004521922524975513, "rougeLsum_fmeasure": 0.19508857877285685, "rougeLsum_fmeasure_stderr": 0.003865606407547543, "rougeLsum_precision": 0.1707530708743364, "rougeLsum_precision_stderr": 0.004732141735621611, "rougeLsum_recall": 0.36629613801895733, "rougeLsum_recall_stderr": 0.004591525609735619}}, "5": {"PALM_prompt": {"bleu": 1.0873761263949675, "bleu_stderr": 0.03934330697010386, "rouge1_fmeasure": 0.23018635133450477, "rouge1_fmeasure_stderr": 0.004612080716063762, "rouge1_precision": 0.2117037418048869, "rouge1_precision_stderr": 0.005797595530762211, "rouge1_recall": 0.39911584774379655, "rouge1_recall_stderr": 0.00498148260658174, "rouge2_fmeasure": 0.12701615271509778, "rouge2_fmeasure_stderr": 0.003293666322506656, "rouge2_precision": 0.12132204155512089, "rouge2_precision_stderr": 0.004137193433006742, "rouge2_recall": 0.2209500964153402, "rouge2_recall_stderr": 0.004025388576844993, "rougeL_fmeasure": 0.20292345789497096, "rougeL_fmeasure_stderr": 0.003854003762475144, "rougeL_precision": 0.18406790377006843, "rougeL_precision_stderr": 0.004937322660278917, "rougeL_recall": 0.36561941279365967, "rougeL_recall_stderr": 0.004496892763588926, "rougeLsum_fmeasure": 0.20912697515193987, "rougeLsum_fmeasure_stderr": 0.00401671896906783, "rougeLsum_precision": 0.19092590715178714, "rougeLsum_precision_stderr": 0.005162190150819128, "rougeLsum_recall": 0.3726247925460039, "rougeLsum_recall_stderr": 0.004574209186658482}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 2.318732566456423, "bleu_stderr": 0.13881817798189033, "rouge1_fmeasure": 0.1485707360665655, "rouge1_fmeasure_stderr": 0.0023637963366588163, "rouge1_precision": 0.14513591635070752, "rouge1_precision_stderr": 0.002933831212103272, "rouge1_recall": 0.19891787194668262, "rouge1_recall_stderr": 0.003187558635297779, "rouge2_fmeasure": 0.03346604327851081, "rouge2_fmeasure_stderr": 0.0009887781706946746, "rouge2_precision": 0.029907874227091444, "rouge2_precision_stderr": 0.000921657729333574, "rouge2_recall": 0.04649017309040178, "rouge2_recall_stderr": 0.0014882369637529544, "rougeL_fmeasure": 0.11823159104307632, "rougeL_fmeasure_stderr": 0.0017829954318414592, "rougeL_precision": 0.11668487543384909, "rougeL_precision_stderr": 0.002498896390227391, "rougeL_recall": 0.16129272420830681, "rougeL_recall_stderr": 0.002571624720811961, "rougeLsum_fmeasure": 0.13755330088318402, "rougeLsum_fmeasure_stderr": 0.00219534310275043, "rougeLsum_precision": 0.13518764121791138, "rougeLsum_precision_stderr": 0.0028124634604811717, "rougeLsum_recall": 0.18445870962398936, "rougeLsum_recall_stderr": 0.0029688108031568614}}, "1": {"tldr_en": {"bleu": 2.926117660825783, "bleu_stderr": 0.0707920058779335, "rouge1_fmeasure": 0.18955083016621427, "rouge1_fmeasure_stderr": 0.002379156871875284, "rouge1_precision": 0.248970781629388, "rouge1_precision_stderr": 0.003874261949118977, "rouge1_recall": 0.20254661208456856, "rouge1_recall_stderr": 0.0028554953044439015, "rouge2_fmeasure": 0.04746965955266556, "rouge2_fmeasure_stderr": 0.0013357687513664974, "rouge2_precision": 0.0689782299271333, "rouge2_precision_stderr": 0.002313495667945766, "rouge2_recall": 0.049284004115414136, "rouge2_recall_stderr": 0.0014678263918321242, "rougeL_fmeasure": 0.14594622749474678, "rougeL_fmeasure_stderr": 0.0018424648214888, "rougeL_precision": 0.19495136652936196, "rougeL_precision_stderr": 0.0032222442707770895, "rougeL_recall": 0.1564134625395888, "rougeL_recall_stderr": 0.002249411692052382, "rougeLsum_fmeasure": 0.17879643931529124, "rougeLsum_fmeasure_stderr": 0.0022381896082302615, "rougeLsum_precision": 0.23507901615131913, "rougeLsum_precision_stderr": 0.0036892088805215145, "rougeLsum_recall": 0.19138092032456272, "rougeLsum_recall_stderr": 0.002706865345022287}}, "2": {"tldr_en": {"bleu": 4.482664241932101, "bleu_stderr": 0.08212180996103731, "rouge1_fmeasure": 0.25402066807919726, "rouge1_fmeasure_stderr": 0.0022729602698409765, "rouge1_precision": 0.35679011396950494, "rouge1_precision_stderr": 0.0039535541787012966, "rouge1_recall": 0.2525122163812022, "rouge1_recall_stderr": 0.0028104769002719686, "rouge2_fmeasure": 0.07776422929510499, "rouge2_fmeasure_stderr": 0.0015470867437394145, "rouge2_precision": 0.11566892110217673, "rouge2_precision_stderr": 0.0025968459819964438, "rouge2_recall": 0.0758485270748662, "rouge2_recall_stderr": 0.0016494845495132536, "rougeL_fmeasure": 0.19606027302517406, "rougeL_fmeasure_stderr": 0.0018502837344183064, "rougeL_precision": 0.2787485396392972, "rougeL_precision_stderr": 0.00333060867857478, "rougeL_recall": 0.1946844152208185, "rougeL_recall_stderr": 0.002269590023349728, "rougeLsum_fmeasure": 0.24005412545885543, "rougeLsum_fmeasure_stderr": 0.0021905454232920693, "rougeLsum_precision": 0.33780149114906943, "rougeLsum_precision_stderr": 0.003819320386381285, "rougeLsum_recall": 0.23865291484527454, "rougeLsum_recall_stderr": 0.0027000637562272383}}, "3": {"tldr_en": {"bleu": 3.0072655046058805, "bleu_stderr": 0.09596043858220096, "rouge1_fmeasure": 0.2113115990683054, "rouge1_fmeasure_stderr": 0.0027547750855983046, "rouge1_precision": 0.3061484539454385, "rouge1_precision_stderr": 0.004423098151670539, "rouge1_recall": 0.20167165147009586, "rouge1_recall_stderr": 0.003037208327664155, "rouge2_fmeasure": 0.06469489115245816, "rouge2_fmeasure_stderr": 0.0015394791419511076, "rouge2_precision": 0.10017174467185903, "rouge2_precision_stderr": 0.002669280506981759, "rouge2_recall": 0.06128388820701079, "rouge2_recall_stderr": 0.0016275016915406385, "rougeL_fmeasure": 0.1649989495768865, "rougeL_fmeasure_stderr": 0.002208842551468564, "rougeL_precision": 0.2427018640988824, "rougeL_precision_stderr": 0.0037099343074804333, "rougeL_recall": 0.1573050958528797, "rougeL_recall_stderr": 0.002452551923134493, "rougeLsum_fmeasure": 0.19989739105994972, "rougeLsum_fmeasure_stderr": 0.0026343775714049306, "rougeLsum_precision": 0.29051399119634647, "rougeLsum_precision_stderr": 0.004266689720705603, "rougeLsum_recall": 0.19088557384190263, "rougeLsum_recall_stderr": 0.0029163289376507914}}, "4": {"tldr_en": {"bleu": 0.02961687910857089, "bleu_stderr": 0.00667797537003518, "rouge1_fmeasure": 0.06646559577850898, "rouge1_fmeasure_stderr": 0.002389468792903583, "rouge1_precision": 0.09734210523837013, "rouge1_precision_stderr": 0.003585657330962349, "rouge1_recall": 0.06338401184872311, "rouge1_recall_stderr": 0.002461970340537986, "rouge2_fmeasure": 0.020767091534965167, "rouge2_fmeasure_stderr": 0.001088077081953597, "rouge2_precision": 0.0321171525149136, "rouge2_precision_stderr": 0.0017883302892353346, "rouge2_recall": 0.019779405420936473, "rouge2_recall_stderr": 0.0011693482689711905, "rougeL_fmeasure": 0.05241812699049824, "rougeL_fmeasure_stderr": 0.0019162468765830335, "rougeL_precision": 0.07721998831670598, "rougeL_precision_stderr": 0.002911924342353414, "rougeL_recall": 0.05016221089779053, "rougeL_recall_stderr": 0.001994888739662481, "rougeLsum_fmeasure": 0.062355467850168954, "rougeLsum_fmeasure_stderr": 0.0022529742622293867, "rougeLsum_precision": 0.09174287392107108, "rougeLsum_precision_stderr": 0.0034181860926286, "rougeLsum_recall": 0.05945776168044872, "rougeLsum_recall_stderr": 0.0023246003955623533}}, "5": {"tldr_en": {"bleu": 5.0425595242130537e-17, "bleu_stderr": 5.828914972997529e-15, "rouge1_fmeasure": 0.010515163702672926, "rouge1_fmeasure_stderr": 0.001060191799945764, "rouge1_precision": 0.01662223836437527, "rouge1_precision_stderr": 0.0017200192815433816, "rouge1_recall": 0.010369987242786843, "rouge1_recall_stderr": 0.0011350821871749513, "rouge2_fmeasure": 0.0034609320209794962, "rouge2_fmeasure_stderr": 0.000506080127090741, "rouge2_precision": 0.0056669762870846345, "rouge2_precision_stderr": 0.0008937346232787428, "rouge2_recall": 0.0035137406087487875, "rouge2_recall_stderr": 0.0005888971524329703, "rougeL_fmeasure": 0.00858027237742148, "rougeL_fmeasure_stderr": 0.0008896522724178397, "rougeL_precision": 0.013605527079975888, "rougeL_precision_stderr": 0.0014624549576253666, "rougeL_recall": 0.008580131540181942, "rougeL_recall_stderr": 0.0009742333834018987, "rougeLsum_fmeasure": 0.010008632917285501, "rougeLsum_fmeasure_stderr": 0.0010183013884774283, "rougeLsum_precision": 0.015819080798652796, "rougeLsum_precision_stderr": 0.001649211944475785, "rougeLsum_recall": 0.009938412449545603, "rougeLsum_recall_stderr": 0.0011052383189021134}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 3.727703428672484, "bleu_stderr": 0.16225275145292814, "rouge1_fmeasure": 0.11677483396146617, "rouge1_fmeasure_stderr": 0.0026043522717618377, "rouge1_precision": 0.15580458811715164, "rouge1_precision_stderr": 0.004522055277902883, "rouge1_recall": 0.16212105310140335, "rouge1_recall_stderr": 0.0038770863196531777, "rouge2_fmeasure": 0.04207195309354536, "rouge2_fmeasure_stderr": 0.0011458322627199238, "rouge2_precision": 0.08759078800738393, "rouge2_precision_stderr": 0.004060781916683637, "rouge2_recall": 0.05918434764233474, "rouge2_recall_stderr": 0.001745078033222418, "rougeL_fmeasure": 0.0970712318345091, "rougeL_fmeasure_stderr": 0.002118544001686245, "rougeL_precision": 0.13984894212789747, "rougeL_precision_stderr": 0.0044166136430229454, "rougeL_recall": 0.1340573709320961, "rougeL_recall_stderr": 0.0031951681845401422, "rougeLsum_fmeasure": 0.10190557193119215, "rougeLsum_fmeasure_stderr": 0.0022803567703003585, "rougeLsum_precision": 0.14388054529296093, "rougeLsum_precision_stderr": 0.004453879377805569, "rougeLsum_recall": 0.14043655820750423, "rougeLsum_recall_stderr": 0.003394973082402341}}, "1": {"generate_text_restaurant": {"bleu": 12.253787105095654, "bleu_stderr": 0.1531956101772429, "rouge1_fmeasure": 0.48227052690365063, "rouge1_fmeasure_stderr": 0.002317881335104088, "rouge1_precision": 0.5916925132644157, "rouge1_precision_stderr": 0.00322106862270845, "rouge1_recall": 0.4463736554053124, "rouge1_recall_stderr": 0.0030343957764200962, "rouge2_fmeasure": 0.22765626131798156, "rouge2_fmeasure_stderr": 0.0020703831562182183, "rouge2_precision": 0.2838064949819702, "rouge2_precision_stderr": 0.0027789665070579485, "rouge2_recall": 0.2105351617568858, "rouge2_recall_stderr": 0.0022171957363924296, "rougeL_fmeasure": 0.34946822459925764, "rougeL_fmeasure_stderr": 0.0020719433030147168, "rougeL_precision": 0.43217159380951586, "rougeL_precision_stderr": 0.0029973445963260422, "rougeL_recall": 0.32230580960354577, "rougeL_recall_stderr": 0.0024575923055788883, "rougeLsum_fmeasure": 0.3932633862316688, "rougeLsum_fmeasure_stderr": 0.002340814619008484, "rougeLsum_precision": 0.48366766620362545, "rougeLsum_precision_stderr": 0.0032029340181387936, "rougeLsum_recall": 0.36354140064435775, "rougeLsum_recall_stderr": 0.0027910193529178087}}, "2": {"generate_text_restaurant": {"bleu": 14.934222887897532, "bleu_stderr": 0.21278791413856055, "rouge1_fmeasure": 0.5160444555536067, "rouge1_fmeasure_stderr": 0.00228951307038736, "rouge1_precision": 0.6137196300402722, "rouge1_precision_stderr": 0.0031475076717186906, "rouge1_recall": 0.48231229181347424, "rouge1_recall_stderr": 0.002994935365094384, "rouge2_fmeasure": 0.2594509643808628, "rouge2_fmeasure_stderr": 0.0021848217582054836, "rouge2_precision": 0.3128748478554642, "rouge2_precision_stderr": 0.0028571435877434844, "rouge2_recall": 0.24224424588278937, "rouge2_recall_stderr": 0.002338319832959116, "rougeL_fmeasure": 0.37626113256931526, "rougeL_fmeasure_stderr": 0.0021363134322449147, "rougeL_precision": 0.4496161361042401, "rougeL_precision_stderr": 0.002965960715542685, "rougeL_recall": 0.35106979956416473, "rougeL_recall_stderr": 0.0025186871703425898, "rougeLsum_fmeasure": 0.42631762287613684, "rougeLsum_fmeasure_stderr": 0.00239431216095114, "rougeLsum_precision": 0.5075541777391559, "rougeLsum_precision_stderr": 0.003180746032746745, "rougeLsum_recall": 0.3982152959674102, "rougeLsum_recall_stderr": 0.002838831357019365}}, "3": {"generate_text_restaurant": {"bleu": 15.550166229098965, "bleu_stderr": 0.21100324131614723, "rouge1_fmeasure": 0.5240247422123916, "rouge1_fmeasure_stderr": 0.0022364704364336795, "rouge1_precision": 0.6164424274284126, "rouge1_precision_stderr": 0.0031180799828950793, "rouge1_recall": 0.49077882213900875, "rouge1_recall_stderr": 0.002902655623188235, "rouge2_fmeasure": 0.2655834480484239, "rouge2_fmeasure_stderr": 0.0021599553939183514, "rouge2_precision": 0.3165046826237152, "rouge2_precision_stderr": 0.002782884317807398, "rouge2_recall": 0.24838679979596562, "rouge2_recall_stderr": 0.0023021548981493603, "rougeL_fmeasure": 0.38460762326164105, "rougeL_fmeasure_stderr": 0.0021692227869033478, "rougeL_precision": 0.45453733777109134, "rougeL_precision_stderr": 0.0029846320407150165, "rougeL_recall": 0.35943496219625287, "rougeL_recall_stderr": 0.002503259775759038, "rougeLsum_fmeasure": 0.4372484038981659, "rougeLsum_fmeasure_stderr": 0.002394606287079693, "rougeLsum_precision": 0.5148376263253541, "rougeLsum_precision_stderr": 0.0031730624992959006, "rougeLsum_recall": 0.4092664706750279, "rougeLsum_recall_stderr": 0.002806743229599867}}, "4": {"generate_text_restaurant": {"bleu": 15.882734366339575, "bleu_stderr": 0.20014792318307217, "rouge1_fmeasure": 0.5268811401300224, "rouge1_fmeasure_stderr": 0.002296537855184882, "rouge1_precision": 0.617829970748385, "rouge1_precision_stderr": 0.0031627975477214964, "rouge1_recall": 0.4934813921824228, "rouge1_recall_stderr": 0.0028974554963002866, "rouge2_fmeasure": 0.2697484320297564, "rouge2_fmeasure_stderr": 0.0022376325121211964, "rouge2_precision": 0.31982595333569097, "rouge2_precision_stderr": 0.002834806640598152, "rouge2_recall": 0.2524396113719004, "rouge2_recall_stderr": 0.002374239958755143, "rougeL_fmeasure": 0.38708461902411606, "rougeL_fmeasure_stderr": 0.002242571110085911, "rougeL_precision": 0.4547884196194121, "rougeL_precision_stderr": 0.0029857683967765883, "rougeL_recall": 0.36242825370807497, "rougeL_recall_stderr": 0.00256326606590863, "rougeLsum_fmeasure": 0.4406025001412695, "rougeLsum_fmeasure_stderr": 0.0024516808057243426, "rougeLsum_precision": 0.5162937268213095, "rougeLsum_precision_stderr": 0.003187124832415968, "rougeLsum_recall": 0.4128904038699314, "rougeLsum_recall_stderr": 0.0028402630566630306}}, "5": {"generate_text_restaurant": {"bleu": 15.843755546529314, "bleu_stderr": 0.23380050838762192, "rouge1_fmeasure": 0.5268007980171965, "rouge1_fmeasure_stderr": 0.0022830659821340285, "rouge1_precision": 0.6189660173531598, "rouge1_precision_stderr": 0.003202216597059111, "rouge1_recall": 0.49387787166933184, "rouge1_recall_stderr": 0.00292152626004202, "rouge2_fmeasure": 0.26998871183013234, "rouge2_fmeasure_stderr": 0.0021968682565042135, "rouge2_precision": 0.32113506253536717, "rouge2_precision_stderr": 0.002823936183018856, "rouge2_recall": 0.25289072399317875, "rouge2_recall_stderr": 0.0023526916821315917, "rougeL_fmeasure": 0.38651546157123484, "rougeL_fmeasure_stderr": 0.002221892359998622, "rougeL_precision": 0.45492486270003574, "rougeL_precision_stderr": 0.002993407598047982, "rougeL_recall": 0.3622504836542661, "rougeL_recall_stderr": 0.002569318863258077, "rougeLsum_fmeasure": 0.44101339790167177, "rougeLsum_fmeasure_stderr": 0.0024405926593214712, "rougeLsum_precision": 0.5179172358492237, "rougeLsum_precision_stderr": 0.0032140290174150392, "rougeLsum_recall": 0.4135121055179984, "rougeLsum_recall_stderr": 0.0028519351140784115}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 2.4021403698389303, "bleu_stderr": 0.067244017856741, "rouge1_fmeasure": 0.22900899484830875, "rouge1_fmeasure_stderr": 0.002592170416843644, "rouge1_precision": 0.16834475552405148, "rouge1_precision_stderr": 0.002143734509300351, "rouge1_recall": 0.3812302941527284, "rouge1_recall_stderr": 0.004466228338306761, "rouge2_fmeasure": 0.056521580391250686, "rouge2_fmeasure_stderr": 0.0017743435854162372, "rouge2_precision": 0.04090800254887081, "rouge2_precision_stderr": 0.001331305757616898, "rouge2_recall": 0.09717669760813316, "rouge2_recall_stderr": 0.0031305903631064793, "rougeL_fmeasure": 0.16720327598962526, "rougeL_fmeasure_stderr": 0.0020460047183396978, "rougeL_precision": 0.12317643828521285, "rougeL_precision_stderr": 0.0017773839864967875, "rougeL_recall": 0.2797265709939456, "rougeL_recall_stderr": 0.0036566609405842706, "rougeLsum_fmeasure": 0.18208585408505043, "rougeLsum_fmeasure_stderr": 0.00227028405987386, "rougeLsum_precision": 0.1339383429556578, "rougeLsum_precision_stderr": 0.0019089490816378235, "rougeLsum_recall": 0.3045528042834054, "rougeLsum_recall_stderr": 0.004033519848039268}}, "1": {"article_DOC_summary": {"bleu": 2.587973656923586, "bleu_stderr": 0.18271829592693106, "rouge1_fmeasure": 0.22010181845678548, "rouge1_fmeasure_stderr": 0.0035289902424468713, "rouge1_precision": 0.2269075171314588, "rouge1_precision_stderr": 0.004333302214651766, "rouge1_recall": 0.24532990314212508, "rouge1_recall_stderr": 0.003988402379243326, "rouge2_fmeasure": 0.04964766400970655, "rouge2_fmeasure_stderr": 0.002214536505649702, "rouge2_precision": 0.052629985612383176, "rouge2_precision_stderr": 0.0026272197223151062, "rouge2_recall": 0.05514694411681367, "rouge2_recall_stderr": 0.002420925395374345, "rougeL_fmeasure": 0.16668249804551818, "rougeL_fmeasure_stderr": 0.002858700548419538, "rougeL_precision": 0.1721080105359506, "rougeL_precision_stderr": 0.003568699794613313, "rougeL_recall": 0.18654158462763012, "rougeL_recall_stderr": 0.0032259213006477503, "rougeLsum_fmeasure": 0.168054574737479, "rougeLsum_fmeasure_stderr": 0.0028788648929427077, "rougeLsum_precision": 0.17318677280555747, "rougeLsum_precision_stderr": 0.0035702087618089537, "rougeLsum_recall": 0.18887685302453283, "rougeLsum_recall_stderr": 0.003346146632601525}}, "2": {"article_DOC_summary": {"bleu": 2.894349555094649, "bleu_stderr": 0.20938561045016857, "rouge1_fmeasure": 0.22681874696670282, "rouge1_fmeasure_stderr": 0.0035634918232377074, "rouge1_precision": 0.23962839287439405, "rouge1_precision_stderr": 0.004379685148326459, "rouge1_recall": 0.24084621475655701, "rouge1_recall_stderr": 0.003791189958412602, "rouge2_fmeasure": 0.05421648195620343, "rouge2_fmeasure_stderr": 0.0023479794051376422, "rouge2_precision": 0.05825281986003038, "rouge2_precision_stderr": 0.0026810505602905777, "rouge2_recall": 0.056775559678677465, "rouge2_recall_stderr": 0.002426834325647628, "rougeL_fmeasure": 0.17492387767242143, "rougeL_fmeasure_stderr": 0.0029179836282209, "rougeL_precision": 0.1845331825452337, "rougeL_precision_stderr": 0.003580958301916115, "rougeL_recall": 0.18702023658313446, "rougeL_recall_stderr": 0.003174519635609054, "rougeLsum_fmeasure": 0.17541718007715307, "rougeLsum_fmeasure_stderr": 0.0029228112018755566, "rougeLsum_precision": 0.1851109498506353, "rougeLsum_precision_stderr": 0.0035857038136326946, "rougeLsum_recall": 0.1874180466959014, "rougeLsum_recall_stderr": 0.0031802199539878143}}, "3": {"article_DOC_summary": {"bleu": 3.3807185036949794, "bleu_stderr": 0.21747997288721058, "rouge1_fmeasure": 0.22875361771029976, "rouge1_fmeasure_stderr": 0.004084338493816929, "rouge1_precision": 0.2493216186518576, "rouge1_precision_stderr": 0.0049084458961309585, "rouge1_recall": 0.23437481439478378, "rouge1_recall_stderr": 0.00414167551937926, "rouge2_fmeasure": 0.058170472646030105, "rouge2_fmeasure_stderr": 0.002575465227066567, "rouge2_precision": 0.06426035314217526, "rouge2_precision_stderr": 0.0029430708789924724, "rouge2_recall": 0.05825170712730457, "rouge2_recall_stderr": 0.0025593535615914685, "rougeL_fmeasure": 0.17477557833568425, "rougeL_fmeasure_stderr": 0.003389234359734604, "rougeL_precision": 0.19044444305113, "rougeL_precision_stderr": 0.004057392892502295, "rougeL_recall": 0.1796956624879631, "rougeL_recall_stderr": 0.0034464435487860908, "rougeLsum_fmeasure": 0.17624162420032213, "rougeLsum_fmeasure_stderr": 0.0033874175464656286, "rougeLsum_precision": 0.19176785292110343, "rougeLsum_precision_stderr": 0.004051683679981941, "rougeLsum_recall": 0.1817729140455351, "rougeLsum_recall_stderr": 0.0034769204180304563}}, "4": {"article_DOC_summary": {"bleu": 0.11188091321184003, "bleu_stderr": 0.02931669237987178, "rouge1_fmeasure": 0.055495095278546853, "rouge1_fmeasure_stderr": 0.0035332699011158906, "rouge1_precision": 0.06368749975876878, "rouge1_precision_stderr": 0.004163291649927898, "rouge1_recall": 0.05633355721143847, "rouge1_recall_stderr": 0.003674327931986382, "rouge2_fmeasure": 0.014126745787126624, "rouge2_fmeasure_stderr": 0.0014244420667161892, "rouge2_precision": 0.01625809935844295, "rouge2_precision_stderr": 0.001744008450570692, "rouge2_recall": 0.014127871826558468, "rouge2_recall_stderr": 0.0014279592951878697, "rougeL_fmeasure": 0.042006581084650725, "rougeL_fmeasure_stderr": 0.002736359920016333, "rougeL_precision": 0.048922678698080466, "rougeL_precision_stderr": 0.003321571568066582, "rougeL_recall": 0.04260833742058202, "rougeL_recall_stderr": 0.0028433365851945613, "rougeLsum_fmeasure": 0.04223553974124363, "rougeLsum_fmeasure_stderr": 0.0027526558135678226, "rougeLsum_precision": 0.049121011091270275, "rougeLsum_precision_stderr": 0.0033301554897141204, "rougeLsum_recall": 0.042965789423027506, "rougeLsum_recall_stderr": 0.0028912525537101723}}, "5": {"article_DOC_summary": {"bleu": 2.2560041633308834e-45, "bleu_stderr": 1.8421463064085026e-30, "rouge1_fmeasure": 0.002533146063446972, "rouge1_fmeasure_stderr": 0.0008926774274323296, "rouge1_precision": 0.002666427538603693, "rouge1_precision_stderr": 0.001013100557726815, "rouge1_recall": 0.0025861091150659685, "rouge1_recall_stderr": 0.0008630243879275325, "rouge2_fmeasure": 0.0006840490507628032, "rouge2_fmeasure_stderr": 0.00035126113759812106, "rouge2_precision": 0.0007974546793721661, "rouge2_precision_stderr": 0.0004389545775956508, "rouge2_recall": 0.0006295661715078737, "rouge2_recall_stderr": 0.00030074990914758437, "rougeL_fmeasure": 0.0018694866909844472, "rougeL_fmeasure_stderr": 0.0007140136174659965, "rougeL_precision": 0.002022260888604123, "rougeL_precision_stderr": 0.0008452973095491474, "rougeL_recall": 0.0018561449826780235, "rougeL_recall_stderr": 0.0006574742336350735, "rougeLsum_fmeasure": 0.0019113224438188196, "rougeLsum_fmeasure_stderr": 0.000720026623055153, "rougeLsum_precision": 0.00205235327222183, "rougeLsum_precision_stderr": 0.0008479115148274438, "rougeLsum_recall": 0.0019247556173263936, "rougeLsum_recall_stderr": 0.0006749866649238696}}}} |