|
dataset,fewshots,prompt,metric,value
|
|
e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.00032804483755933243
|
|
e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.00032804483755933243
|
|
e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.14487745848120898
|
|
e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.14487745848120898
|
|
e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.16097050153867934
|
|
e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.16097050153867934
|
|
e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.17904291710237294
|
|
e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.17904291710237294
|
|
e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.18976514478592516
|
|
e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.18976514478592516
|
|
e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.19513439898691012
|
|
e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.19513439898691012
|
|
e2e_nlg_cleaned,5,average,multiple,0.14501974428877598
|
|
gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.05093449549500333
|
|
gem_xsum,0,median,rouge2_fmeasure,0.05093449549500333
|
|
gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.03807299304872921
|
|
gem_xsum,1,median,rouge2_fmeasure,0.03807299304872921
|
|
gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.03829786428664246
|
|
gem_xsum,2,median,rouge2_fmeasure,0.03829786428664246
|
|
gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.03633421176029688
|
|
gem_xsum,3,median,rouge2_fmeasure,0.03633421176029688
|
|
gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.009377022747940285
|
|
gem_xsum,4,median,rouge2_fmeasure,0.009377022747940285
|
|
gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.0005666193916622732
|
|
gem_xsum,5,median,rouge2_fmeasure,0.0005666193916622732
|
|
gem_xsum,5,average,multiple,0.02893053445504574
|
|
web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.04861844568830817
|
|
web_nlg_en,0,median,rouge2_fmeasure,0.04861844568830817
|
|
web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.05672274465750321
|
|
web_nlg_en,1,median,rouge2_fmeasure,0.05672274465750321
|
|
web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.05789739591362932
|
|
web_nlg_en,2,median,rouge2_fmeasure,0.05789739591362932
|
|
web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.05845298625034767
|
|
web_nlg_en,3,median,rouge2_fmeasure,0.05845298625034767
|
|
web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.06051792994698306
|
|
web_nlg_en,4,median,rouge2_fmeasure,0.06051792994698306
|
|
web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.05997095205778236
|
|
web_nlg_en,5,median,rouge2_fmeasure,0.05997095205778236
|
|
web_nlg_en,5,average,multiple,0.057030075752425635
|
|
wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.034298445515984884
|
|
wiki_lingua_en,0,median,rouge2_fmeasure,0.034298445515984884
|
|
wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.04668447958482574
|
|
wiki_lingua_en,1,median,rouge2_fmeasure,0.04668447958482574
|
|
wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.05512243219484514
|
|
wiki_lingua_en,2,median,rouge2_fmeasure,0.05512243219484514
|
|
wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.047560822644652924
|
|
wiki_lingua_en,3,median,rouge2_fmeasure,0.047560822644652924
|
|
wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.015173414928652448
|
|
wiki_lingua_en,4,median,rouge2_fmeasure,0.015173414928652448
|
|
wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.002268834117142696
|
|
wiki_lingua_en,5,median,rouge2_fmeasure,0.002268834117142696
|
|
wiki_lingua_en,5,average,multiple,0.033518071497683974
|
|
|