Muennighoff's picture
Add
29393c3
dataset,fewshots,prompt,metric,value
e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.00032804483755933243
e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.00032804483755933243
e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.14487745848120898
e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.14487745848120898
e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.16097050153867934
e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.16097050153867934
e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.17904291710237294
e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.17904291710237294
e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.18976514478592516
e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.18976514478592516
e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.19513439898691012
e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.19513439898691012
e2e_nlg_cleaned,5,average,multiple,0.14501974428877598
gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.05093449549500333
gem_xsum,0,median,rouge2_fmeasure,0.05093449549500333
gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.03807299304872921
gem_xsum,1,median,rouge2_fmeasure,0.03807299304872921
gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.03829786428664246
gem_xsum,2,median,rouge2_fmeasure,0.03829786428664246
gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.03633421176029688
gem_xsum,3,median,rouge2_fmeasure,0.03633421176029688
gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.009377022747940285
gem_xsum,4,median,rouge2_fmeasure,0.009377022747940285
gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.0005666193916622732
gem_xsum,5,median,rouge2_fmeasure,0.0005666193916622732
gem_xsum,5,average,multiple,0.02893053445504574
web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.04861844568830817
web_nlg_en,0,median,rouge2_fmeasure,0.04861844568830817
web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.05672274465750321
web_nlg_en,1,median,rouge2_fmeasure,0.05672274465750321
web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.05789739591362932
web_nlg_en,2,median,rouge2_fmeasure,0.05789739591362932
web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.05845298625034767
web_nlg_en,3,median,rouge2_fmeasure,0.05845298625034767
web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.06051792994698306
web_nlg_en,4,median,rouge2_fmeasure,0.06051792994698306
web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.05997095205778236
web_nlg_en,5,median,rouge2_fmeasure,0.05997095205778236
web_nlg_en,5,average,multiple,0.057030075752425635
wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.034298445515984884
wiki_lingua_en,0,median,rouge2_fmeasure,0.034298445515984884
wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.04668447958482574
wiki_lingua_en,1,median,rouge2_fmeasure,0.04668447958482574
wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.05512243219484514
wiki_lingua_en,2,median,rouge2_fmeasure,0.05512243219484514
wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.047560822644652924
wiki_lingua_en,3,median,rouge2_fmeasure,0.047560822644652924
wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.015173414928652448
wiki_lingua_en,4,median,rouge2_fmeasure,0.015173414928652448
wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.002268834117142696
wiki_lingua_en,5,median,rouge2_fmeasure,0.002268834117142696
wiki_lingua_en,5,average,multiple,0.033518071497683974