|
dataset,fewshots,prompt,metric,value
|
|
e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.0006359667540750598
|
|
e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.0006359667540750598
|
|
e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.12463514115806919
|
|
e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.12463514115806919
|
|
e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.1463066245452882
|
|
e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.1463066245452882
|
|
e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.14999298186863755
|
|
e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.14999298186863755
|
|
e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.1583408367591379
|
|
e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.1583408367591379
|
|
e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.1726081857656977
|
|
e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.1726081857656977
|
|
e2e_nlg_cleaned,5,average,multiple,0.1254199561418176
|
|
gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.006073255625355645
|
|
gem_xsum,0,median,rouge2_fmeasure,0.006073255625355645
|
|
gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.005968104627521815
|
|
gem_xsum,1,median,rouge2_fmeasure,0.005968104627521815
|
|
gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.00672052705909708
|
|
gem_xsum,2,median,rouge2_fmeasure,0.00672052705909708
|
|
gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.006943244163002554
|
|
gem_xsum,3,median,rouge2_fmeasure,0.006943244163002554
|
|
gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.0026139422307253986
|
|
gem_xsum,4,median,rouge2_fmeasure,0.0026139422307253986
|
|
gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.00010730891049598514
|
|
gem_xsum,5,median,rouge2_fmeasure,0.00010730891049598514
|
|
gem_xsum,5,average,multiple,0.004737730436033079
|
|
web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.05502825027290272
|
|
web_nlg_en,0,median,rouge2_fmeasure,0.05502825027290272
|
|
web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.05811058513302895
|
|
web_nlg_en,1,median,rouge2_fmeasure,0.05811058513302895
|
|
web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.05685211598675336
|
|
web_nlg_en,2,median,rouge2_fmeasure,0.05685211598675336
|
|
web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.054818451753863656
|
|
web_nlg_en,3,median,rouge2_fmeasure,0.054818451753863656
|
|
web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.05493385212823661
|
|
web_nlg_en,4,median,rouge2_fmeasure,0.05493385212823661
|
|
web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.05370114479085305
|
|
web_nlg_en,5,median,rouge2_fmeasure,0.05370114479085305
|
|
web_nlg_en,5,average,multiple,0.05557406667760639
|
|
wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.0032754676506289828
|
|
wiki_lingua_en,0,median,rouge2_fmeasure,0.0032754676506289828
|
|
wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.004199685382427501
|
|
wiki_lingua_en,1,median,rouge2_fmeasure,0.004199685382427501
|
|
wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.004799135265562465
|
|
wiki_lingua_en,2,median,rouge2_fmeasure,0.004799135265562465
|
|
wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.005617198716065193
|
|
wiki_lingua_en,3,median,rouge2_fmeasure,0.005617198716065193
|
|
wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.0029260675465866874
|
|
wiki_lingua_en,4,median,rouge2_fmeasure,0.0029260675465866874
|
|
wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0004573993622119604
|
|
wiki_lingua_en,5,median,rouge2_fmeasure,0.0004573993622119604
|
|
wiki_lingua_en,5,average,multiple,0.0035458256539137984
|
|
|