|
dataset,fewshots,prompt,metric,value
|
|
e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.0043911029729981465
|
|
e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.0043911029729981465
|
|
e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.14634556896551848
|
|
e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.14634556896551848
|
|
e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.16691425263662168
|
|
e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.16691425263662168
|
|
e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.17476964694401387
|
|
e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.17476964694401387
|
|
e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.17238412451550736
|
|
e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.17238412451550736
|
|
e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.17413364387783356
|
|
e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.17413364387783356
|
|
e2e_nlg_cleaned,5,average,multiple,0.1398230566520822
|
|
gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.01153407231838246
|
|
gem_xsum,0,median,rouge2_fmeasure,0.01153407231838246
|
|
gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.01870363630762986
|
|
gem_xsum,1,median,rouge2_fmeasure,0.01870363630762986
|
|
gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.02149971321984745
|
|
gem_xsum,2,median,rouge2_fmeasure,0.02149971321984745
|
|
gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.012510492483954895
|
|
gem_xsum,3,median,rouge2_fmeasure,0.012510492483954895
|
|
gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.0029439626544144923
|
|
gem_xsum,4,median,rouge2_fmeasure,0.0029439626544144923
|
|
gem_xsum,5,article_DOC_summary,rouge2_fmeasure,5.19777535214928e-05
|
|
gem_xsum,5,median,rouge2_fmeasure,5.19777535214928e-05
|
|
gem_xsum,5,average,multiple,0.01120730912295844
|
|
web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.05341982709541381
|
|
web_nlg_en,0,median,rouge2_fmeasure,0.05341982709541381
|
|
web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.05569920972530597
|
|
web_nlg_en,1,median,rouge2_fmeasure,0.05569920972530597
|
|
web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.055829123679104704
|
|
web_nlg_en,2,median,rouge2_fmeasure,0.055829123679104704
|
|
web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.0555802940665526
|
|
web_nlg_en,3,median,rouge2_fmeasure,0.0555802940665526
|
|
web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.05468830386197015
|
|
web_nlg_en,4,median,rouge2_fmeasure,0.05468830386197015
|
|
web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.05505652232011781
|
|
web_nlg_en,5,median,rouge2_fmeasure,0.05505652232011781
|
|
web_nlg_en,5,average,multiple,0.05504554679141084
|
|
wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.005442298869452033
|
|
wiki_lingua_en,0,median,rouge2_fmeasure,0.005442298869452033
|
|
wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.033304794776064954
|
|
wiki_lingua_en,1,median,rouge2_fmeasure,0.033304794776064954
|
|
wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.03566526748783912
|
|
wiki_lingua_en,2,median,rouge2_fmeasure,0.03566526748783912
|
|
wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.02943630075177706
|
|
wiki_lingua_en,3,median,rouge2_fmeasure,0.02943630075177706
|
|
wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.009975083716813172
|
|
wiki_lingua_en,4,median,rouge2_fmeasure,0.009975083716813172
|
|
wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0016405694963126324
|
|
wiki_lingua_en,5,median,rouge2_fmeasure,0.0016405694963126324
|
|
wiki_lingua_en,5,average,multiple,0.019244052516376495
|
|
|