|
dataset,fewshots,prompt,metric,value
|
|
e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.06187846081562434
|
|
e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.06187846081562434
|
|
e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.16696906460089045
|
|
e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.16696906460089045
|
|
e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.18635767606167977
|
|
e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.18635767606167977
|
|
e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.19583480506260798
|
|
e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.19583480506260798
|
|
e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.20132801941812545
|
|
e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.20132801941812545
|
|
e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.19734778489236487
|
|
e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.19734778489236487
|
|
e2e_nlg_cleaned,5,average,multiple,0.16828596847521549
|
|
gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.049755066362456114
|
|
gem_xsum,0,median,rouge2_fmeasure,0.049755066362456114
|
|
gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.034970894707131765
|
|
gem_xsum,1,median,rouge2_fmeasure,0.034970894707131765
|
|
gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.032088581665832575
|
|
gem_xsum,2,median,rouge2_fmeasure,0.032088581665832575
|
|
gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.03314896853957152
|
|
gem_xsum,3,median,rouge2_fmeasure,0.03314896853957152
|
|
gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.00874385192747724
|
|
gem_xsum,4,median,rouge2_fmeasure,0.00874385192747724
|
|
gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.00024851863402463746
|
|
gem_xsum,5,median,rouge2_fmeasure,0.00024851863402463746
|
|
gem_xsum,5,average,multiple,0.026492646972748977
|
|
web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.04314501248705826
|
|
web_nlg_en,0,median,rouge2_fmeasure,0.04314501248705826
|
|
web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.051698558921326514
|
|
web_nlg_en,1,median,rouge2_fmeasure,0.051698558921326514
|
|
web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.05453717672261224
|
|
web_nlg_en,2,median,rouge2_fmeasure,0.05453717672261224
|
|
web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.05437250272050667
|
|
web_nlg_en,3,median,rouge2_fmeasure,0.05437250272050667
|
|
web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.05731193809218633
|
|
web_nlg_en,4,median,rouge2_fmeasure,0.05731193809218633
|
|
web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.055825671549297295
|
|
web_nlg_en,5,median,rouge2_fmeasure,0.055825671549297295
|
|
web_nlg_en,5,average,multiple,0.05281514341549788
|
|
wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.027936413268100608
|
|
wiki_lingua_en,0,median,rouge2_fmeasure,0.027936413268100608
|
|
wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.04823668695482641
|
|
wiki_lingua_en,1,median,rouge2_fmeasure,0.04823668695482641
|
|
wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.05230636200823752
|
|
wiki_lingua_en,2,median,rouge2_fmeasure,0.05230636200823752
|
|
wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.04453744596750722
|
|
wiki_lingua_en,3,median,rouge2_fmeasure,0.04453744596750722
|
|
wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.014698290853528981
|
|
wiki_lingua_en,4,median,rouge2_fmeasure,0.014698290853528981
|
|
wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0027535231928660694
|
|
wiki_lingua_en,5,median,rouge2_fmeasure,0.0027535231928660694
|
|
wiki_lingua_en,5,average,multiple,0.03174478704084447
|
|
|