|
dataset,fewshots,prompt,metric,value
|
|
e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.010736674908829128
|
|
e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.010736674908829128
|
|
e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.05706123212585479
|
|
e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.05706123212585479
|
|
e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.08456553732934603
|
|
e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.08456553732934603
|
|
e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.09792307241998234
|
|
e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.09792307241998234
|
|
e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.11225233292150326
|
|
e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.11225233292150326
|
|
e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.12437458519230632
|
|
e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.12437458519230632
|
|
e2e_nlg_cleaned,5,average,multiple,0.08115223914963698
|
|
gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.02440112287257367
|
|
gem_xsum,0,median,rouge2_fmeasure,0.02440112287257367
|
|
gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.018226182677564602
|
|
gem_xsum,1,median,rouge2_fmeasure,0.018226182677564602
|
|
gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.018525660614874147
|
|
gem_xsum,2,median,rouge2_fmeasure,0.018525660614874147
|
|
gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.017445968725527953
|
|
gem_xsum,3,median,rouge2_fmeasure,0.017445968725527953
|
|
gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.005129090360707225
|
|
gem_xsum,4,median,rouge2_fmeasure,0.005129090360707225
|
|
gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.0003192230499539746
|
|
gem_xsum,5,median,rouge2_fmeasure,0.0003192230499539746
|
|
gem_xsum,5,average,multiple,0.014007874716866929
|
|
web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.04138231986575359
|
|
web_nlg_en,0,median,rouge2_fmeasure,0.04138231986575359
|
|
web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.03623174370339374
|
|
web_nlg_en,1,median,rouge2_fmeasure,0.03623174370339374
|
|
web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.035231660164805785
|
|
web_nlg_en,2,median,rouge2_fmeasure,0.035231660164805785
|
|
web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.03498308879465038
|
|
web_nlg_en,3,median,rouge2_fmeasure,0.03498308879465038
|
|
web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.03616407362539412
|
|
web_nlg_en,4,median,rouge2_fmeasure,0.03616407362539412
|
|
web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.03554619045223363
|
|
web_nlg_en,5,median,rouge2_fmeasure,0.03554619045223363
|
|
web_nlg_en,5,average,multiple,0.03658984610103854
|
|
wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.012242312744229137
|
|
wiki_lingua_en,0,median,rouge2_fmeasure,0.012242312744229137
|
|
wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.0073507199277508825
|
|
wiki_lingua_en,1,median,rouge2_fmeasure,0.0073507199277508825
|
|
wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.007001951186011981
|
|
wiki_lingua_en,2,median,rouge2_fmeasure,0.007001951186011981
|
|
wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.009383113142976338
|
|
wiki_lingua_en,3,median,rouge2_fmeasure,0.009383113142976338
|
|
wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.003984021707078218
|
|
wiki_lingua_en,4,median,rouge2_fmeasure,0.003984021707078218
|
|
wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0009343759708146302
|
|
wiki_lingua_en,5,median,rouge2_fmeasure,0.0009343759708146302
|
|
wiki_lingua_en,5,average,multiple,0.006816082446476864
|
|
|