|
dataset,fewshots,prompt,metric,value
|
|
e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.0
|
|
e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.0
|
|
e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.0790458842297352
|
|
e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.0790458842297352
|
|
e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.09494958872823868
|
|
e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.09494958872823868
|
|
e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.10541398390697426
|
|
e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.10541398390697426
|
|
e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.11600779243298241
|
|
e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.11600779243298241
|
|
e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.1273300920831121
|
|
e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.1273300920831121
|
|
e2e_nlg_cleaned,5,average,multiple,0.08712455689684044
|
|
gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.023697282994221247
|
|
gem_xsum,0,median,rouge2_fmeasure,0.023697282994221247
|
|
gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.018497303697898898
|
|
gem_xsum,1,median,rouge2_fmeasure,0.018497303697898898
|
|
gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.019662620850184154
|
|
gem_xsum,2,median,rouge2_fmeasure,0.019662620850184154
|
|
gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.018803041332499517
|
|
gem_xsum,3,median,rouge2_fmeasure,0.018803041332499517
|
|
gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.005563844272859168
|
|
gem_xsum,4,median,rouge2_fmeasure,0.005563844272859168
|
|
gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.00043251733980451243
|
|
gem_xsum,5,median,rouge2_fmeasure,0.00043251733980451243
|
|
gem_xsum,5,average,multiple,0.014442768414577915
|
|
web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.03996425304915668
|
|
web_nlg_en,0,median,rouge2_fmeasure,0.03996425304915668
|
|
web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.03533421218479914
|
|
web_nlg_en,1,median,rouge2_fmeasure,0.03533421218479914
|
|
web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.034017897932799156
|
|
web_nlg_en,2,median,rouge2_fmeasure,0.034017897932799156
|
|
web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.033414173983495055
|
|
web_nlg_en,3,median,rouge2_fmeasure,0.033414173983495055
|
|
web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.03361031713979665
|
|
web_nlg_en,4,median,rouge2_fmeasure,0.03361031713979665
|
|
web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.0336482487712469
|
|
web_nlg_en,5,median,rouge2_fmeasure,0.0336482487712469
|
|
web_nlg_en,5,average,multiple,0.03499818384354893
|
|
wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.013569083806173431
|
|
wiki_lingua_en,0,median,rouge2_fmeasure,0.013569083806173431
|
|
wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.014839503603430174
|
|
wiki_lingua_en,1,median,rouge2_fmeasure,0.014839503603430174
|
|
wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.014779019287405309
|
|
wiki_lingua_en,2,median,rouge2_fmeasure,0.014779019287405309
|
|
wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.015116060561354339
|
|
wiki_lingua_en,3,median,rouge2_fmeasure,0.015116060561354339
|
|
wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.006564722152989603
|
|
wiki_lingua_en,4,median,rouge2_fmeasure,0.006564722152989603
|
|
wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.001256549559807457
|
|
wiki_lingua_en,5,median,rouge2_fmeasure,0.001256549559807457
|
|
wiki_lingua_en,5,average,multiple,0.011020823161860052
|
|
|