Spaces:

CZLC
/

BenCzechMark

Running

App Files Community

idolezal committed on Sep 27, 2024

Commit

01c6f6b

1 Parent(s): 387e6ad

Removed contaminated tasks from "tasks_metadata.json"

Browse files

Files changed (1) hide show

tasks_metadata.json +0 -32

tasks_metadata.json CHANGED Viewed

@@ -127,14 +127,6 @@
     "abbreviation": "S-CSFD",
     "metric": "avg_mcauroc"
   },
-  "benczechmark_summarization": {
-    "name": "SUMECZECH",
-    "source_url": "https://huggingface.co/datasets/CZLC/sumeczech_downsampled",
-    "short_name": "Summarization",
-    "category": "Summarization",
-    "abbreviation": "SUM",
-    "metric": "rouge_raw_r2_mid_f"
-  },
   "benczechmark_grammarerrorcorrection": {
     "name": "GrammarErrorCorrection",
     "source_url": "https://huggingface.co/datasets/CZLC/cs_gec",
@@ -343,14 +335,6 @@
     "short_name": "Belebele",
     "metric": "acc"
   },
-  "benczechmark_czechnews": {
-    "name": "CZ-NEWS",
-    "source_url": "https://huggingface.co/datasets/davidadamczyk/czechbench_czech_news",
-    "abbreviation": "CZ-NEWS",
-    "category": "Topic Classification",
-    "short_name": "Czech News",
-    "metric": "avg_mcauroc"
-  },
   "benczechmark_subjectivity": {
     "name": "Subjectivity",
     "source_url": "https://huggingface.co/datasets/davidadamczyk/czechbench_subjectivity",
@@ -375,14 +359,6 @@
     "short_name": "CNC – Fiction",
     "metric": "word_perplexity"
   },
-  "benczechmark_capek": {
-    "name": "Czech National Corpus – Karel Čapek",
-    "source_url": "https://huggingface.co/datasets/CZLC/CNC_Capek",
-    "abbreviation": "CNC-CAP",
-    "category": "Language Modeling",
-    "short_name": "CNC – Čapek",
-    "metric": "word_perplexity"
-  },
   "benczechmark_correspondence": {
     "name": "Czech National Corpus – Correspondence",
     "source_url": "https://huggingface.co/datasets/CZLC/CNC_KSK",
@@ -399,14 +375,6 @@
     "short_name": "CNC – KHavlicek – HistNews",
     "metric": "word_perplexity"
   },
-  "benczechmark_speeches": {
-    "name": "Czech National Corpus – Speeches",
-    "source_url": "https://huggingface.co/datasets/CZLC/CNC_PrezPrejavy",
-    "abbreviation": "CNC-SPCH",
-    "category": "Language Modeling",
-    "short_name": "CNC – Speeches",
-    "metric": "word_perplexity"
-  },
   "benczechmark_spoken": {
     "name": "Czech National Corpus – Spoken",
     "source_url": "https://huggingface.co/datasets/CZLC/CNC_oral_ortofon",

     "abbreviation": "S-CSFD",
     "metric": "avg_mcauroc"
   },
   "benczechmark_grammarerrorcorrection": {
     "name": "GrammarErrorCorrection",
     "source_url": "https://huggingface.co/datasets/CZLC/cs_gec",
     "short_name": "Belebele",
     "metric": "acc"
   },
   "benczechmark_subjectivity": {
     "name": "Subjectivity",
     "source_url": "https://huggingface.co/datasets/davidadamczyk/czechbench_subjectivity",
     "short_name": "CNC – Fiction",
     "metric": "word_perplexity"
   },
   "benczechmark_correspondence": {
     "name": "Czech National Corpus – Correspondence",
     "source_url": "https://huggingface.co/datasets/CZLC/CNC_KSK",
     "short_name": "CNC – KHavlicek – HistNews",
     "metric": "word_perplexity"
   },
   "benczechmark_spoken": {
     "name": "Czech National Corpus – Spoken",
     "source_url": "https://huggingface.co/datasets/CZLC/CNC_oral_ortofon",