Added categories to `tasks_metadata.json`
- .gitignore +21 -0
- app.py +2 -2
- compare_significance.py +1 -1
- server.py +2 -3
- tasks_metadata.json +280 -202
.gitignore
ADDED
@@ -0,0 +1,21 @@
+.eric6project/
+.eric7project/
+.ropeproject/
+.jedi/
+.directory/
+*.pyc
+*.pyo
+*.orig
+*.bak
+*.rej
+*~
+cur/
+tmp/
+__pycache__/
+__pypackages__
+*.DS_Store
+.pytest_cache/
+venv/
+.venv/
+env/
+.env/
app.py
CHANGED
@@ -8,7 +8,7 @@ from gradio_modal import Modal
 from content import (HEADER_MARKDOWN, LEADERBOARD_TAB_TITLE_MARKDOWN, SUBMISSION_TAB_TITLE_MARKDOWN,
                      MODAL_SUBMIT_MARKDOWN,
                      SUBMISSION_DETAILS_MARKDOWN, RANKING_AFTER_SUBMISSION_MARKDOWN, MORE_DETAILS_MARKDOWN)
-from server import LeaderboardServer, categories
+from server import LeaderboardServer
 
 leaderboard_server = LeaderboardServer()
 
@@ -157,7 +157,7 @@ with (gr.Blocks(theme=gr.themes.Soft(text_size=text_md), css=custom_css) as main
     with gr.Tab("Overall"):
         results_table = gr.DataFrame(leaderboard_server.get_leaderboard(), interactive=False, label=None,
                                      visible=True, elem_classes="leaderboard-table")
-    for c in categories:
+    for c in leaderboard_server.tasks_categories:
         with gr.Tab(c):
             results_table = gr.DataFrame(leaderboard_server.get_leaderboard(), interactive=False, label=None,
                                          visible=True, elem_classes="leaderboard-table")
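For context, a minimal sketch of the tab layout this change produces, assuming a `LeaderboardServer`-like object exposing the new `tasks_categories` set and a `get_leaderboard()` DataFrame; the `FakeServer` stub below is hypothetical, only there to make the sketch self-contained:

```python
# Sketch of the per-category tabs added by this commit, with a stub
# server so the snippet runs on its own.
import gradio as gr
import pandas as pd


class FakeServer:  # hypothetical stand-in for server.LeaderboardServer
    tasks_categories = {"NLI", "Sentiment", "Knowledge"}

    def get_leaderboard(self):
        return pd.DataFrame({"model": ["A", "B"], "score": [0.9, 0.8]})


leaderboard_server = FakeServer()

with gr.Blocks() as demo:
    with gr.Tab("Overall"):
        gr.DataFrame(leaderboard_server.get_leaderboard(), interactive=False)
    # One extra tab per category. Sets are unordered, so sorted() gives a
    # stable tab order; the commit itself iterates the raw set.
    for c in sorted(leaderboard_server.tasks_categories):
        with gr.Tab(c):
            gr.DataFrame(leaderboard_server.get_leaderboard(), interactive=False)

demo.launch()
```

Note that each category tab still renders the same overall leaderboard in this commit; per-category filtering of the results is not part of this change.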
compare_significance.py
CHANGED
@@ -176,7 +176,7 @@ def read_json(file_path):
     with open(METADATA_FILE, "r") as f:
         metadata = json.load(f)
 
-    all_tasks = list(metadata
+    all_tasks = list(metadata.keys())
     all_missing_tasks = []
     for task in all_tasks:
         if task not in data:
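A minimal sketch of the fixed check, with a hypothetical `data` dict standing in for the parsed results file the real script reads:

```python
# With the flat metadata layout, task IDs are the top-level keys of
# tasks_metadata.json, so list(metadata.keys()) enumerates them directly.
import json

METADATA_FILE = "./tasks_metadata.json"

with open(METADATA_FILE, "r") as f:
    metadata = json.load(f)

data = {"benczechmark_summarization": {"acc": 0.42}}  # hypothetical results

all_tasks = list(metadata.keys())
all_missing_tasks = [task for task in all_tasks if task not in data]
print(f"missing {len(all_missing_tasks)} of {len(all_tasks)} tasks")
```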
server.py
CHANGED
@@ -18,8 +18,6 @@ REPO = f"{ORG}/LLM_benchmark_data"
 HF_TOKEN = os.environ.get("HF_TOKEN")
 TASKS_METADATA_PATH = "./tasks_metadata.json"
 
-categories = ['Czech Math Reasoning', 'General Reasoning', 'Historical', 'Knowledge', 'Language Modeling', 'NER', 'NLI', 'Sentiment', 'Summarization', 'Syntactical Reasoning', 'Topic Classification']
-
 class LeaderboardServer:
     def __init__(self):
         self.server_address = REPO
@@ -27,7 +25,8 @@ class LeaderboardServer:
         self.local_leaderboard = snapshot_download(self.server_address, repo_type=self.repo_type, token=HF_TOKEN,
                                                    local_dir="./")
         self.submisssion_id_to_file = {}  # Map submission ids to file paths
-        self.tasks_metadata = json.load(open(TASKS_METADATA_PATH))
+        self.tasks_metadata = json.load(open(TASKS_METADATA_PATH))
+        self.tasks_categories = {self.tasks_metadata[task]["category"] for task in self.tasks_metadata}
         self.submission_ids = set()
         self.fetch_existing_models()
         self.tournament_results = self.load_tournament_results()
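The derived set replaces the removed hard-coded `categories` list; notably, 'Historical' and 'Topic Classification' from that list have no tasks in the new metadata, so deriving the set from the file keeps the categories in sync with the tasks that actually exist. A minimal sketch of the derivation, assuming only that every entry in `tasks_metadata.json` carries a `"category"` field (which the new file below does guarantee):

```python
# Sketch of the new category derivation; mirrors the line added to
# LeaderboardServer.__init__, shown outside the class for brevity.
import json

TASKS_METADATA_PATH = "./tasks_metadata.json"

with open(TASKS_METADATA_PATH) as f:
    tasks_metadata = json.load(f)

# The set comprehension deduplicates per-task categories, so each
# category appears once no matter how many tasks share it.
tasks_categories = {meta["category"] for meta in tasks_metadata.values()}
print(sorted(tasks_categories))
```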
tasks_metadata.json
CHANGED
@@ -1,204 +1,282 @@
 {
+    "benczechmark_propaganda_argumentace": {
+        "name": "Propaganda - Argumentace",
+        "source_url": "https://huggingface.co/datasets/CZLC/propaganda_argumentace",
+        "short_name": "P-Argumentace",
+        "category": "NLI",
+        "abbreviation": "P-ARG"
+    },
+    "benczechmark_propaganda_fabulace": {
+        "name": "Propaganda - Fabulace",
+        "source_url": "https://huggingface.co/datasets/CZLC/propaganda_fabulace",
+        "short_name": "P-Fabulace",
+        "category": "NLI",
+        "abbreviation": "P-FAB"
+    },
+    "benczechmark_propaganda_nazor": {
+        "name": "Propaganda - Nazor",
+        "source_url": "https://huggingface.co/datasets/CZLC/propaganda_nazor",
+        "short_name": "P-Názor",
+        "category": "NLI",
+        "abbreviation": "P-NAZOR"
+    },
+    "benczechmark_propaganda_strach": {
+        "name": "Propaganda - Strach",
+        "source_url": "https://huggingface.co/datasets/CZLC/propaganda_strach",
+        "short_name": "P-Strach",
+        "category": "NLI",
+        "abbreviation": "P-STCH"
+    },
+    "benczechmark_propaganda_zamereni": {
+        "name": "Propaganda - Zamereni",
+        "source_url": "https://huggingface.co/datasets/CZLC/propaganda_zamereni",
+        "short_name": "P-Zaměření",
+        "category": "NLI",
+        "abbreviation": "P-MER"
+    },
+    "benczechmark_propaganda_demonizace": {
+        "name": "Propaganda - Demonizace",
+        "source_url": "https://huggingface.co/datasets/CZLC/propaganda_demonizace",
+        "short_name": "P-Demonizace",
+        "category": "NLI",
+        "abbreviation": "P-DEMON"
+    },
+    "benczechmark_propaganda_lokace": {
+        "name": "Propaganda - Lokace",
+        "source_url": "https://huggingface.co/datasets/CZLC/propaganda_lokace",
+        "short_name": "P-Lokace",
+        "category": "NLI",
+        "abbreviation": "P-LOK"
+    },
+    "benczechmark_propaganda_relativizace": {
+        "name": "Propaganda - Relativizace",
+        "source_url": "https://huggingface.co/datasets/CZLC/propaganda_relativizace",
+        "short_name": "P-Relativizace",
+        "category": "NLI",
+        "abbreviation": "P-REL"
+    },
+    "benczechmark_propaganda_vina": {
+        "name": "Propaganda - Vina",
+        "source_url": "https://huggingface.co/datasets/CZLC/propaganda_vina",
+        "short_name": "P-Vina",
+        "category": "NLI",
+        "abbreviation": "P-VINA"
+    },
+    "benczechmark_propaganda_zanr": {
+        "name": "Propaganda - Zanr",
+        "source_url": "https://huggingface.co/datasets/CZLC/propaganda_zanr",
+        "short_name": "P-Žánr",
+        "category": "NLI",
+        "abbreviation": "P-ZANR"
+    },
+    "benczechmark_propaganda_emoce": {
+        "name": "Propaganda - Emoce",
+        "source_url": "https://huggingface.co/datasets/CZLC/propaganda_emoce",
+        "short_name": "P-Emoce",
+        "category": "NLI",
+        "abbreviation": "P-EMOCE"
+    },
+    "benczechmark_propaganda_nalepkovani": {
+        "name": "Propaganda - Nalepkovani",
+        "source_url": "https://huggingface.co/datasets/CZLC/propaganda_nalepkovani",
+        "short_name": "P-Nalepkování",
+        "category": "NLI",
+        "abbreviation": "P-LEP"
+    },
+    "benczechmark_propaganda_rusko": {
+        "name": "Propaganda - Rusko",
+        "source_url": "https://huggingface.co/datasets/CZLC/propaganda_rusko",
+        "short_name": "P-Rusko",
+        "category": "NLI",
+        "abbreviation": "P-RUS"
+    },
+    "benczechmark_sentiment_mall": {
+        "name": "CzechSentiment MALL",
+        "source_url": "https://huggingface.co/datasets/CZLC/mall_sentiment_balanced",
+        "short_name": "S-Mall",
+        "category": "Sentiment",
+        "abbreviation": "S-MALL"
+    },
+    "benczechmark_sentiment_fb": {
+        "name": "CzechSentiment FB",
+        "source_url": "https://huggingface.co/datasets/CZLC/fb_sentiment_balanced",
+        "short_name": "S-FB",
+        "category": "Sentiment",
+        "abbreviation": "S-FB"
+    },
+    "benczechmark_sentiment_csfd": {
+        "name": "CzechSentiment CSFD",
+        "source_url": "https://huggingface.co/datasets/CZLC/csfd_sentiment_balanced",
+        "short_name": "S-CSFD",
+        "category": "Sentiment",
+        "abbreviation": "S-CSFD"
+    },
+    "benczechmark_summarization": {
+        "name": "SUMECZECH",
+        "source_url": "https://huggingface.co/datasets/CZLC/sumeczech_downsampled",
+        "short_name": "Summarization",
+        "category": "Summarization",
+        "abbreviation": "SUM"
+    },
+    "benczechmark_grammarerrorcorrection": {
+        "name": "GrammarErrorCorrection",
+        "source_url": "https://huggingface.co/datasets/CZLC/cs_gec",
+        "short_name": "Grammar Error Correction",
+        "category": "Syntactical Reasoning",
+        "abbreviation": "GEC"
+    },
+    "benczechmark_cs_naturalquestions": {
+        "name": "NaturalQuestions-CZ",
+        "source_url": "https://huggingface.co/datasets/CZLC/cs_naturalquestions",
+        "short_name": "CS Natural Questions",
+        "category": "Knowledge",
+        "abbreviation": "NQ"
+    },
+    "benczechmark_cs_sqad32": {
+        "name": "SQAD3.2",
+        "source_url": "https://huggingface.co/datasets/CZLC/SQAD_3.2",
+        "short_name": "CS SQAD 3.2",
+        "category": "Knowledge",
+        "abbreviation": "SQAD32"
+    },
+    "benczechmark_cs_triviaQA": {
+        "name": "TriviaQA-CZ",
+        "source_url": "https://huggingface.co/datasets/CZLC/cs_triviaqa",
+        "short_name": "CS TriviaQA",
+        "category": "Knowledge",
+        "abbreviation": "TQA"
+    },
+    "benczechmark_csfever_nli": {
+        "name": "CSFEVER",
+        "source_url": "https://huggingface.co/datasets/CZLC/ctu-aic/csfever_nli",
+        "short_name": "CSFever NLI",
+        "category": "NLI",
+        "abbreviation": "CFR"
+    },
+    "benczechmark_ctkfacts_nli": {
+        "name": "CTKFACTS",
+        "source_url": "https://huggingface.co/datasets/CZLC/ctu-aic/ctkfacts_nli",
+        "short_name": "CTKFacts NLI",
+        "category": "NLI",
+        "abbreviation": "CTK"
+    },
+    "benczechmark_cs_ner": {
+        "name": "CZECH NER CORPUS 2.0",
+        "source_url": "https://huggingface.co/datasets/CZLC/fewshot-goes-multilingual/cs_czech-named-entity-corpus_2.0",
+        "short_name": "CS NER",
+        "category": "NER",
+        "abbreviation": "CZNERC"
+    },
+    "benczechmark_hellaswag": {
+        "name": "HellaSwag-CZ",
+        "source_url": "https://huggingface.co/datasets/CZLC/cs_hellaswag",
+        "short_name": "HellaSwag",
+        "category": "Language Modeling",
+        "abbreviation": "HASG"
+    },
+    "benczechmark_histcorpus": {
+        "name": "Historical Corpus",
+        "source_url": "https://huggingface.co/datasets/CZLC/benczechmark_histcorpus",
+        "short_name": "HistCorpus",
+        "category": "Language Modeling",
+        "abbreviation": "HIST"
+    },
+    "benczechmark_klokan_qa": {
+        "name": "Klokan QA",
+        "source_url": "https://huggingface.co/datasets/hynky/klokan-qa",
+        "short_name": "Klokan QA",
+        "category": "Czech Math Reasoning",
+        "abbreviation": "KQA"
+    },
+    "benczechmark_cs_court_decisions_ner": {
+        "name": "Czech Court Decisions",
+        "source_url": "https://huggingface.co/datasets/CZLC/fewshot-goes-multilingual/cs_czech-court-decisions-ner",
+        "short_name": "CS Court Decisions NER",
+        "category": "NER",
+        "abbreviation": "CCDNER"
+    },
+    "benczechmark_umimeto_biology": {
+        "name": "Umimeto.cz - Biology",
+        "source_url": "https://huggingface.co/datasets/CZLC/umimeto-biology",
+        "short_name": "Umimeto.cz - Biology",
+        "category": "General Reasoning",
+        "abbreviation": "UT-BIO"
+    },
+    "benczechmark_umimeto_chemistry": {
+        "name": "Umimeto.cz - Chemistry",
+        "source_url": "https://huggingface.co/datasets/CZLC/umimeto-chemistry",
+        "short_name": "Umimeto.cz - Chemistry",
+        "category": "General Reasoning",
+        "abbreviation": "UT-CHEM"
+    },
+    "benczechmark_umimeto_czech": {
+        "name": "Umimeto.cz - Czech Language",
+        "source_url": "https://huggingface.co/datasets/CZLC/umimeto-czech",
+        "short_name": "Umimeto.cz - Czech",
+        "category": "General Reasoning",
+        "abbreviation": "UT-CZEL"
+    },
+    "benczechmark_umimeto_history": {
+        "name": "Umimeto.cz - History",
+        "source_url": "https://huggingface.co/datasets/CZLC/umimeto-history",
+        "short_name": "Umimeto.cz - History",
+        "category": "General Reasoning",
+        "abbreviation": "UT-HIST"
+    },
+    "benczechmark_umimeto_informatics": {
+        "name": "Umimeto.cz - Informatics",
+        "source_url": "https://huggingface.co/datasets/CZLC/umimeto-informatics",
+        "short_name": "Umimeto.cz - Informatics",
+        "category": "General Reasoning",
+        "abbreviation": "UT-IT"
+    },
+    "benczechmark_umimeto_math": {
+        "name": "Umimeto.cz - Math",
+        "source_url": "https://huggingface.co/datasets/CZLC/umimeto-math",
+        "short_name": "Umimeto.cz - Math",
+        "category": "Czech Math Reasoning",
+        "abbreviation": "UT-MATH"
+    },
+    "benczechmark_umimeto_physics": {
+        "name": "Umimeto.cz - Physics",
+        "source_url": "https://huggingface.co/datasets/CZLC/umimeto-physics",
+        "short_name": "Umimeto.cz - Physics",
+        "category": "General Reasoning",
+        "abbreviation": "UT-PHYS"
+    },
+    "benczechmark_cermat_czmath_mc": {
+        "name": "CERMAT - Czech Math - MC",
+        "source_url": "https://huggingface.co/datasets/CZLC/cermat_math_mc",
+        "short_name": "Cermat Czech Math MC",
+        "category": "Czech Math Reasoning",
+        "abbreviation": "CCM-MC"
+    },
+    "benczechmark_cermat_czmath_open": {
+        "name": "CERMAT - Czech Math - OPEN",
+        "source_url": "https://huggingface.co/datasets/CZLC/cermat_math_open",
+        "short_name": "Cermat Czech Math Open",
+        "category": "Czech Math Reasoning",
+        "abbreviation": "CCM-OPEN"
+    },
+    "benczechmark_cermat_czech_tf": {
+        "name": "CERMAT - Czech Language - TF",
+        "source_url": "https://huggingface.co/datasets/CZLC/cermat_czech_tf",
+        "short_name": "Cermat Czech Language TF",
+        "category": "General Reasoning",
+        "abbreviation": "CCL-TF"
+    },
+    "benczechmark_cermat_czech_mc": {
+        "name": "CERMAT - Czech Language - MC",
+        "source_url": "https://huggingface.co/datasets/CZLC/cermat_czech_mc",
+        "short_name": "Cermat Czech Language MC",
+        "category": "General Reasoning",
+        "abbreviation": "CCL-MC"
+    },
+    "benczechmark_cermat_czech_open": {
+        "name": "CERMAT - Czech Language - OPEN",
+        "source_url": "https://huggingface.co/datasets/CZLC/cermat_czech_open",
+        "short_name": "Cermat Czech Language Open",
+        "category": "General Reasoning",
+        "abbreviation": "CCL-OPEN"
     }
-}
+}
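As a usage note, a hypothetical helper (not part of this commit) showing how the new `category` field can group task IDs, e.g. for per-category leaderboard filtering later:

```python
# Hypothetical helper: bucket task IDs by their "category" field.
import json
from collections import defaultdict

with open("tasks_metadata.json") as f:
    tasks_metadata = json.load(f)

tasks_by_category = defaultdict(list)
for task_id, meta in tasks_metadata.items():
    tasks_by_category[meta["category"]].append(task_id)

for category, task_ids in sorted(tasks_by_category.items()):
    print(f"{category}: {len(task_ids)} tasks")
```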