"""Static configuration and display text for the leaderboard.

Defines the evaluated tasks (``Tasks``), the few-shot setting, and the
text constants (title, introduction, benchmark description, submission
guidance, citation) exposed as module-level names.
"""

from dataclasses import dataclass
from enum import Enum


@dataclass
class Task:
    """Describe one evaluated task via three string fields."""

    # NOTE(review): presumably the task key used in the results files — confirm.
    benchmark: str
    # NOTE(review): presumably the metric key used in the results files — confirm.
    metric: str
    # NOTE(review): presumably the column header shown in the leaderboard — confirm.
    col_name: str


class Tasks(Enum):
    """Enumerate the tasks; each member's value is a ``Task``."""

    # NOTE(review): the benchmark keys ("anli_r1", "logiqa") do not obviously
    # correspond to the display names below — verify against the results data.
    task0 = Task("anli_r1", "acc", "Korean Bar Exam (Lawyer)")
    task1 = Task(
        "logiqa",
        "acc_norm",
        "Senior Civil Service Examination(국가직 5급)",
    )


NUM_FEWSHOT = 0

TITLE = """

Demo leaderboard

"""

INTRODUCTION_TEXT = """Intro text"""

# The trailing backslash on the opening line is a line continuation, so the
# text starts directly at the first heading with no leading newline.
LLM_BENCHMARKS_TEXT = """\
## How it works

## Reproducibility
To reproduce our results, here is the commands you can run:

"""

# Placeholder body: the text must not contain a triple double-quote, which
# would terminate the literal early.
EVALUATION_QUEUE_TEXT = """
## Some good practices before submitting a model

(중략)
여기에 긴 텍스트를 붙여넣되, 삼중 따옴표가 등장하지 않도록 주의하세요.
"""

CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
CITATION_BUTTON_TEXT = """
"""