from dataclasses import dataclass
from enum import Enum
@dataclass
class Task:
    """Describe a single benchmark entry as three plain strings.

    Attributes:
        benchmark: Identifier of the benchmark (e.g. ``"anli_r1"``).
        metric: Identifier of the metric reported for it (e.g. ``"acc"``).
        col_name: Human-readable label for the entry. Presumably used as a
            column header by the code that consumes this module -- confirm
            against the callers.
    """

    benchmark: str
    metric: str
    col_name: str
class Tasks(Enum):
    """Enumerate the benchmark tasks declared by this module.

    Each member's value is a ``Task`` built positionally from
    ``(benchmark, metric, col_name)``.
    """

    # NOTE(review): the benchmark keys ("anli_r1", "logiqa") do not obviously
    # correspond to the exam-style labels below -- confirm that they identify
    # the intended datasets and are not leftover placeholders.
    task0 = Task("anli_r1", "acc", "Korean Bar Exam (Lawyer)")
    task1 = Task(
        "logiqa",
        "acc_norm",
        "Senior Civil Service Examination(국가직 5급)",
    )
# Few-shot example count; zero here.
# NOTE(review): how this value is consumed is not visible in this file.
NUM_FEWSHOT = 0

# Title text, wrapped in a leading and a trailing newline.
TITLE = "\nDemo leaderboard\n"

# Short introduction text.
INTRODUCTION_TEXT = "Intro text"

# Markdown with the "How it works" and "Reproducibility" headings.
# NOTE(review): the text ends right after announcing the commands to run and
# lists none -- confirm whether content is missing.
LLM_BENCHMARKS_TEXT = (
    "## How it works\n"
    "## Reproducibility\n"
    "To reproduce our results, here is the commands you can run:\n"
)

# Markdown with submission guidance.
# NOTE(review): the lines after the heading read like editing instructions
# (roughly: "(omitted) / paste the long text here, taking care that no triple
# quotes appear") rather than final content -- confirm before publishing.
EVALUATION_QUEUE_TEXT = (
    "\n"
    "## Some good practices before submitting a model\n"
    "(중략)\n"
    "여기에 긴 텍스트를 붙여넣되,\n"
    "삼중 따옴표가 등장하지 않도록 주의하세요.\n"
)

# Label text for the citation snippet.
CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"

# Citation snippet body; currently a single newline with no citation in it.
CITATION_BUTTON_TEXT = "\n"