from dataclasses import dataclass
from enum import Enum


@dataclass
class Task:
    """Describe a single benchmark entry.

    Attributes:
        benchmark: Benchmark identifier, e.g. ``"anli_r1"``.
        metric: Metric identifier for that benchmark, e.g. ``"acc"``.
        col_name: Human-readable label for the entry; presumably the
            column header shown to users -- confirm against the caller.
    """

    benchmark: str
    metric: str
    col_name: str


class Tasks(Enum):
    """Enumerate the benchmark tasks defined for this module.

    Each member's value is a ``Task`` built positionally as
    ``Task(benchmark, metric, col_name)``.
    """

    task0 = Task("anli_r1", "acc", "Korean Bar Exam (Lawyer)")
    task1 = Task(
        "logiqa",
        "acc_norm",
        "Senior Civil Service Examination(국가직 5급)",
    )


# Few-shot setting; presumably the number of in-context examples used
# when evaluating -- confirm against the evaluation code.
NUM_FEWSHOT = 0

# HTML heading carrying the page title.
TITLE = """<h1 align="center" id="space-title">Demo leaderboard</h1>"""

# Short introductory text.
INTRODUCTION_TEXT = """Intro text"""

# Markdown text with "How it works" and "Reproducibility" sections.
# The backslash right after the opening quotes keeps the string from
# starting with a newline.
LLM_BENCHMARKS_TEXT = """\
## How it works
## Reproducibility
To reproduce our results, here is the commands you can run:
"""

# Markdown text with good-practice notes for model submitters.
# The Korean lines are placeholder guidance: "(omitted)", then "paste the
# long text here, but make sure no triple quotes appear in it".
EVALUATION_QUEUE_TEXT = """
## Some good practices before submitting a model
(중략)
여기에 긴 텍스트를 붙여넣되,
삼중 따옴표가 등장하지 않도록 주의하세요.
"""

# Label text inviting the user to copy the citation snippet.
CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"

# Citation snippet; currently holds only a newline.
CITATION_BUTTON_TEXT = """
"""