Commit
·
65a9e72
1
Parent(s):
d30a6b1
add tw tasks
Browse files - src/about.py +5 -3
src/about.py
CHANGED
@@ -12,8 +12,9 @@ class Task:
|
|
12 |
# ---------------------------------------------------
|
13 |
class Tasks(Enum):
|
14 |
# task_key in the json file, metric_key in the json file, name to display in the leaderboard
|
15 |
-
|
16 |
-
|
|
|
17 |
|
18 |
NUM_FEWSHOT = 0 # Change with your few shot
|
19 |
# ---------------------------------------------------
|
@@ -35,6 +36,7 @@ LLM_BENCHMARKS_TEXT = f"""
|
|
35 |
## Reproducibility
|
36 |
To reproduce our results, here is the commands you can run:
|
37 |
|
|
|
38 |
"""
|
39 |
|
40 |
EVALUATION_QUEUE_TEXT = """
|
@@ -69,7 +71,7 @@ If everything is done, check you can launch the EleutherAIHarness on your model
|
|
69 |
|
70 |
CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
|
71 |
CITATION_BUTTON_TEXT = r"""
|
72 |
-
@misc{open-
|
73 |
author = {Yen{-}Ting Lin, Yun{-}Nung Chen},
|
74 |
title = {Open TW-LLM Leaderboard},
|
75 |
year = {2024},
|
|
|
12 |
# ---------------------------------------------------
|
13 |
class Tasks(Enum):
|
14 |
# task_key in the json file, metric_key in the json file, name to display in the leaderboard
|
15 |
+
task2 = Task("tmlu", "acc", "TMLU")
|
16 |
+
task3 = Task("twllm_eval", "acc", "TW Truthful QA")
|
17 |
+
task4 = Task("tw_legal", "acc", "TW Legal Eval")
|
18 |
|
19 |
NUM_FEWSHOT = 0 # Change with your few shot
|
20 |
# ---------------------------------------------------
|
|
|
36 |
## Reproducibility
|
37 |
To reproduce our results, here is the commands you can run:
|
38 |
|
39 |
+
please checkout this command https://github.com/adamlin120/lm-evaluation-harness/blob/main/run_all.sh
|
40 |
"""
|
41 |
|
42 |
EVALUATION_QUEUE_TEXT = """
|
|
|
71 |
|
72 |
CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
|
73 |
CITATION_BUTTON_TEXT = r"""
|
74 |
+
@misc{open-tw-llm-leaderboard,
|
75 |
author = {Yen{-}Ting Lin, Yun{-}Nung Chen},
|
76 |
title = {Open TW-LLM Leaderboard},
|
77 |
year = {2024},
|