Commit
·
65a9e72
1
Parent(s):
d30a6b1
add tw tasks
Browse files
- src/about.py +5 -3
src/about.py
CHANGED
|
@@ -12,8 +12,9 @@ class Task:
|
|
| 12 |
# ---------------------------------------------------
|
| 13 |
class Tasks(Enum):
|
| 14 |
# task_key in the json file, metric_key in the json file, name to display in the leaderboard
|
| 15 |
-
|
| 16 |
-
|
|
|
|
| 17 |
|
| 18 |
NUM_FEWSHOT = 0 # Change with your few shot
|
| 19 |
# ---------------------------------------------------
|
|
@@ -35,6 +36,7 @@ LLM_BENCHMARKS_TEXT = f"""
|
|
| 35 |
## Reproducibility
|
| 36 |
To reproduce our results, here is the commands you can run:
|
| 37 |
|
|
|
|
| 38 |
"""
|
| 39 |
|
| 40 |
EVALUATION_QUEUE_TEXT = """
|
|
@@ -69,7 +71,7 @@ If everything is done, check you can launch the EleutherAIHarness on your model
|
|
| 69 |
|
| 70 |
CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
|
| 71 |
CITATION_BUTTON_TEXT = r"""
|
| 72 |
-
@misc{open-
|
| 73 |
author = {Yen{-}Ting Lin, Yun{-}Nung Chen},
|
| 74 |
title = {Open TW-LLM Leaderboard},
|
| 75 |
year = {2024},
|
|
|
|
| 12 |
# ---------------------------------------------------
|
| 13 |
class Tasks(Enum):
|
| 14 |
# task_key in the json file, metric_key in the json file, name to display in the leaderboard
|
| 15 |
+
task2 = Task("tmlu", "acc", "TMLU")
|
| 16 |
+
task3 = Task("twllm_eval", "acc", "TW Truthful QA")
|
| 17 |
+
task4 = Task("tw_legal", "acc", "TW Legal Eval")
|
| 18 |
|
| 19 |
NUM_FEWSHOT = 0 # Change with your few shot
|
| 20 |
# ---------------------------------------------------
|
|
|
|
| 36 |
## Reproducibility
|
| 37 |
To reproduce our results, here is the commands you can run:
|
| 38 |
|
| 39 |
+
please checkout this command https://github.com/adamlin120/lm-evaluation-harness/blob/main/run_all.sh
|
| 40 |
"""
|
| 41 |
|
| 42 |
EVALUATION_QUEUE_TEXT = """
|
|
|
|
| 71 |
|
| 72 |
CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
|
| 73 |
CITATION_BUTTON_TEXT = r"""
|
| 74 |
+
@misc{open-tw-llm-leaderboard,
|
| 75 |
author = {Yen{-}Ting Lin, Yun{-}Nung Chen},
|
| 76 |
title = {Open TW-LLM Leaderboard},
|
| 77 |
year = {2024},
|