xeon27
committed on
Commit
·
64ec699
1
Parent(s):
51b158d
Fix bug
Browse files
- src/populate.py +5 -1
src/populate.py
CHANGED
|
@@ -9,6 +9,8 @@ from src.display.formatting import has_no_nan_values, make_clickable_model
|
|
| 9 |
from src.display.utils import AutoEvalColumn, EvalQueueColumn
|
| 10 |
from src.leaderboard.read_evals import get_raw_eval_results
|
| 11 |
|
|
|
|
|
|
|
| 12 |
|
| 13 |
TASK_NAME_INVERSE_MAP = dict()
|
| 14 |
for task in Tasks:
|
|
@@ -51,9 +53,11 @@ def get_leaderboard_df(results_path: str, requests_path: str, cols: list, benchm
|
|
| 51 |
|
| 52 |
df = df.fillna(EMPTY_SYMBOL)
|
| 53 |
|
|
|
|
|
|
|
| 54 |
# make values clickable and link to log files
|
| 55 |
for col in benchmark_cols:
|
| 56 |
-
df[col] = df[[AutoEvalColumn.model.name, col]].apply(lambda x: f"[{x[col]}]({get_inspect_log_url(model_name=x[AutoEvalColumn.model.name].split('>')[1].split('<')[0], benchmark_name=TASK_NAME_INVERSE_MAP[col]['name'])})" if x[col] != EMPTY_SYMBOL else x[col], axis=1)
|
| 57 |
|
| 58 |
return df
|
| 59 |
|
|
|
|
| 9 |
from src.display.utils import AutoEvalColumn, EvalQueueColumn
|
| 10 |
from src.leaderboard.read_evals import get_raw_eval_results
|
| 11 |
|
| 12 |
+
from refactor_eval_results import MODEL_VERSION_MAP
|
| 13 |
+
|
| 14 |
|
| 15 |
TASK_NAME_INVERSE_MAP = dict()
|
| 16 |
for task in Tasks:
|
|
|
|
| 53 |
|
| 54 |
df = df.fillna(EMPTY_SYMBOL)
|
| 55 |
|
| 56 |
+
inverse_model_version_map = {v: k for k, v in MODEL_VERSION_MAP.items()}
|
| 57 |
+
|
| 58 |
# make values clickable and link to log files
|
| 59 |
for col in benchmark_cols:
|
| 60 |
+
df[col] = df[[AutoEvalColumn.model.name, col]].apply(lambda x: f"[{x[col]}]({get_inspect_log_url(model_name=inverse_model_version_map[x[AutoEvalColumn.model.name].split('>')[1].split('<')[0]], benchmark_name=TASK_NAME_INVERSE_MAP[col]['name'])})" if x[col] != EMPTY_SYMBOL else x[col], axis=1)
|
| 61 |
|
| 62 |
return df
|
| 63 |
|