Update evals
Browse files
app.py
CHANGED
@@ -49,7 +49,10 @@ def get_leaderboard_df(merge_values: bool = True):
|
|
49 |
value = data["results"][first_result_key]["acc_norm"]
|
50 |
# BBH has several metrics but we report just the average one
|
51 |
elif task.lower() == "bbh":
|
52 |
-
value = [
|
|
|
|
|
|
|
53 |
else:
|
54 |
first_metric_key = next(
|
55 |
iter(data["results"][first_result_key])
|
|
|
49 |
value = data["results"][first_result_key]["acc_norm"]
|
50 |
# BBH has several metrics but we report just the average one
|
51 |
elif task.lower() == "bbh":
|
52 |
+
value = data["results"]["all"]["acc"] if "all" in data["results"] else None
|
53 |
+
# AGIEval reports acc_norm
|
54 |
+
elif task.lower() == "agieval":
|
55 |
+
value = data["results"]["all"]["acc_norm"]
|
56 |
else:
|
57 |
first_metric_key = next(
|
58 |
iter(data["results"][first_result_key])
|