lewtun HF Staff committed on
Commit
88fd41c
·
1 Parent(s): 486aa44

Update evals

Browse files
Files changed (1) hide show
  1. app.py +4 -1
app.py CHANGED
@@ -49,7 +49,10 @@ def get_leaderboard_df(merge_values: bool = True):
49
  value = data["results"][first_result_key]["acc_norm"]
50
  # BBH has several metrics but we report just the average one
51
  elif task.lower() == "bbh":
52
- value = [v["qem"] for k, v in data["results"].items() if "_average" in k.lower()][0]
 
 
 
53
  else:
54
  first_metric_key = next(
55
  iter(data["results"][first_result_key])
 
49
  value = data["results"][first_result_key]["acc_norm"]
50
  # BBH has several metrics but we report just the average one
51
  elif task.lower() == "bbh":
52
+ value = data["results"]["all"]["acc"] if "all" in data["results"] else None
53
+ # AGIEval reports acc_norm
54
+ elif task.lower() == "agieval":
55
+ value = data["results"]["all"]["acc_norm"]
56
  else:
57
  first_metric_key = next(
58
  iter(data["results"][first_result_key])