Spaces:
Running
Running
Joschka Strueber
committed on
Commit
·
bf2618d
1
Parent(s):
45b2347
[Add] ignore datasets that are not functional atm
Browse files- src/dataloading.py +9 -0
src/dataloading.py
CHANGED
@@ -86,6 +86,15 @@ def get_leaderboard_datasets(model_ids):
|
|
86 |
if model_datasets:
|
87 |
common_datasets = set.intersection(*model_datasets.values())
|
88 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
89 |
return sorted(common_datasets)
|
90 |
|
91 |
|
|
|
86 |
if model_datasets:
|
87 |
common_datasets = set.intersection(*model_datasets.values())
|
88 |
|
89 |
+
# Filter datasets that are not MCQ or currently do not work
|
90 |
+
ignore = ["_bbh_", "_gpqa_", "_math_", "_ifeval_"]
|
91 |
+
discard = []
|
92 |
+
for dataset in common_datasets:
|
93 |
+
for ignore_data in ignore:
|
94 |
+
if ignore_data in dataset:
|
95 |
+
discard.append(dataset)
|
96 |
+
common_datasets = [dataset for dataset in common_datasets if dataset not in discard]
|
97 |
+
|
98 |
return sorted(common_datasets)
|
99 |
|
100 |
|