Adam Jirkovsky
committed on
Commit
·
54b05ee
1
Parent(s):
6bebd55
Revert header changes
Browse files
- app.py +1 -1
- src/display/utils.py +24 -25
app.py
CHANGED
@@ -215,7 +215,7 @@ with demo:
|
|
215 |
+ shown_columns.value
|
216 |
|
217 |
],
|
218 |
-
headers=[c.
|
219 |
datatype=TYPES,
|
220 |
elem_id="leaderboard-table",
|
221 |
interactive=False,
|
|
|
215 |
+ shown_columns.value
|
216 |
|
217 |
],
|
218 |
+
headers=[c.name for c in fields(AutoEvalColumn) if c.never_hidden] + shown_columns.value,
|
219 |
datatype=TYPES,
|
220 |
elem_id="leaderboard-table",
|
221 |
interactive=False,
|
src/display/utils.py
CHANGED
@@ -16,7 +16,6 @@ def fields(raw_class):
|
|
16 |
@dataclass
|
17 |
class ColumnContent:
|
18 |
name: str
|
19 |
-
display_name: str
|
20 |
type: str
|
21 |
displayed_by_default: bool
|
22 |
hidden: bool = False
|
@@ -48,24 +47,24 @@ auto_eval_column_dict.append(["revision", ColumnContent, ColumnContent("Model sh
|
|
48 |
auto_eval_column_dict.append(["dummy", ColumnContent, ColumnContent("model_name_for_query", "str", False, dummy=True)])
|
49 |
"""
|
50 |
|
51 |
-
auto_eval_column_dict.append(["eval_name", ColumnContent, ColumnContent("eval_name", "
|
52 |
-
auto_eval_column_dict.append(["precision", ColumnContent, ColumnContent("precision", "
|
53 |
-
auto_eval_column_dict.append(["hf_model_id", ColumnContent, ColumnContent("hf_model_id", "
|
54 |
-
auto_eval_column_dict.append(["agree_cs", ColumnContent, ColumnContent("agree_cs", "
|
55 |
-
auto_eval_column_dict.append(["anli_cs", ColumnContent, ColumnContent("anli_cs", "
|
56 |
-
auto_eval_column_dict.append(["arc_challenge_cs", ColumnContent, ColumnContent("arc_challenge_cs", "
|
57 |
-
auto_eval_column_dict.append(["arc_easy_cs", ColumnContent, ColumnContent("arc_easy_cs", "
|
58 |
-
auto_eval_column_dict.append(["belebele_cs", ColumnContent, ColumnContent("belebele_cs", "
|
59 |
-
auto_eval_column_dict.append(["ctkfacts_cs", ColumnContent, ColumnContent("ctkfacts_cs", "
|
60 |
-
auto_eval_column_dict.append(["czechnews_cs", ColumnContent, ColumnContent("czechnews_cs", "
|
61 |
-
auto_eval_column_dict.append(["fb_comments_cs", ColumnContent, ColumnContent("fb_comments_cs", "
|
62 |
-
auto_eval_column_dict.append(["gsm8k_cs", ColumnContent, ColumnContent("gsm8k_cs", "
|
63 |
-
auto_eval_column_dict.append(["klokanek_cs", ColumnContent, ColumnContent("klokanek_cs", "
|
64 |
-
auto_eval_column_dict.append(["mall_reviews_cs", ColumnContent, ColumnContent("mall_reviews_cs", "
|
65 |
-
auto_eval_column_dict.append(["mmlu_cs", ColumnContent, ColumnContent("mmlu_cs", "
|
66 |
-
auto_eval_column_dict.append(["sqad_cs", ColumnContent, ColumnContent("sqad_cs", "
|
67 |
-
auto_eval_column_dict.append(["subjectivity_cs", ColumnContent, ColumnContent("subjectivity_cs", "
|
68 |
-
auto_eval_column_dict.append(["truthfulqa_cs", ColumnContent, ColumnContent("truthfulqa_cs", "
|
69 |
|
70 |
|
71 |
# We use make dataclass to dynamically fill the scores from Tasks
|
@@ -75,12 +74,12 @@ AutoEvalColumn = make_dataclass("AutoEvalColumn", auto_eval_column_dict, frozen=
|
|
75 |
## For the queue columns in the submission tab
|
76 |
@dataclass(frozen=True)
|
77 |
class EvalQueueColumn: # Queue column
|
78 |
-
model = ColumnContent("model", "
|
79 |
-
revision = ColumnContent("revision", "
|
80 |
-
private = ColumnContent("private", "
|
81 |
-
precision = ColumnContent("precision", "
|
82 |
-
weight_type = ColumnContent("weight_type", "
|
83 |
-
status = ColumnContent("status", "
|
84 |
|
85 |
|
86 |
## All the model information that we might need
|
|
|
16 |
@dataclass
|
17 |
class ColumnContent:
|
18 |
name: str
|
|
|
19 |
type: str
|
20 |
displayed_by_default: bool
|
21 |
hidden: bool = False
|
|
|
47 |
auto_eval_column_dict.append(["dummy", ColumnContent, ColumnContent("model_name_for_query", "str", False, dummy=True)])
|
48 |
"""
|
49 |
|
50 |
+
auto_eval_column_dict.append(["eval_name", ColumnContent, ColumnContent("eval_name", "str", True, never_hidden=True)])
|
51 |
+
auto_eval_column_dict.append(["precision", ColumnContent, ColumnContent("precision", "str", True)])
|
52 |
+
auto_eval_column_dict.append(["hf_model_id", ColumnContent, ColumnContent("hf_model_id", "str", True)])
|
53 |
+
auto_eval_column_dict.append(["agree_cs", ColumnContent, ColumnContent("agree_cs", "number", True)])
|
54 |
+
auto_eval_column_dict.append(["anli_cs", ColumnContent, ColumnContent("anli_cs", "number", True)])
|
55 |
+
auto_eval_column_dict.append(["arc_challenge_cs", ColumnContent, ColumnContent("arc_challenge_cs", "number", True)])
|
56 |
+
auto_eval_column_dict.append(["arc_easy_cs", ColumnContent, ColumnContent("arc_easy_cs", "number", True)])
|
57 |
+
auto_eval_column_dict.append(["belebele_cs", ColumnContent, ColumnContent("belebele_cs", "number", True)])
|
58 |
+
auto_eval_column_dict.append(["ctkfacts_cs", ColumnContent, ColumnContent("ctkfacts_cs", "number", True)])
|
59 |
+
auto_eval_column_dict.append(["czechnews_cs", ColumnContent, ColumnContent("czechnews_cs", "number", True)])
|
60 |
+
auto_eval_column_dict.append(["fb_comments_cs", ColumnContent, ColumnContent("fb_comments_cs", "number", True)])
|
61 |
+
auto_eval_column_dict.append(["gsm8k_cs", ColumnContent, ColumnContent("gsm8k_cs", "number", True)])
|
62 |
+
auto_eval_column_dict.append(["klokanek_cs", ColumnContent, ColumnContent("klokanek_cs", "number", True)])
|
63 |
+
auto_eval_column_dict.append(["mall_reviews_cs", ColumnContent, ColumnContent("mall_reviews_cs", "number", True)])
|
64 |
+
auto_eval_column_dict.append(["mmlu_cs", ColumnContent, ColumnContent("mmlu_cs", "number", True)])
|
65 |
+
auto_eval_column_dict.append(["sqad_cs", ColumnContent, ColumnContent("sqad_cs", "number", True)])
|
66 |
+
auto_eval_column_dict.append(["subjectivity_cs", ColumnContent, ColumnContent("subjectivity_cs", "number", True)])
|
67 |
+
auto_eval_column_dict.append(["truthfulqa_cs", ColumnContent, ColumnContent("truthfulqa_cs", "number", True)])
|
68 |
|
69 |
|
70 |
# We use make dataclass to dynamically fill the scores from Tasks
|
|
|
74 |
## For the queue columns in the submission tab
|
75 |
@dataclass(frozen=True)
|
76 |
class EvalQueueColumn: # Queue column
|
77 |
+
model = ColumnContent("model", "markdown", True)
|
78 |
+
revision = ColumnContent("revision", "str", True)
|
79 |
+
private = ColumnContent("private", "bool", True)
|
80 |
+
precision = ColumnContent("precision", "str", True)
|
81 |
+
weight_type = ColumnContent("weight_type", "str", "Original")
|
82 |
+
status = ColumnContent("status", "str", True)
|
83 |
|
84 |
|
85 |
## All the model information that we might need
|