Spaces:
Sleeping
Sleeping
Commit
·
a76ea88
1
Parent(s):
9d7de52
upgrade leaderboard
Browse files
app.py
CHANGED
@@ -802,10 +802,12 @@ def filter_by_model_type(df, selected_types):
|
|
802 |
|
803 |
def format_dataframe(df, dataset, sort_by='Kappa'):
    """Build the leaderboard table for one dataset.

    Keeps the 'Method' column plus every column of ``df`` whose name
    contains ``dataset``, renames each kept column to the text after its
    last underscore (names without an underscore are left unchanged), and
    returns the rows sorted in descending order of ``sort_by``.

    Args:
        df: Source DataFrame; must contain a 'Method' column.
        dataset: Substring used to pick the dataset's columns,
            e.g. "LLMJudge-DL2023".
        sort_by: Name (after renaming) of the column to sort on.
            Defaults to 'Kappa', the column the original code sorted by.

    Returns:
        A new, sorted DataFrame; ``df`` itself is not modified.

    Raises:
        KeyError: If 'Method' or ``sort_by`` is not among the columns.
    """
    # Debug output: dump the incoming frame.
    print(df)

    columns = ['Method'] + [col for col in df.columns if dataset in col]
    filtered_df = df[columns].copy()

    # split('_')[-1] already yields the whole name when there is no '_',
    # so no separate "has underscore" check is needed.
    filtered_df.columns = [col.split('_')[-1] for col in filtered_df.columns]

    # Debug output: dump the per-dataset frame before sorting.
    print(filtered_df)

    return filtered_df.sort_values(sort_by, ascending=False)
|
@@ -826,7 +828,8 @@ def update_tables(selected_types):
|
|
826 |
outputs = []
|
827 |
# for df in [filtered_df_full, filtered_df_10, filtered_df_human]:
|
828 |
for df in [filtered_df_full]:
|
829 |
-
for dataset in ['DL2023', 'MAG', 'PRIME']:
|
|
|
830 |
outputs.append(format_dataframe(df, f"LLMJudge-{dataset}"))
|
831 |
|
832 |
return outputs
|
|
|
802 |
|
803 |
def format_dataframe(df, dataset, sort_by='Kappa'):
    """Build the leaderboard table for one dataset.

    Keeps the 'Method' column plus every column of ``df`` whose name
    contains ``dataset``, renames each kept column to the text after its
    last underscore (names without an underscore are left unchanged), and
    returns the rows sorted in descending order of ``sort_by``.

    Args:
        df: Source DataFrame; must contain a 'Method' column.
        dataset: Substring used to pick the dataset's columns,
            e.g. "LLMJudge-DL2023".
        sort_by: Name (after renaming) of the column to sort on.
            Defaults to 'Kappa', the column the original code sorted by.

    Returns:
        A new, sorted DataFrame; ``df`` itself is not modified.

    Raises:
        KeyError: If 'Method' or ``sort_by`` is not among the columns.
    """
    # Debug output: dump the incoming frame, followed by a separator.
    print(df)
    print("----- *** ------")

    columns = ['Method'] + [col for col in df.columns if dataset in col]
    filtered_df = df[columns].copy()

    # split('_')[-1] already yields the whole name when there is no '_',
    # so no separate "has underscore" check is needed.
    filtered_df.columns = [col.split('_')[-1] for col in filtered_df.columns]

    # Debug output: dump the per-dataset frame, followed by a separator.
    print(filtered_df)
    print("----- ### ------")

    return filtered_df.sort_values(sort_by, ascending=False)
|
|
|
828 |
outputs = []
|
829 |
# for df in [filtered_df_full, filtered_df_10, filtered_df_human]:
|
830 |
for df in [filtered_df_full]:
|
831 |
+
# for dataset in ['DL2023', 'MAG', 'PRIME']:
|
832 |
+
for dataset in ['DL2023']:
|
833 |
outputs.append(format_dataframe(df, f"LLMJudge-{dataset}"))
|
834 |
|
835 |
return outputs
|