tathagataraha committed on
Commit
faceee1
·
1 Parent(s): 553b217

[MODIFY] Cross-evaluation framework column names

Browse files
Files changed (2) hide show
  1. src/about.py +12 -12
  2. src/populate.py +3 -3
src/about.py CHANGED
@@ -64,10 +64,10 @@ class MedicalSummarizationColumn:
64
  col_name: str
65
 
66
  class MedicalSummarizationColumns(Enum):
67
- medical_summarization_column0 = MedicalSummarizationColumn("brief", "score", "Brief Score")
68
- medical_summarization_column1 = MedicalSummarizationColumn("coverage", "score", "Coverage Score")
69
- medical_summarization_column2 = MedicalSummarizationColumn("conform", "score", "Conform Score")
70
- medical_summarization_column3 = MedicalSummarizationColumn("fact", "score", "Fact Score")
71
 
72
  @dataclass
73
  class ACIColumn:
@@ -76,10 +76,10 @@ class ACIColumn:
76
  col_name: str
77
 
78
  class ACIColumns(Enum):
79
- aci_column0 = ACIColumn("brief", "score", "Brief Score")
80
- aci_column1 = ACIColumn("coverage", "score", "Coverage Score")
81
- aci_column2 = ACIColumn("conform", "score", "Conform Score")
82
- aci_column3 = ACIColumn("fact", "score", "Fact Score")
83
 
84
  @dataclass
85
  class SOAPColumn:
@@ -88,10 +88,10 @@ class SOAPColumn:
88
  col_name: str
89
 
90
  class SOAPColumns(Enum):
91
- soap_column0 = SOAPColumn("brief", "score", "Brief Score")
92
- soap_column1 = SOAPColumn("coverage", "score", "Coverage Score")
93
- soap_column2 = SOAPColumn("conform", "score", "Conform Score")
94
- soap_column3 = SOAPColumn("fact", "score", "Fact Score")
95
 
96
  NUM_FEWSHOT = 0 # Change with your few shot
97
  # ---------------------------------------------------
 
64
  col_name: str
65
 
66
  class MedicalSummarizationColumns(Enum):
67
+ medical_summarization_column0 = MedicalSummarizationColumn("coverage", "score", "Coverage")
68
+ medical_summarization_column1 = MedicalSummarizationColumn("conform", "score", "Conformity")
69
+ medical_summarization_column2 = MedicalSummarizationColumn("fact", "score", "Consistency")
70
+ medical_summarization_column3 = MedicalSummarizationColumn("brief", "score", "Conciseness")
71
 
72
  @dataclass
73
  class ACIColumn:
 
76
  col_name: str
77
 
78
  class ACIColumns(Enum):
79
+ aci_column0 = ACIColumn("coverage", "score", "Coverage")
80
+ aci_column1 = ACIColumn("conform", "score", "Conformity")
81
+ aci_column2 = ACIColumn("fact", "score", "Consistency")
82
+ aci_column3 = ACIColumn("brief", "score", "Conciseness")
83
 
84
  @dataclass
85
  class SOAPColumn:
 
88
  col_name: str
89
 
90
  class SOAPColumns(Enum):
91
+ soap_column0 = SOAPColumn("coverage", "score", "Coverage")
92
+ soap_column1 = SOAPColumn("conform", "score", "Conformity")
93
+ soap_column2 = SOAPColumn("fact", "score", "Consistency")
94
+ soap_column3 = SOAPColumn("brief", "score", "Conciseness")
95
 
96
  NUM_FEWSHOT = 0 # Change with your few shot
97
  # ---------------------------------------------------
src/populate.py CHANGED
@@ -25,11 +25,11 @@ def get_leaderboard_df(results_path: str, requests_path: str, cols: list, benchm
25
  elif subset == "open_ended":
26
  df = df.sort_values(by=["ELO"], ascending=False)
27
  elif subset == "medical_summarization":
28
- df = df.sort_values(by=["Coverage Score"], ascending=False)
29
  elif subset == "aci":
30
- df = df.sort_values(by=["Coverage Score"], ascending=False)
31
  elif subset == "soap":
32
- df = df.sort_values(by=["Coverage Score"], ascending=False)
33
  cols = list(set(df.columns).intersection(set(cols)))
34
  df = df[cols].round(decimals=2)
35
  # filter out if any of the benchmarks have not been produced
 
25
  elif subset == "open_ended":
26
  df = df.sort_values(by=["ELO"], ascending=False)
27
  elif subset == "medical_summarization":
28
+ df = df.sort_values(by=["Coverage"], ascending=False)
29
  elif subset == "aci":
30
+ df = df.sort_values(by=["Coverage"], ascending=False)
31
  elif subset == "soap":
32
+ df = df.sort_values(by=["Coverage"], ascending=False)
33
  cols = list(set(df.columns).intersection(set(cols)))
34
  df = df[cols].round(decimals=2)
35
  # filter out if any of the benchmarks have not been produced