jbnayahu committed on
Commit
f94bfef
·
1 Parent(s): 35a3872

add Airbench

Browse files

Signed-off-by: Jonathan Bnayahu <[email protected]>

Files changed (1) hide show
  1. app.py +3 -10
app.py CHANGED
@@ -9,7 +9,7 @@ from datetime import datetime
9
 
10
 
11
  st.set_page_config(
12
- page_title="BenchBench",
13
  page_icon="🏋️‍♂️",
14
  layout="wide",
15
  initial_sidebar_state="auto",
@@ -29,20 +29,13 @@ st.set_page_config(
29
  # )
30
 
31
  holistic_scenarios = [
32
- "Helm Lite",
33
- "HF OpenLLM v2",
34
- "OpenCompass Academic",
35
- "LMSys Arena",
36
- "Helm Classic",
37
- "AlphacaEval v2lc",
38
- "LiveBench 240725",
39
- "WildBench Elo LC",
40
  ]
41
 
42
 
43
  st.markdown(
44
  """
45
- <h1 style='text-align: center; color: black;'>🏋️‍♂️ BenchBench Leaderboard 🏋️‍♂️</h1>
46
  """,
47
  unsafe_allow_html=True,
48
  )
 
9
 
10
 
11
  st.set_page_config(
12
+ page_title="Safety BAT",
13
  page_icon="🏋️‍♂️",
14
  layout="wide",
15
  initial_sidebar_state="auto",
 
29
  # )
30
 
31
  holistic_scenarios = [
32
+ "HELM_AIRBENCH_AIR_Score",
 
 
 
 
 
 
 
33
  ]
34
 
35
 
36
  st.markdown(
37
  """
38
+ <h1 style='text-align: center; color: black;'>🏋️‍♂️ Safety BAT Leaderboard 🏋️‍♂️</h1>
39
  """,
40
  unsafe_allow_html=True,
41
  )