onekq committed on
Commit
3fee132
·
verified ·
1 Parent(s): 8fe6c77

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -6
app.py CHANGED
@@ -38,7 +38,7 @@ def filter_data(model, scenario):
38
  return pd.DataFrame([pass_at_k])
39
 
40
  # Initialize the leaderboard
41
- def init_leaderboard(dataframe, default_selection=["Model", "pass@1", "pass@5", "pass@10"], height=600):
42
  if dataframe is None or dataframe.empty:
43
  raise ValueError("Leaderboard DataFrame is empty or None.")
44
  return Leaderboard(
@@ -67,10 +67,8 @@ duo_complete_pass_at_k = duo_df.groupby('Model')[['Runs', 'Successes']].apply(la
67
  }, index=['pass@1'])).reset_index()
68
 
69
  complete_pass_at_k = df.groupby('Model')[['Runs', 'Successes']].apply(lambda x: pd.Series({
70
- 'pass@1': estimate_pass_at_k(x['Runs'].values, x['Successes'].values, 1).mean(),
71
- 'pass@5': estimate_pass_at_k(x['Runs'].values, x['Successes'].values, 5).mean(),
72
- 'pass@10': estimate_pass_at_k(x['Runs'].values, x['Successes'].values, 10).mean()
73
- }, index=['pass@1', 'pass@5', 'pass@10'])).reset_index()
74
 
75
  with gr.Blocks() as demo:
76
  gr.Markdown("# 🏆 WebApp1K Models Leaderboard")
@@ -82,7 +80,7 @@ with gr.Blocks() as demo:
82
  "[AI Models](https://www.aimodels.fyi/papers/arxiv/webapp1k-practical-code-generation-benchmark-web-app)")
83
 
84
  gr.Markdown("# WebApp1K-Duo ([Benchmark](https://huggingface.co/datasets/onekq-ai/WebApp1K-Duo-React))")
85
- duo_leaderboard = init_leaderboard(duo_complete_pass_at_k, default_selection = ["Model", "pass@1"], height=400)
86
  gr.Markdown("# WebApp1K ([Benchmark](https://huggingface.co/datasets/onekq-ai/WebApp1K-React))")
87
  leaderboard = init_leaderboard(complete_pass_at_k, default_selection = [], height=800)
88
 
 
38
  return pd.DataFrame([pass_at_k])
39
 
40
  # Initialize the leaderboard
41
+ def init_leaderboard(dataframe, default_selection=["Model", "pass@1"], height=600):
42
  if dataframe is None or dataframe.empty:
43
  raise ValueError("Leaderboard DataFrame is empty or None.")
44
  return Leaderboard(
 
67
  }, index=['pass@1'])).reset_index()
68
 
69
  complete_pass_at_k = df.groupby('Model')[['Runs', 'Successes']].apply(lambda x: pd.Series({
70
+ 'pass@1': estimate_pass_at_k(x['Runs'].values, x['Successes'].values, 1).mean()
71
+ }, index=['pass@1'])).reset_index()
 
 
72
 
73
  with gr.Blocks() as demo:
74
  gr.Markdown("# 🏆 WebApp1K Models Leaderboard")
 
80
  "[AI Models](https://www.aimodels.fyi/papers/arxiv/webapp1k-practical-code-generation-benchmark-web-app)")
81
 
82
  gr.Markdown("# WebApp1K-Duo ([Benchmark](https://huggingface.co/datasets/onekq-ai/WebApp1K-Duo-React))")
83
+ duo_leaderboard = init_leaderboard(duo_complete_pass_at_k, default_selection = [], height=400)
84
  gr.Markdown("# WebApp1K ([Benchmark](https://huggingface.co/datasets/onekq-ai/WebApp1K-React))")
85
  leaderboard = init_leaderboard(complete_pass_at_k, default_selection = [], height=800)
86