Update app.py
Browse files
app.py
CHANGED
@@ -16,7 +16,7 @@ df['Scenario'] = df['Scenario'].astype(str)
|
|
16 |
def estimate_pass_at_k(num_samples, num_correct, k):
    """Estimate pass@k for each problem.

    For a problem with ``n`` samples of which ``c`` are correct, the
    estimate is ``1 - C(n - c, k) / C(n, k)``: the probability that a random
    draw of ``k`` samples contains at least one correct sample.

    Args:
        num_samples: Iterable with the number of samples drawn per problem.
        num_correct: Iterable with the number of correct samples per
            problem, paired element-wise with ``num_samples``.
        k: Number of samples assumed to be drawn.

    Returns:
        A float ``numpy`` array with one pass@k estimate per problem.
    """

    def estimator(n, c, k):
        # Fewer than k incorrect samples: every size-k draw must contain a
        # correct one, so the estimate is exactly 1.0. Returning a float
        # (not None or a string) keeps the result array numeric, so callers
        # can take its mean.
        if n - c < k:
            return 1.0
        # Product form of 1 - C(n - c, k) / C(n, k); avoids large factorials.
        return 1.0 - np.prod(1.0 - k / np.arange(n - c + 1, n + 1))

    return np.array(
        [estimator(n, c, k) for n, c in zip(num_samples, num_correct)],
        dtype=float,
    )
|
@@ -65,9 +65,9 @@ duo_complete_pass_at_k = duo_df.groupby('Model')[['Runs', 'Successes']].apply(la
|
|
65 |
}, index=['pass@1'])).reset_index()
|
66 |
|
67 |
# Per-model mean pass@1 over all rows of `df`.
# Only 'pass@1' is supplied in the dict; the index also lists 'pass@5' and
# 'pass@10', which have no entry here, so pandas fills those labels with NaN.
complete_pass_at_k = (
    df.groupby('Model')[['Runs', 'Successes']]
    .apply(
        lambda grp: pd.Series(
            {
                'pass@1': estimate_pass_at_k(
                    grp['Runs'].values, grp['Successes'].values, 1
                ).mean()
            },
            index=['pass@1', 'pass@5', 'pass@10'],
        )
    )
    .reset_index()
)
|
72 |
|
73 |
with gr.Blocks() as demo:
|
|
|
16 |
def estimate_pass_at_k(num_samples, num_correct, k):
    """Estimate pass@k for each problem.

    For a problem with ``n`` samples of which ``c`` are correct, the
    estimate is ``1 - C(n - c, k) / C(n, k)``: the probability that a random
    draw of ``k`` samples contains at least one correct sample.

    Args:
        num_samples: Iterable with the number of samples drawn per problem.
        num_correct: Iterable with the number of correct samples per
            problem, paired element-wise with ``num_samples``.
        k: Number of samples assumed to be drawn.

    Returns:
        A float ``numpy`` array with one pass@k estimate per problem.
    """

    def estimator(n, c, k):
        # Fewer than k incorrect samples: every size-k draw must contain a
        # correct one, so the estimate is exactly 1.0. A non-numeric
        # placeholder such as 'N/A' would turn the result into a string
        # array and break the `.mean()` calls made on it.
        if n - c < k:
            return 1.0
        # Product form of 1 - C(n - c, k) / C(n, k); avoids large factorials.
        return 1.0 - np.prod(1.0 - k / np.arange(n - c + 1, n + 1))

    return np.array(
        [estimator(n, c, k) for n, c in zip(num_samples, num_correct)],
        dtype=float,
    )
|
|
|
65 |
}, index=['pass@1'])).reset_index()
|
66 |
|
67 |
# Per-model mean pass@1 / pass@5 / pass@10 over all rows of `df`:
# each group's 'Runs' and 'Successes' columns are fed to estimate_pass_at_k
# and the per-row estimates are averaged.
complete_pass_at_k = (
    df.groupby('Model')[['Runs', 'Successes']]
    .apply(
        lambda grp: pd.Series(
            {
                'pass@1': estimate_pass_at_k(
                    grp['Runs'].values, grp['Successes'].values, 1
                ).mean(),
                'pass@5': estimate_pass_at_k(
                    grp['Runs'].values, grp['Successes'].values, 5
                ).mean(),
                'pass@10': estimate_pass_at_k(
                    grp['Runs'].values, grp['Successes'].values, 10
                ).mean(),
            },
            index=['pass@1', 'pass@5', 'pass@10'],
        )
    )
    .reset_index()
)
|
72 |
|
73 |
with gr.Blocks() as demo:
|