factrbench

Running

App Files Community

shezamunir committed on Mar 10

Commit

033550b

1 Parent(s): bf350d1

Update app.py

Browse files

Files changed (1) hide show

app.py +16 -25

app.py CHANGED Viewed

@@ -216,11 +216,11 @@ with tab1:
 """, unsafe_allow_html=True)
     # Dropdown menu to filter tiers
-    tiers = ['All Tiers', 'Tier 1: Hard', 'Tier 2: Moderate', 'Tier 3: Easy']
-    selected_tier = st.selectbox('Select Tier:', tiers)
     # Filter the data based on the selected tier
-    if selected_tier != 'All Tiers':
         filtered_df = df[df['tier'] == selected_tier]
     else:
         filtered_df = df
@@ -230,7 +230,7 @@ with tab1:
     # Sort the dataframe based on Factuality Score if the checkbox is selected
     if sort_by_factuality:
         updated_filtered_df = filtered_df.sort_values(
-            by=['tier', 'factuality_score'], ascending=[True, False]
         )
     else:
         updated_filtered_df = filtered_df.sort_values(
@@ -243,15 +243,12 @@ with tab1:
         <table>
             <thead>
                 <tr>
-                    <th>Tier</th>
                     <th>Rank</th>
                     <th>Model</th>
-                    <th>🎯 Factual Precision</th>
-                    <th>🌀 Hallucination Score</th>
-                    <th>Avg. # Tokens</th>
-                    <th>Avg. # Units</th>
-                    <th>Avg. # Undecidable</th>
-                    <th>Avg. # Unsupported</th>
                 </tr>
             </thead>
             <tbody>
@@ -263,12 +260,9 @@ with tab1:
                 <tr>
                     <th>Rank</th>
                     <th>Model</th>
-                    <th>🎯 Factual Precision</th>
-                    <th>🌀 Hallucination Score</th>
-                    <th>Avg. # Tokens</th>
-                    <th>Avg. # Units</th>
-                    <th>Avg. # Undecidable</th>
-                    <th>Avg. # Unsupported</th>
                 </tr>
             </thead>
             <tbody>
@@ -280,21 +274,18 @@ with tab1:
         html += '<tr>'
         # Only display the 'Tier' column if 'All Tiers' is selected
-        if selected_tier == 'All Tiers':
             if row['tier'] != current_tier:
                 current_tier = row['tier']
-                html += f'<td rowspan="7" style="vertical-align: middle;">{current_tier}</td>'
         # Fill in model and scores
         html += f'''
             <td>{row['rank']}</td>
             <td>{row['model']}</td>
-            <td>{row['factuality_score']}</td>
-            <td>{row['hallucination_score']}</td>
-            <td>{row['avg_tokens']}</td>
-            <td>{row['avg_factual_units']}</td>
-            <td>{row['avg_undecidable_units']:.2f}</td>
-            <td>{row['avg_unsupported_units']:.2f}</td>
         </tr>
     '''

 """, unsafe_allow_html=True)
     # Dropdown menu to filter tiers
+    tiers = ['All Metrics', 'Precision', 'Recall', 'F1']
+    selected_tier = st.selectbox('Select metric:', tiers)
     # Filter the data based on the selected tier
+    if selected_tier != 'All Metrics':
         filtered_df = df[df['tier'] == selected_tier]
     else:
         filtered_df = df
     # Sort the dataframe based on Factuality Score if the checkbox is selected
     if sort_by_factuality:
         updated_filtered_df = filtered_df.sort_values(
+            by=['tier', 'Overall'], ascending=[True, False]
         )
     else:
         updated_filtered_df = filtered_df.sort_values(
         <table>
             <thead>
                 <tr>
+                    <th>Metric</th>
                     <th>Rank</th>
                     <th>Model</th>
+                    <th>Factbench</th>
+                    <th>Reddit</th>
+                    <th>Overall</th>
                 </tr>
             </thead>
             <tbody>
                 <tr>
                     <th>Rank</th>
                     <th>Model</th>
+                    <th>Factbench</th>
+                    <th>Reddit</th>
+                    <th>Overall</th>
                 </tr>
             </thead>
             <tbody>
         html += '<tr>'
         # Only display the 'Tier' column if 'All Tiers' is selected
+        if selected_tier == 'All Metrics':
             if row['tier'] != current_tier:
                 current_tier = row['tier']
+                html += f'<td rowspan="8" style="vertical-align: middle;">{current_tier}</td>'
         # Fill in model and scores
         html += f'''
             <td>{row['rank']}</td>
             <td>{row['model']}</td>
+            <td>{row['FactBench']}</td>
+            <td>{row['Reddit']}</td>
+            <td>{row['Overall']}</td>
         </tr>
     '''