Spaces:

Cognitive-Lab
/

indic_llm_leaderboard

Running

App Files Files Community

AdithyaSK committed on Apr 4, 2024

Commit

72657ca

1 Parent(s): c12d258

updated UI - Adithya S K

Browse files

Files changed (1) hide show

app.py +60 -49

app.py CHANGED Viewed

@@ -61,67 +61,78 @@ def main():
     with Leaderboard_tab:
         data = get_data()
         table_data = []
         all_models = []
-        for item in data:
-            model_name = item.get("name")
-            language = item.get("language")
-            try:
-                ALL = item["result"]["all"]["acc_norm"]
-            except KeyError:
-                ALL = None
-            try:
-                ARC_Easy = item["result"]["ARC-Easy"]["acc_norm"]
-            except KeyError:
-                ARC_Easy = None
-            try:
-                ARC_Challenge = item["result"]["ARC-Challenge"]["acc_norm"]
-            except KeyError:
-                ARC_Challenge = None
-            try:
-                Hellaswag = item["result"]["Hellaswag"]["acc_norm"]
-            except KeyError:
-                Hellaswag = None
-            try:
-                Boolq = item["result"]["Boolq"]["acc_norm"]
-            except KeyError:
-                Boolq = None
-            try:
-                MMLU = item["result"]["MMLU"]["acc_norm"]
-            except KeyError:
-                MMLU = None
-            try:
-                Translation = item["result"]["Translation"]["acc_norm"]
-            except KeyError:
-                Translation = None
-            # If you are going through the code and wondering what is happening this code is a mess
-            all_models.append(model_name)
-            table_data.append({
-                "Model": model_name,
-                "Language": language,
-                "Avergae": ALL,
-                "ARC-Easy": ARC_Easy,
-                "ARC-Challenge": ARC_Challenge,
-                "Hellaswag": Hellaswag,
-                "Boolq": Boolq,
-                "MMLU": MMLU,
-                "Translation": Translation,
-            })
-        df = pd.DataFrame(table_data)
         title = st.text_input('Model', placeholder=" 🔍 Search for your model (separate multiple queries with `;`) and press ENTER...")
         on = st.checkbox('Sort by Language')
         col1, col2 = st.columns(2)
         with col1:
             benchmark_options = st.multiselect(
                 'Pick Benchmark',
-                ['ARC-Easy', 'ARC-Challenge', 'Hellaswag', 'Boolq','MMLU','Translation'],['ARC-Easy', 'ARC-Challenge', 'Hellaswag', 'Boolq','MMLU','Translation'])
         with col2:
             language_options = st.multiselect(
                 'Pick Languages',

     with Leaderboard_tab:
         data = get_data()
         table_data = []
         all_models = []
+        try:
+            for item in data:
+                model_name = item.get("name")
+                language = item.get("language")
+                try:
+                    ALL = item["result"]["all"]["acc_norm"]
+                except KeyError:
+                    ALL = None
+                try:
+                    ARC_Easy = item["result"]["ARC-Easy"]["acc_norm"]
+                except KeyError:
+                    ARC_Easy = None
+                try:
+                    ARC_Challenge = item["result"]["ARC-Challenge"]["acc_norm"]
+                except KeyError:
+                    ARC_Challenge = None
+                try:
+                    Hellaswag = item["result"]["Hellaswag"]["acc_norm"]
+                except KeyError:
+                    Hellaswag = None
+                try:
+                    Boolq = item["result"]["Boolq"]["acc_norm"]
+                except KeyError:
+                    Boolq = None
+                try:
+                    MMLU = item["result"]["MMLU"]["acc_norm"]
+                except KeyError:
+                    MMLU = None
+                try:
+                    Translation = item["result"]["Translation"]["acc_norm"]
+                except KeyError:
+                    Translation = None
+                # If you are going through the code and wondering what is happening this code is a mess
+                all_models.append(model_name)
+                table_data.append({
+                    "Model": model_name,
+                    "Language": language,
+                    "Avergae": ALL,
+                    "ARC-Easy": ARC_Easy,
+                    "ARC-Challenge": ARC_Challenge,
+                    "Hellaswag": Hellaswag,
+                    "Boolq": Boolq,
+                    "MMLU": MMLU,
+                    "Translation": Translation,
+                })
+            df = pd.DataFrame(table_data)
+        except:
+            columns = ["Model", "Language", "Avergae", "ARC-Easy", "ARC-Challenge", "Hellaswag", "Boolq", "MMLU", "Translation"]
+            # Create an empty list to hold the data
+            table_data = []
+            # Append a single placeholder row that maps every column name to None
+            table_data.append({col: None for col in columns})
+            # Create a DataFrame from the table_data list
+            df = pd.DataFrame(table_data)
         title = st.text_input('Model', placeholder=" 🔍 Search for your model (separate multiple queries with `;`) and press ENTER...")
         on = st.checkbox('Sort by Language')
+        st.text("Boolq , MMLU , Translation is still being tested")
         col1, col2 = st.columns(2)
         with col1:
             benchmark_options = st.multiselect(
                 'Pick Benchmark',
+                ['ARC-Easy', 'ARC-Challenge', 'Hellaswag', 'Boolq','MMLU','Translation'],['ARC-Easy', 'ARC-Challenge', 'Hellaswag'])
         with col2:
             language_options = st.multiselect(
                 'Pick Languages',