Spaces:

clarin-pl
/

datasets-explorer

Runtime error

App Files Community

Mariusz Kossakowski committed on Jul 22, 2022

Commit

7a69b9c

1 Parent(s): d86d2fc

Fix typing

Browse files

Files changed (1) hide show

app.py +19 -9

app.py CHANGED Viewed

@@ -1,4 +1,5 @@
 import re
 import pandas as pd
 import plotly.figure_factory as ff
@@ -12,11 +13,11 @@ st.set_page_config(layout="wide")
 DATA_SPLITS = ["train", "dev", "test"]
-def load_data() -> dict[str, pd.DataFrame]:
     return {data: pd.read_csv(f"data/{data}.csv") for data in DATA_SPLITS}
-def flatten_list(main_list: list[list]) -> list:
     return [item for sublist in main_list for item in sublist]
@@ -62,8 +63,10 @@ with description:
     analyze contracts and understand what they agree upon.
     """
     st.write(desc)
-    st.markdown("<h1 style='text-align: center; color: white;'>Dataset statistics</h1>",
-                unsafe_allow_html=True)
 with dataset_statistics:
     st.header("Number of samples in each data split")
@@ -85,7 +88,11 @@ with dataset_statistics:
     metrics_df.columns = ["Subset", "Number of samples"]
     st.dataframe(metrics_df)
     latex_df = metrics_df.style.to_latex()
-    st.button(label="Copy table to LaTeX", on_click=lambda: pyperclip.copy(latex_df), key="copy_metrics_df")
 # Class distribution in each subset
 with class_distribution:
@@ -99,8 +106,8 @@ with class_distribution:
                     for k, df in DATA_DICT.items()
                 ]
             )
-                .reset_index()
-                .rename({"index": "split_name"}, axis=1)
         )
         barchart_class_dist = go.Figure(
             data=[
@@ -128,8 +135,11 @@ with class_distribution:
             st.text("")
         st.dataframe(hist)
         latex_df_class_dist = hist.style.to_latex()
-        st.button(label="Copy table to LaTeX", on_click=lambda: pyperclip.copy(latex_df_class_dist),
-                  key="copy_class_dist_df")
     # Number of words per observation
     hist_data_num_words = [

 import re
+from typing import Dict, List
 import pandas as pd
 import plotly.figure_factory as ff
 DATA_SPLITS = ["train", "dev", "test"]
+def load_data() -> Dict[str, pd.DataFrame]:
     return {data: pd.read_csv(f"data/{data}.csv") for data in DATA_SPLITS}
+def flatten_list(main_list: List[list]) -> list:
     return [item for sublist in main_list for item in sublist]
     analyze contracts and understand what they agree upon.
     """
     st.write(desc)
+    st.markdown(
+        "<h1 style='text-align: center; color: white;'>Dataset statistics</h1>",
+        unsafe_allow_html=True,
+    )
 with dataset_statistics:
     st.header("Number of samples in each data split")
     metrics_df.columns = ["Subset", "Number of samples"]
     st.dataframe(metrics_df)
     latex_df = metrics_df.style.to_latex()
+    st.button(
+        label="Copy table to LaTeX",
+        on_click=lambda: pyperclip.copy(latex_df),
+        key="copy_metrics_df",
+    )
 # Class distribution in each subset
 with class_distribution:
                     for k, df in DATA_DICT.items()
                 ]
             )
+            .reset_index()
+            .rename({"index": "split_name"}, axis=1)
         )
         barchart_class_dist = go.Figure(
             data=[
             st.text("")
         st.dataframe(hist)
         latex_df_class_dist = hist.style.to_latex()
+        st.button(
+            label="Copy table to LaTeX",
+            on_click=lambda: pyperclip.copy(latex_df_class_dist),
+            key="copy_class_dist_df",
+        )
     # Number of words per observation
     hist_data_num_words = [