Spaces:

ImagingDataCommons
/

CloudSegmentatorResults

Runtime error

App Files Files Community

Vamsi Thiriveedhi committed on May 29, 2024

Commit

d7e211f

1 Parent(s): 2c67485

enh: slider to filter radiomics feature values, move violin plots to top

Browse files

Files changed (1) hide show

filter_data_app.py +40 -27

filter_data_app.py CHANGED Viewed

@@ -39,13 +39,15 @@ def load_data(radiomics_feature='Volume from Voxel Summation'):
     return df
 # Function to filter data based on user input
-def filter_data(df, filters):
     for col, value in filters.items():
         if value is not None and col != 'radiomics_feature':  # Exclude radiomics_feature from filtering
             if col == 'connected_volumes' and value:
                 df = df.filter((pl.col(col) <= value) & (pl.col(col).is_not_null()))
             elif col == 'voxel_num_values' and value:
                 df = df.filter((pl.col('voxel_num') >= value[0]) & (pl.col('voxel_num') <= value[1]))
             else:
                 df = df.filter(pl.col(col) == value)
     # Filter based on radiomics feature
@@ -94,12 +96,12 @@ def main():
     st.title("Qualitative Checks of TotalSegmentator Segmentations on NLST")
     # Sidebar widgets for navigation and filtering
-    page = st.sidebar.selectbox("Choose a page", ["Summary", "UpSet Plots"])
     # Load the data
     #df = load_data()
-    if page == "UpSet Plots":
         st.write("Filter the data based on radiomics feature, qualitative checks, bodyPart, and laterality.")
         with st.sidebar:
             st.title("Filters")
@@ -114,7 +116,8 @@ def main():
                     'connected_volumes': None,
                     'laterality': None,
                     'radiomics_feature': 'Volume from Voxel Summation',  # Default radiomics feature
-                    'voxel_num_values': None
                 }
             filters = st.session_state.filters
@@ -129,6 +132,7 @@ def main():
                     'laterality': None,
                     #'radiomics_feature': 'Volume from Voxel Summation'
                     'voxel_num_values':None,
                 })
                 st.session_state.filters = filters
@@ -185,7 +189,7 @@ def main():
             filters['bodyPart'] = body_part
             # Apply the current filters to update options for other filters
-            filtered_df = filter_data(df, filters)
             # Update options for other filters based on the current selection
@@ -195,6 +199,7 @@ def main():
             connected_volumes_options = filtered_df['connected_volumes'].unique().to_list()
             laterality_options = [""] + filtered_df['laterality'].unique().to_list()
             voxel_num_options = filtered_df.filter(col('voxel_num').is_not_null()).select('voxel_num').unique().to_pandas().iloc[:, 0].tolist()
             laterality = st.selectbox(
                 "Laterality",
@@ -244,9 +249,16 @@ def main():
                                     value=(min(voxel_num_options),max(voxel_num_options)),
                                     on_change=lambda: apply_filter('voxel_num_values', st.session_state.voxel_num_values)
             )
             st.session_state.filters = filters
-            filtered_df = filter_data(df, filters)
             if laterality:
                 body_part_df = df.filter((col('bodyPart') == lit(body_part)) & (col('laterality') == lit(laterality)))
@@ -278,7 +290,7 @@ def main():
         start_idx = (page_number - 1) * page_size
         end_idx = min(start_idx + page_size, len(filtered_df))  # Ensure end_idx does not go beyond the dataframe length
         paginated_df = filtered_df[start_idx:end_idx].to_pandas()  # Convert to Pandas DataFrame
-        paginated_df['Viewer Url'] = 'https://viewer.imaging.datacommons.cancer.gov/viewer/'+paginated_df['StudyInstanceUID']
         # Display the paginated dataframe
         st.header("Filtered Data")
@@ -288,7 +300,7 @@ def main():
             paginated_df,
             column_config={
                 "Viewer Url":st.column_config.LinkColumn("StudyInstanceUID",
-                              display_text=r"https:\/\/viewer\.imaging\.datacommons\.cancer\.gov\/viewer\/(.*)"
                               ),
             },
@@ -296,25 +308,6 @@ def main():
             hide_index=True,
             use_container_width=True
         )
-        st.header("UpSet Plots of Qualitative Checks")
-        # Explanation about the UpSet plot
-        with st.expander("About the UpSet Plot"):
-            st.write("""
-            The UpSet plot is a way to visualize intersections of multiple sets. Each row in the plot represents a different set, and the dots indicate the presence or absence of intersections among these sets. The vertical bars show the size of each intersection, making it easy to see which intersections are most common.
-            """)
-        # Create and display the UpSet plot for failed checks
-        st.header("UpSet Plot for Failed Checks")
-        st.write("This plot shows the combinations of checks that failed.")
-        if not filtered_df.is_empty():
-            create_upset_plot_failures(filtered_df)
-        # Create and display the UpSet plot for passed checks
-        st.header("UpSet Plot for Passed Checks")
-        st.write("This plot shows the combinations of checks that passed.")
-        if not filtered_df.is_empty():
-            create_upset_plot_passes(filtered_df)
         # Assuming calculate_std_dev returns a Series
         std_dev_before_filtering = calculate_std_dev(body_part_df, radiomics_feature)
         std_dev_after_filtering = calculate_std_dev(filtered_df, radiomics_feature)
@@ -339,6 +332,26 @@ def main():
         sns.violinplot(x='Filtering', y=radiomics_feature, data=combined_df, ax=ax)
         ax.set_ylabel(f"Standard Deviation of {radiomics_feature}")
         st.pyplot(fig2)
         def convert_df(df):
                 return df.write_csv()

     return df
 # Function to filter data based on user input
+def filter_data(df, filters,radiomics_feature):
     for col, value in filters.items():
         if value is not None and col != 'radiomics_feature':  # Exclude radiomics_feature from filtering
             if col == 'connected_volumes' and value:
                 df = df.filter((pl.col(col) <= value) & (pl.col(col).is_not_null()))
             elif col == 'voxel_num_values' and value:
                 df = df.filter((pl.col('voxel_num') >= value[0]) & (pl.col('voxel_num') <= value[1]))
+            elif col == 'radiomics_feature_values' and value:
+                df = df.filter((pl.col(radiomics_feature) >= value[0]) & (pl.col(radiomics_feature) <= value[1]))
             else:
                 df = df.filter(pl.col(col) == value)
     # Filter based on radiomics feature
     st.title("Qualitative Checks of TotalSegmentator Segmentations on NLST")
     # Sidebar widgets for navigation and filtering
+    page = st.sidebar.selectbox("Choose a page", ["Summary", "Plots"])
     # Load the data
     #df = load_data()
+    if page == "Plots":
         st.write("Filter the data based on radiomics feature, qualitative checks, bodyPart, and laterality.")
         with st.sidebar:
             st.title("Filters")
                     'connected_volumes': None,
                     'laterality': None,
                     'radiomics_feature': 'Volume from Voxel Summation',  # Default radiomics feature
+                    'voxel_num_values': None,
+                    'radiomics_feature_values': None
                 }
             filters = st.session_state.filters
                     'laterality': None,
                     #'radiomics_feature': 'Volume from Voxel Summation'
                     'voxel_num_values':None,
+                    'radiomics_feature_values': None
                 })
                 st.session_state.filters = filters
             filters['bodyPart'] = body_part
             # Apply the current filters to update options for other filters
+            filtered_df = filter_data(df, filters,radiomics_feature)
             # Update options for other filters based on the current selection
             connected_volumes_options = filtered_df['connected_volumes'].unique().to_list()
             laterality_options = [""] + filtered_df['laterality'].unique().to_list()
             voxel_num_options = filtered_df.filter(col('voxel_num').is_not_null()).select('voxel_num').unique().to_pandas().iloc[:, 0].tolist()
+            radiomics_feature_values = filtered_df.filter(col(radiomics_feature).is_not_null()).select(radiomics_feature).unique().to_pandas().iloc[:, 0].tolist()
             laterality = st.selectbox(
                 "Laterality",
                                     value=(min(voxel_num_options),max(voxel_num_options)),
                                     on_change=lambda: apply_filter('voxel_num_values', st.session_state.voxel_num_values)
             )
+            radiomics_num_values = st.slider(f"{radiomics_feature} Values",
+                                    min_value=min(radiomics_feature_values),
+                                    max_value=max(radiomics_feature_values),
+                                    key='radiomics_feature_values',
+                                    value=(min(radiomics_feature_values),max(radiomics_feature_values)),
+                                    on_change=lambda: apply_filter('radiomics_feature_values', st.session_state.radiomics_feature_values)
+            )
             st.session_state.filters = filters
+            filtered_df = filter_data(df, filters,radiomics_feature)
             if laterality:
                 body_part_df = df.filter((col('bodyPart') == lit(body_part)) & (col('laterality') == lit(laterality)))
         start_idx = (page_number - 1) * page_size
         end_idx = min(start_idx + page_size, len(filtered_df))  # Ensure end_idx does not go beyond the dataframe length
         paginated_df = filtered_df[start_idx:end_idx].to_pandas()  # Convert to Pandas DataFrame
+        paginated_df['Viewer Url'] = 'https://viewer.imaging.datacommons.cancer.gov/v3/viewer/?StudyInstanceUIDs='+paginated_df['StudyInstanceUID']
         # Display the paginated dataframe
         st.header("Filtered Data")
             paginated_df,
             column_config={
                 "Viewer Url":st.column_config.LinkColumn("StudyInstanceUID",
+                              display_text=r"https:\/\/viewer\.imaging\.datacommons\.cancer\.gov\/v3\/viewer\/\?StudyInstanceUIDs=(.*)"
                               ),
             },
             hide_index=True,
             use_container_width=True
         )
         # Assuming calculate_std_dev returns a Series
         std_dev_before_filtering = calculate_std_dev(body_part_df, radiomics_feature)
         std_dev_after_filtering = calculate_std_dev(filtered_df, radiomics_feature)
         sns.violinplot(x='Filtering', y=radiomics_feature, data=combined_df, ax=ax)
         ax.set_ylabel(f"Standard Deviation of {radiomics_feature}")
         st.pyplot(fig2)
+        st.header("UpSet Plots of Qualitative Checks")
+        # Explanation about the UpSet plot
+        with st.expander("About the UpSet Plot"):
+            st.write("""
+            The UpSet plot is a way to visualize intersections of multiple sets. Each row in the plot represents a different set, and the dots indicate the presence or absence of intersections among these sets. The vertical bars show the size of each intersection, making it easy to see which intersections are most common.
+            """)
+        # Create and display the UpSet plot for failed checks
+        st.header("UpSet Plot for Failed Checks")
+        st.write("This plot shows the combinations of checks that failed.")
+        if not filtered_df.is_empty():
+            create_upset_plot_failures(filtered_df)
+        # Create and display the UpSet plot for passed checks
+        st.header("UpSet Plot for Passed Checks")
+        st.write("This plot shows the combinations of checks that passed.")
+        if not filtered_df.is_empty():
+            create_upset_plot_passes(filtered_df)
         def convert_df(df):
                 return df.write_csv()