LPX committed
Commit 6909ab7 · 1 Parent(s): 5aa075b

refactor: reorganize Gradio interface layout for improved user experience and accessibility

Files changed (1):
  1. app_mcp.py +104 -113
app_mcp.py CHANGED
@@ -3,9 +3,6 @@ import time
 from typing import Literal
 import spaces
 import gradio as gr
-import modelscope_studio.components.antd as antd
-import modelscope_studio.components.antdx as antdx
-import modelscope_studio.components.base as ms
 from transformers import pipeline, AutoImageProcessor, SwinForImageClassification, Swinv2ForImageClassification, AutoFeatureExtractor, AutoModelForImageClassification
 from torchvision import transforms
 import torch
@@ -485,118 +482,112 @@ def predict_image_with_json(img, confidence_threshold, augment_methods, rotate_d
     return img_pil, cleaned_forensics_images, table_rows, json_results, consensus_html
 
 with gr.Blocks(css="#post-gallery { overflow: hidden !important;} .grid-wrap{ overflow-y: hidden !important;} .ms-gr-ant-welcome-icon{ height:unset !important;} .tabs{margin-top:10px;}") as demo:
-    with ms.Application() as app:
-        with antd.ConfigProvider():
-            antdx.Welcome(
-                icon="https://cdn-avatars.huggingface.co/v1/production/uploads/639daf827270667011153fbc/WpeSFhuB81DY-1TjNUmV_.png",
-                title="Welcome to Project OpenSight",
-                description="The OpenSight aims to be an open-source SOTA generated image detection model. This HF Space is not only an introduction but a educational playground for the public to evaluate and challenge current open source models. **Space will be upgraded shortly; inference on all 6 models should take about 1.2~ seconds.** "
-            )
-            with gr.Tab("👀 Detection Models Eval / Playground"):
-                gr.Markdown("# Open Source Detection Models Found on the Hub\n\n - **Space will be upgraded shortly;** inference on all 6 models should take about 1.2~ seconds once we're back on CUDA.\n - The **Community Forensics** mother of all detection models is now available for inference, head to the middle tab above this.\n - Lots of exciting things coming up, stay tuned!")
-
-                with gr.Row():
-                    with gr.Column(scale=1):
-                        image_input = gr.Image(label="Upload Image to Analyze", sources=['upload', 'webcam'], type='pil')
-                        with gr.Accordion("Settings (Optional)", open=False, elem_id="settings_accordion"):
-                            augment_checkboxgroup = gr.CheckboxGroup(["rotate", "add_noise", "sharpen"], label="Augmentation Methods")
-                            rotate_slider = gr.Slider(0, 45, value=2, step=1, label="Rotate Degrees", visible=False)
-                            noise_slider = gr.Slider(0, 50, value=4, step=1, label="Noise Level", visible=False)
-                            sharpen_slider = gr.Slider(0, 50, value=11, step=1, label="Sharpen Strength", visible=False)
-                            confidence_slider = gr.Slider(0.0, 1.0, value=0.75, step=0.05, label="Confidence Threshold")
-                        inputs = [image_input, confidence_slider, augment_checkboxgroup, rotate_slider, noise_slider, sharpen_slider]
-                        predict_button = gr.Button("Predict")
-                        augment_button = gr.Button("Augment & Predict")
-                        image_output = gr.Image(label="Processed Image", visible=False)
-
-
-                    with gr.Column(scale=2):
-                        # Use Gradio-native Dataframe to display results with headers
-                        results_table = gr.Dataframe(
-                            label="Model Predictions",
-                            headers=["Model", "Contributor", "AI Score", "Real Score", "Label"],
-                            datatype=["str", "str", "number", "number", "str"]
-                        )
-                        forensics_gallery = gr.Gallery(label="Post Processed Images", visible=True, columns=[4], rows=[2], container=False, height="auto", object_fit="contain", elem_id="post-gallery")
-                        with gr.Accordion("Debug Output (Raw JSON)", open=False):
-                            debug_json = gr.JSON(label="Raw Model Results")
-                        consensus_md = gr.Markdown(label="Consensus", value="")
-
-                outputs = [image_output, forensics_gallery, results_table, debug_json, consensus_md]
-
-                # Show/hide rotate slider based on selected augmentation method
-                augment_checkboxgroup.change(lambda methods: gr.update(visible="rotate" in methods), inputs=[augment_checkboxgroup], outputs=[rotate_slider])
-                augment_checkboxgroup.change(lambda methods: gr.update(visible="add_noise" in methods), inputs=[augment_checkboxgroup], outputs=[noise_slider])
-                augment_checkboxgroup.change(lambda methods: gr.update(visible="sharpen" in methods), inputs=[augment_checkboxgroup], outputs=[sharpen_slider])
-
-                predict_button.click(
-                    fn=predict_image_with_json,
-                    inputs=inputs,
-                    outputs=outputs,
-                    api_name="predict"
-                )
-                augment_button.click(  # Connect Augment button to the function
-                    fn=predict_image_with_json,
-                    inputs=[
-                        image_input,
-                        confidence_slider,
-                        gr.CheckboxGroup(["rotate", "add_noise", "sharpen"], value=["rotate", "add_noise", "sharpen"], visible=False),  # Default values
-                        rotate_slider,
-                        noise_slider,
-                        sharpen_slider
-                    ],
-                    outputs=outputs,
-                    api_name="augment_then_predict"
-                )
-            with gr.Tab("🙈 Project Introduction"):
-                gr.Markdown(QUICK_INTRO)
-
-            with gr.Tab("👑 Community Forensics Preview"):
-                # temp_space = gr.load("aiwithoutborders-xyz/OpenSight-Community-Forensics-Preview", src="spaces")
-                gr.Markdown("Community Forensics Preview coming soon!")  # Placeholder for now
-            with gr.Tab("🥇 Leaderboard"):
-                gr.Markdown("# AI Generated / Deepfake Detection Models Leaderboard: Soon™")
-
-            with gr.Tab("Wavelet Blocking Noise Estimation", visible=False):
-                gr.Interface(
-                    fn=wavelet_blocking_noise_estimation,
-                    inputs=[gr.Image(type="pil"), gr.Slider(1, 32, value=8, step=1, label="Block Size")],
-                    outputs=gr.Image(type="pil"),
-                    title="Wavelet-Based Noise Analysis",
-                    description="Analyzes image noise patterns using wavelet decomposition. This tool helps detect compression artifacts and artificial noise patterns that may indicate image manipulation. Higher noise levels in specific regions can reveal areas of potential tampering.",
-                    api_name="tool_waveletnoise"
-                )
-
-            """Forensics Tool: Bit Plane Extractor
-
-            Args:
-                image: PIL Image to analyze
-                channel: Color channel to extract bit plane from ("Luminance", "Red", "Green", "Blue", "RGB Norm")
-                bit_plane: Bit plane index to extract (0-7)
-                filter_type: Filter to apply ("Disabled", "Median", "Gaussian")
-            """
-            with gr.Tab("Bit Plane Values", visible=False):
-                gr.Interface(
-
-                    fn=bit_plane_extractor,
-                    inputs=[
-                        gr.Image(type="pil"),
-                        gr.Dropdown(["Luminance", "Red", "Green", "Blue", "RGB Norm"], label="Channel", value="Luminance"),
-                        gr.Slider(0, 7, value=0, step=1, label="Bit Plane"),
-                        gr.Dropdown(["Disabled", "Median", "Gaussian"], label="Filter", value="Disabled")
-                    ],
-                    outputs=gr.Image(type="pil"),
-                    title="Bit Plane Analysis",
-                    description="Extracts and visualizes individual bit planes from different color channels. This forensic tool helps identify hidden patterns and artifacts in image data that may indicate manipulation. Different bit planes can reveal inconsistencies in image processing or editing.",
-                    api_name="tool_bitplane"
-                )
-            # with gr.Tab("EXIF Full Dump"):
-            #     gr.Interface(
-            #         fn=exif_full_dump,
-            #         inputs=gr.Image(type="pil"),
-            #         outputs=gr.JSON(),
-            #         description="Extract all EXIF metadata from the uploaded image."
-            #     )
+    with gr.Tab("👀 Detection Models Eval / Playground"):
+        gr.Markdown("# Open Source Detection Models Found on the Hub\n\n - **Space will be upgraded shortly;** inference on all 6 models should take about 1.2~ seconds once we're back on CUDA.\n - The **Community Forensics** mother of all detection models is now available for inference, head to the middle tab above this.\n - Lots of exciting things coming up, stay tuned!")
+
+        with gr.Row():
+            with gr.Column(scale=1):
+                image_input = gr.Image(label="Upload Image to Analyze", sources=['upload', 'webcam'], type='pil')
+                with gr.Accordion("Settings (Optional)", open=False, elem_id="settings_accordion"):
+                    augment_checkboxgroup = gr.CheckboxGroup(["rotate", "add_noise", "sharpen"], label="Augmentation Methods")
+                    rotate_slider = gr.Slider(0, 45, value=2, step=1, label="Rotate Degrees", visible=False)
+                    noise_slider = gr.Slider(0, 50, value=4, step=1, label="Noise Level", visible=False)
+                    sharpen_slider = gr.Slider(0, 50, value=11, step=1, label="Sharpen Strength", visible=False)
+                    confidence_slider = gr.Slider(0.0, 1.0, value=0.75, step=0.05, label="Confidence Threshold")
+                inputs = [image_input, confidence_slider, augment_checkboxgroup, rotate_slider, noise_slider, sharpen_slider]
+                predict_button = gr.Button("Predict")
+                augment_button = gr.Button("Augment & Predict")
+                image_output = gr.Image(label="Processed Image", visible=False)
+
+
+            with gr.Column(scale=2):
+                # Use Gradio-native Dataframe to display results with headers
+                results_table = gr.Dataframe(
+                    label="Model Predictions",
+                    headers=["Model", "Contributor", "AI Score", "Real Score", "Label"],
+                    datatype=["str", "str", "number", "number", "str"]
+                )
+                forensics_gallery = gr.Gallery(label="Post Processed Images", visible=True, columns=[4], rows=[2], container=False, height="auto", object_fit="contain", elem_id="post-gallery")
+                with gr.Accordion("Debug Output (Raw JSON)", open=False):
+                    debug_json = gr.JSON(label="Raw Model Results")
+                consensus_md = gr.Markdown(label="Consensus", value="")
+
+        outputs = [image_output, forensics_gallery, results_table, debug_json, consensus_md]
+
+        # Show/hide rotate slider based on selected augmentation method
+        augment_checkboxgroup.change(lambda methods: gr.update(visible="rotate" in methods), inputs=[augment_checkboxgroup], outputs=[rotate_slider])
+        augment_checkboxgroup.change(lambda methods: gr.update(visible="add_noise" in methods), inputs=[augment_checkboxgroup], outputs=[noise_slider])
+        augment_checkboxgroup.change(lambda methods: gr.update(visible="sharpen" in methods), inputs=[augment_checkboxgroup], outputs=[sharpen_slider])
+
+        predict_button.click(
+            fn=predict_image_with_json,
+            inputs=inputs,
+            outputs=outputs,
+            api_name="predict"
+        )
+        augment_button.click(  # Connect Augment button to the function
+            fn=predict_image_with_json,
+            inputs=[
+                image_input,
+                confidence_slider,
+                gr.CheckboxGroup(["rotate", "add_noise", "sharpen"], value=["rotate", "add_noise", "sharpen"], visible=False),  # Default values
+                rotate_slider,
+                noise_slider,
+                sharpen_slider
+            ],
+            outputs=outputs,
+            api_name="augment_then_predict"
+        )
+    with gr.Tab("🙈 Project Introduction"):
+        gr.Markdown(QUICK_INTRO)
+
+    with gr.Tab("👑 Community Forensics Preview"):
+        # temp_space = gr.load("aiwithoutborders-xyz/OpenSight-Community-Forensics-Preview", src="spaces")
+        gr.Markdown("Community Forensics Preview coming soon!")  # Placeholder for now
+    with gr.Tab("🥇 Leaderboard"):
+        gr.Markdown("# AI Generated / Deepfake Detection Models Leaderboard: Soon™")
+
+    with gr.Tab("Wavelet Blocking Noise Estimation", visible=False):
+        gr.Interface(
+            fn=wavelet_blocking_noise_estimation,
+            inputs=[gr.Image(type="pil"), gr.Slider(1, 32, value=8, step=1, label="Block Size")],
+            outputs=gr.Image(type="pil"),
+            title="Wavelet-Based Noise Analysis",
+            description="Analyzes image noise patterns using wavelet decomposition. This tool helps detect compression artifacts and artificial noise patterns that may indicate image manipulation. Higher noise levels in specific regions can reveal areas of potential tampering.",
+            api_name="tool_waveletnoise"
+        )
+
+    """Forensics Tool: Bit Plane Extractor
+
+    Args:
+        image: PIL Image to analyze
+        channel: Color channel to extract bit plane from ("Luminance", "Red", "Green", "Blue", "RGB Norm")
+        bit_plane: Bit plane index to extract (0-7)
+        filter_type: Filter to apply ("Disabled", "Median", "Gaussian")
+    """
+    with gr.Tab("Bit Plane Values", visible=False):
+        gr.Interface(
+
+            fn=bit_plane_extractor,
+            inputs=[
+                gr.Image(type="pil"),
+                gr.Dropdown(["Luminance", "Red", "Green", "Blue", "RGB Norm"], label="Channel", value="Luminance"),
+                gr.Slider(0, 7, value=0, step=1, label="Bit Plane"),
+                gr.Dropdown(["Disabled", "Median", "Gaussian"], label="Filter", value="Disabled")
+            ],
+            outputs=gr.Image(type="pil"),
+            title="Bit Plane Analysis",
+            description="Extracts and visualizes individual bit planes from different color channels. This forensic tool helps identify hidden patterns and artifacts in image data that may indicate manipulation. Different bit planes can reveal inconsistencies in image processing or editing.",
+            api_name="tool_bitplane"
+        )
+    # with gr.Tab("EXIF Full Dump"):
+    #     gr.Interface(
+    #         fn=exif_full_dump,
+    #         inputs=gr.Image(type="pil"),
+    #         outputs=gr.JSON(),
+    #         description="Extract all EXIF metadata from the uploaded image."
+    #     )
 
 # --- MCP-Ready Launch ---
 if __name__ == "__main__":
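
The launch call itself falls outside this hunk, so it is not shown in the diff. As a rough guide only, an MCP-ready Gradio launch usually boils down to passing mcp_server=True to launch(), which exposes the named API endpoints above (api_name="predict", "augment_then_predict", "tool_waveletnoise", "tool_bitplane") as MCP tools; the exact arguments used in app_mcp.py are an assumption, not part of this commit.

    # Hypothetical sketch only -- the real launch arguments are not visible in this diff.
    # Gradio (5.28+) accepts mcp_server=True in launch() to serve the app's API as MCP tools.
    if __name__ == "__main__":
        demo.launch(mcp_server=True)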