Spaces:

chunking-ai
/

smoldocling-preview

Paused

App Files Community

taprosoft committed on Feb 25

Commit

3bce890

1 Parent(s): 36add35

feat: add enable visualization flag

Browse files

Files changed (6) hide show

app.py +33 -9
backends/docling.py +4 -2
backends/marker.py +3 -1
backends/mineru.py +4 -0
backends/settings.py +3 -0
backends/unstructured.py +3 -1

app.py CHANGED Viewed

@@ -11,6 +11,7 @@ from backends import (
     convert_mineru,
     convert_unstructured,
 )
 from utils import remove_images_from_markdown, trim_pages
 TRIMMED_PDF_PATH = Path("/tmp/gradio/trim")
@@ -18,9 +19,9 @@ TRIMMED_PDF_PATH.mkdir(exist_ok=True)
 def convert_document(path, method, enabled=True):
-    print("Processing file", path, "with method", method, "enabled", enabled)
-    if not enabled:
         return "", "", []
     # benchmarking
@@ -84,7 +85,6 @@ with gr.Blocks(
     output_tabs = []
     visualization_sub_tabs = []
     first_method = supported_methods[0]
-    num_methods = len(supported_methods)
     with gr.Row():
         with gr.Column(variant="panel", scale=5):
@@ -106,7 +106,9 @@ with gr.Blocks(
                 )
             with gr.Row():
                 visual_checkbox = gr.Checkbox(
-                    label="Enable debug visualizations", value=True
                 )
             with gr.Row():
                 convert_btn = gr.Button("Convert", variant="primary", scale=2)
@@ -134,7 +136,10 @@ with gr.Blocks(
                                     line_breaks=True,
                                     latex_delimiters=latex_delimiters,
                                 )
-                            with gr.Tab("Debug visualizations") as visual_sub_tab:
                                 debug_images = gr.Gallery(
                                     show_label=False,
                                     container=False,
@@ -159,16 +164,35 @@ with gr.Blocks(
     )
     for idx, method in enumerate(supported_methods):
-        def progress_message(idx=idx, method=method):
-            return f"Processing ({idx + 1} / {num_methods}) **{method}**...\n\n"
         def process_method(input_file, selected_methods, method=method):
             return convert_document(
                 input_file, method=method, enabled=method in selected_methods
             )
         click_event = click_event.then(
-            fn=lambda idx=idx, method=method: progress_message(idx, method),
             outputs=[progress_status],
         ).then(
             fn=lambda input_file, methods, method=method: process_method(

     convert_mineru,
     convert_unstructured,
 )
+from backends.settings import ENABLE_DEBUG_MODE
 from utils import remove_images_from_markdown, trim_pages
 TRIMMED_PDF_PATH = Path("/tmp/gradio/trim")
 def convert_document(path, method, enabled=True):
+    if enabled:
+        print("Processing file", path, "with method", method)
+    else:
         return "", "", []
     # benchmarking
     output_tabs = []
     visualization_sub_tabs = []
     first_method = supported_methods[0]
     with gr.Row():
         with gr.Column(variant="panel", scale=5):
                 )
             with gr.Row():
                 visual_checkbox = gr.Checkbox(
+                    label="Enable debug visualizations",
+                    visible=ENABLE_DEBUG_MODE,
+                    value=True,
                 )
             with gr.Row():
                 convert_btn = gr.Button("Convert", variant="primary", scale=2)
                                     line_breaks=True,
                                     latex_delimiters=latex_delimiters,
                                 )
+                            with gr.Tab(
+                                "Debug visualizations",
+                                visible=ENABLE_DEBUG_MODE,
+                            ) as visual_sub_tab:
                                 debug_images = gr.Gallery(
                                     show_label=False,
                                     container=False,
     )
     for idx, method in enumerate(supported_methods):
+        def progress_message(selected_methods, method=method):
+            selected_methods_indices = [
+                idx
+                for idx, current_method in enumerate(supported_methods)
+                if current_method in selected_methods
+            ]
+            try:
+                current_method_idx = selected_methods_indices.index(
+                    supported_methods.index(method)
+                )
+                msg = (
+                    f"Processing ({current_method_idx + 1} / "
+                    f"{len(selected_methods)}) **{method}**...\n\n"
+                )
+            except ValueError:
+                msg = gr.update()
+            return msg
         def process_method(input_file, selected_methods, method=method):
+            if input_file is None:
+                raise ValueError("Please upload a PDF file first!")
             return convert_document(
                 input_file, method=method, enabled=method in selected_methods
             )
         click_event = click_event.then(
+            fn=lambda methods, method=method: progress_message(methods, method),
+            inputs=[methods],
             outputs=[progress_status],
         ).then(
             fn=lambda input_file, methods, method=method: process_method(

backends/docling.py CHANGED Viewed

@@ -10,6 +10,8 @@ from docling.datamodel.settings import settings
 from docling.document_converter import DocumentConverter, PdfFormatOption
 from docling_core.types.doc import ImageRefMode
 DOCLING_DEBUG_PATH = Path("/tmp/docling")
 # Docling settings
@@ -23,8 +25,8 @@ pipeline_options.images_scale = 2.0
 # debug visualization settings
 settings.debug.debug_output_path = str(DOCLING_DEBUG_PATH)
-settings.debug.visualize_layout = True
-settings.debug.visualize_tables = True
 # Docling init
 docling_converter = DocumentConverter(

 from docling.document_converter import DocumentConverter, PdfFormatOption
 from docling_core.types.doc import ImageRefMode
+from .settings import ENABLE_DEBUG_MODE
 DOCLING_DEBUG_PATH = Path("/tmp/docling")
 # Docling settings
 # debug visualization settings
 settings.debug.debug_output_path = str(DOCLING_DEBUG_PATH)
+settings.debug.visualize_layout = ENABLE_DEBUG_MODE
+settings.debug.visualize_tables = ENABLE_DEBUG_MODE
 # Docling init
 docling_converter = DocumentConverter(

backends/marker.py CHANGED Viewed

@@ -8,11 +8,13 @@ from marker.models import create_model_dict
 from marker.output import text_from_rendered
 from marker.settings import settings
 # Marker init
 marker_converter = PdfConverter(
     artifact_dict=create_model_dict(),
     config={
-        "debug_pdf_images": True,
     },
 )

 from marker.output import text_from_rendered
 from marker.settings import settings
+from .settings import ENABLE_DEBUG_MODE
 # Marker init
 marker_converter = PdfConverter(
     artifact_dict=create_model_dict(),
     config={
+        "debug_pdf_images": ENABLE_DEBUG_MODE,
     },
 )

backends/mineru.py CHANGED Viewed

@@ -7,6 +7,8 @@ import pymupdf
 from magic_pdf.data.data_reader_writer import FileBasedDataReader
 from magic_pdf.tools.common import do_parse, prepare_env
 MINERU_DEBUG_PATH = Path("/tmp/mineru")
 MINERU_DEBUG_PATH.mkdir(exist_ok=True)
@@ -48,6 +50,8 @@ def do_process_mineru(input_path, output_dir):
         parse_method,
         debug_able=False,
         f_dump_orig_pdf=False,
         formula_enable=False,
         table_enable=True,
     )

 from magic_pdf.data.data_reader_writer import FileBasedDataReader
 from magic_pdf.tools.common import do_parse, prepare_env
+from .settings import ENABLE_DEBUG_MODE
 MINERU_DEBUG_PATH = Path("/tmp/mineru")
 MINERU_DEBUG_PATH.mkdir(exist_ok=True)
         parse_method,
         debug_able=False,
         f_dump_orig_pdf=False,
+        f_draw_layout_bbox=ENABLE_DEBUG_MODE,
+        f_draw_char_bbox=ENABLE_DEBUG_MODE,
         formula_enable=False,
         table_enable=True,
     )

backends/settings.py ADDED Viewed

@@ -0,0 +1,3 @@
+import os
+
+ENABLE_DEBUG_MODE = os.environ.get("ENABLE_DEBUG_MODE", "True").lower() == "true"

backends/unstructured.py CHANGED Viewed

@@ -5,6 +5,8 @@ from matplotlib import font_manager
 from unstructured.partition.pdf import partition_pdf
 from unstructured.partition.pdf_image.analysis import bbox_visualisation
 UNSTRUCTURED_DEBUG_PATH = Path("/tmp/unstructured")
@@ -59,7 +61,7 @@ def convert_unstructured(path: str, file_name: str):
         # extract_images_in_pdf=True,
         extract_image_block_types=["Image", "Table"],
         extract_image_block_to_payload=True,
-        analysis=True,
         analyzed_image_output_dir_path=UNSTRUCTURED_DEBUG_PATH,
     )
     text = convert_elements_to_markdown(elements)

 from unstructured.partition.pdf import partition_pdf
 from unstructured.partition.pdf_image.analysis import bbox_visualisation
+from .settings import ENABLE_DEBUG_MODE
 UNSTRUCTURED_DEBUG_PATH = Path("/tmp/unstructured")
         # extract_images_in_pdf=True,
         extract_image_block_types=["Image", "Table"],
         extract_image_block_to_payload=True,
+        analysis=ENABLE_DEBUG_MODE,
         analyzed_image_output_dir_path=UNSTRUCTURED_DEBUG_PATH,
     )
     text = convert_elements_to_markdown(elements)