taprosoft
committed on
Commit
·
eda147a
1
Parent(s):
c587922
fix: update default config for Docling
Browse files
- backends/docling.py +1 -0
- backends/mineru.py +1 -0
backends/docling.py
CHANGED
@@ -20,6 +20,7 @@ pipeline_options = PdfPipelineOptions()
|
|
20 |
pipeline_options.accelerator_options = accelerator_options
|
21 |
pipeline_options.do_ocr = True
|
22 |
pipeline_options.do_table_structure = True
|
|
|
23 |
pipeline_options.generate_picture_images = True
|
24 |
pipeline_options.images_scale = 2.0
|
25 |
|
|
|
20 |
pipeline_options.accelerator_options = accelerator_options
|
21 |
pipeline_options.do_ocr = True
|
22 |
pipeline_options.do_table_structure = True
|
23 |
+
pipeline_options.do_formula_enrichment = True
|
24 |
pipeline_options.generate_picture_images = True
|
25 |
pipeline_options.images_scale = 2.0
|
26 |
|
backends/mineru.py
CHANGED
@@ -53,6 +53,7 @@ def do_process_mineru(input_path, output_dir):
|
|
53 |
f_draw_layout_bbox=ENABLE_DEBUG_MODE,
|
54 |
f_draw_char_bbox=False,
|
55 |
formula_enable=False,
|
|
|
56 |
table_enable=True,
|
57 |
)
|
58 |
return local_md_dir, file_name
|
|
|
53 |
f_draw_layout_bbox=ENABLE_DEBUG_MODE,
|
54 |
f_draw_char_bbox=False,
|
55 |
formula_enable=False,
|
56 |
+
# disable formula recognition due to dependency issue
|
57 |
table_enable=True,
|
58 |
)
|
59 |
return local_md_dir, file_name
|