taprosoft committed on
Commit
eda147a
·
1 Parent(s): c587922

fix: update default config for Docling

Browse files
Files changed (2) hide show
  1. backends/docling.py +1 -0
  2. backends/mineru.py +1 -0
backends/docling.py CHANGED
@@ -20,6 +20,7 @@ pipeline_options = PdfPipelineOptions()
20
  pipeline_options.accelerator_options = accelerator_options
21
  pipeline_options.do_ocr = True
22
  pipeline_options.do_table_structure = True
 
23
  pipeline_options.generate_picture_images = True
24
  pipeline_options.images_scale = 2.0
25
 
 
20
  pipeline_options.accelerator_options = accelerator_options
21
  pipeline_options.do_ocr = True
22
  pipeline_options.do_table_structure = True
23
+ pipeline_options.do_formula_enrichment = True
24
  pipeline_options.generate_picture_images = True
25
  pipeline_options.images_scale = 2.0
26
 
backends/mineru.py CHANGED
@@ -53,6 +53,7 @@ def do_process_mineru(input_path, output_dir):
53
  f_draw_layout_bbox=ENABLE_DEBUG_MODE,
54
  f_draw_char_bbox=False,
55
  formula_enable=False,
 
56
  table_enable=True,
57
  )
58
  return local_md_dir, file_name
 
53
  f_draw_layout_bbox=ENABLE_DEBUG_MODE,
54
  f_draw_char_bbox=False,
55
  formula_enable=False,
56
+ # disable formula recognition due to dependency issue
57
  table_enable=True,
58
  )
59
  return local_md_dir, file_name