Spaces:

Keemoz0
/

my-table-transformer-structure-recognition

Runtime error

Keemoz0 committed on Sep 23, 2024

Commit

32ccca8

1 Parent(s): 0fc8569

replace tesseract with easyocr

because tesseract is assumed not to work in gradio

Files changed (1) hide show

app.py CHANGED Viewed

@@ -2,7 +2,7 @@ import gradio as gr
 from huggingface_hub import hf_hub_download
 from PIL import Image
 import torch
-import pytesseract
 from transformers import AutoImageProcessor, AutoModelForObjectDetection
 # Load the processor and model for table structure recognition
@@ -13,6 +13,9 @@ model = AutoModelForObjectDetection.from_pretrained("microsoft/table-transformer
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 model.to(device)
 # Define the inference and OCR function
 def predict(image):
     # Preprocess the input image
@@ -53,8 +56,8 @@ def predict(image):
         # Crop the image to the bounding box area
         cropped_image = image.crop((left, top, right, bottom))
-        # Perform OCR on the cropped image
-        ocr_text = pytesseract.image_to_string(cropped_image)
         # Append OCR result for this box
         ocr_results.append({
@@ -74,4 +77,3 @@ interface = gr.Interface(
 # Launch the Gradio app
 interface.launch()
-#recheck gradio bugging

 from huggingface_hub import hf_hub_download
 from PIL import Image
 import torch
+import easyocr
 from transformers import AutoImageProcessor, AutoModelForObjectDetection
 # Load the processor and model for table structure recognition
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 model.to(device)
+# Initialize EasyOCR Reader
+reader = easyocr.Reader(['en'])  # You can specify the language (e.g., 'en' for English)
 # Define the inference and OCR function
 def predict(image):
     # Preprocess the input image
         # Crop the image to the bounding box area
         cropped_image = image.crop((left, top, right, bottom))
+        # Perform OCR using EasyOCR
+        ocr_text = reader.readtext(cropped_image, detail=0)  # detail=0 returns just the text
         # Append OCR result for this box
         ocr_results.append({
 # Launch the Gradio app
 interface.launch()