OCR_Tutorial / app.py
llmat's picture
Update app.py
001f24f verified
raw
history blame
923 Bytes
import gradio as gr
import cv2
import pytesseract
from PIL import Image
def ocr(image):
# Step 1: Convert the image to gray scale
gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
# Step 2: Perform OCR on the image
text = pytesseract.image_to_string(gray)
# Step 3: Prepare the output
output = {
"step1": "The first step is to convert the image to grayscale. This often improves the accuracy of OCR.",
"step1_image": gray,
"step2": "The second step is to perform OCR on the grayscale image using pytesseract.",
"step2_text": text
}
return output
def process_output(output):
output["step1_image"] = Image.fromarray(output["step1_image"])
return output
iface = gr.Interface(fn=ocr,
inputs=gr.Image(type="pil"),
outputs=["text", "image", "text", "text"])
iface.process_output = process_output
iface.launch()