Keemoz0 commited on
Commit
9add349
·
1 Parent(s): a6fc7d1

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +25 -23
app.py CHANGED
@@ -36,29 +36,31 @@ def predict(image):
36
  # Unpack the normalized bounding box (x_min, y_min, x_max, y_max)
37
  x_min, y_min, x_max, y_max = box
38
 
39
- # Calculate width and height (denormalize)
40
- width = x_max - x_min
41
- height = y_max - y_min
42
-
43
- # Filter for columns based on aspect ratio (height > width)
44
- if height / width > 2: # A threshold for vertical aspect ratio (adjust if needed)
45
- # Convert normalized coordinates to pixel values
46
- left = int(x_min * image_width)
47
- top = int(y_min * image_height)
48
- right = int(x_max * image_width)
49
- bottom = int(y_max * image_height)
50
-
51
- # Crop the image to the bounding box area
52
- cropped_image = image.crop((left, top, right, bottom))
53
-
54
- # Perform OCR on the cropped image
55
- ocr_text = pytesseract.image_to_string(cropped_image)
56
-
57
- # Append OCR result for this box
58
- ocr_results.append({
59
- "box": [left, top, right, bottom],
60
- "text": ocr_text
61
- })
 
 
62
 
63
  # Return OCR results
64
  return {"ocr_results": ocr_results}
 
36
  # Unpack the normalized bounding box (x_min, y_min, x_max, y_max)
37
  x_min, y_min, x_max, y_max = box
38
 
39
+ # Ensure the coordinates are valid (x_max > x_min, y_max > y_min)
40
+ if x_min >= x_max or y_min >= y_max:
41
+ continue
42
+
43
+ # Convert normalized coordinates to pixel values
44
+ left = max(int(x_min * image_width), 0)
45
+ top = max(int(y_min * image_height), 0)
46
+ right = min(int(x_max * image_width), image_width)
47
+ bottom = min(int(y_max * image_height), image_height)
48
+
49
+ # Double-check that the coordinates are valid after conversion
50
+ if right <= left or bottom <= top:
51
+ continue
52
+
53
+ # Crop the image to the bounding box area
54
+ cropped_image = image.crop((left, top, right, bottom))
55
+
56
+ # Perform OCR on the cropped image
57
+ ocr_text = pytesseract.image_to_string(cropped_image)
58
+
59
+ # Append OCR result for this box
60
+ ocr_results.append({
61
+ "box": [left, top, right, bottom],
62
+ "text": ocr_text
63
+ })
64
 
65
  # Return OCR results
66
  return {"ocr_results": ocr_results}