Update app.py
Browse files
app.py
CHANGED
@@ -50,13 +50,15 @@ import pytesseract
|
|
50 |
from PIL import Image
|
51 |
@st.experimental_singleton
|
52 |
def read_pdf(file):
|
53 |
-
|
|
|
54 |
pdfReader = PdfFileReader(file)
|
55 |
count = pdfReader.numPages
|
56 |
all_page_text = ""
|
57 |
for i in range(count):
|
58 |
-
|
59 |
-
img = Image.open(page
|
|
|
60 |
img = img.save("img.png")
|
61 |
image_name = cv2.imread("img.png")
|
62 |
# get co-ordinates to cr
|
|
|
50 |
from PIL import Image
|
51 |
@st.experimental_singleton
|
52 |
def read_pdf(file):
|
53 |
+
images=pdf2image.convert_from_bytes(file.read())
|
54 |
+
print(type(images))
|
55 |
pdfReader = PdfFileReader(file)
|
56 |
count = pdfReader.numPages
|
57 |
all_page_text = ""
|
58 |
for i in range(count):
|
59 |
+
# page = pdfReader.getPage(i)
|
60 |
+
#img = Image.open(page)
|
61 |
+
img = Image.open(images[i])
|
62 |
img = img.save("img.png")
|
63 |
image_name = cv2.imread("img.png")
|
64 |
# get co-ordinates to cr
|