Soumen committed on
Commit
25ae3be
·
1 Parent(s): 5167da5

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -3
app.py CHANGED
@@ -50,13 +50,15 @@ import pytesseract
50
  from PIL import Image
51
  @st.experimental_singleton
52
  def read_pdf(file):
53
- #images=pdf2image.convert_from_bytes(file.read(),"rb")
 
54
  pdfReader = PdfFileReader(file)
55
  count = pdfReader.numPages
56
  all_page_text = ""
57
  for i in range(count):
58
- page = pdfReader.getPage(i)
59
- img = Image.open(page.to_image())
 
60
  img = img.save("img.png")
61
  image_name = cv2.imread("img.png")
62
  # get co-ordinates to cr
 
50
  from PIL import Image
51
  @st.experimental_singleton
52
  def read_pdf(file):
53
+ images=pdf2image.convert_from_bytes(file.read())
54
+ print(type(images))
55
  pdfReader = PdfFileReader(file)
56
  count = pdfReader.numPages
57
  all_page_text = ""
58
  for i in range(count):
59
+ # page = pdfReader.getPage(i)
60
+ #img = Image.open(page)
61
+ img = Image.open(images[i])
62
  img = img.save("img.png")
63
  image_name = cv2.imread("img.png")
64
  # get co-ordinates to cr