Spaces:

Soumen
/

Text-Summarization-and-NLP-tasks

Running

Soumen committed on Nov 25, 2022

Commit

d0ba2f9

1 Parent(s): f780d66

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -50,7 +50,7 @@ import pytesseract
 from PIL import Image
 @st.experimental_singleton
 def read_pdf(file):
-    images=pdf2image.convert_from_bytes(file.read())
     # print(type(images))
     # pdfReader = PdfFileReader(file)
     # count = pdfReader.numPages
@@ -124,7 +124,10 @@ def main():
     if st.session_state["photo"]=="done" or message:
         #text=""
         if uploaded_photo.type=='application/pdf':
-            text = read_pdf(uploaded_photo)
             #text = pytesseract.image_to_string(img, lang="ben") if st.checkbox("Mark to see Bangla Image's Text") else pytesseract.image_to_string(img)
             st.success(text)
         elif uploaded_photo.type != "application/image":

 from PIL import Image
 @st.experimental_singleton
 def read_pdf(file):
+    images=pdf2image.convert_from_path(file)
     # print(type(images))
     # pdfReader = PdfFileReader(file)
     # count = pdfReader.numPages
     if st.session_state["photo"]=="done" or message:
         #text=""
         if uploaded_photo.type=='application/pdf':
+            file = uploaded_file.read() # Read the data
+            image_result = open(uploaded_file.name, 'wb') # creates a writable image and later we can write the decoded result
+            image_result.write(file)
+            text = read_pdf(image_result)
             #text = pytesseract.image_to_string(img, lang="ben") if st.checkbox("Mark to see Bangla Image's Text") else pytesseract.image_to_string(img)
             st.success(text)
         elif uploaded_photo.type != "application/image":