nickmuchi committed on
Commit
2554e39
·
1 Parent(s): 2e065a4

Error scenario for blank PDF pages

Browse files

Add a try/except block around page retrieval and text extraction so that blank PDF pages that raise an error are skipped

Files changed (1) hide show
  1. app.py +9 -3
app.py CHANGED
@@ -64,9 +64,15 @@ def extract_text_from_file(file):
64
  pdf_title = pdfReader.getDocumentInfo().title
65
 
66
  for i in range(count):
67
- page = pdfReader.getPage(i)
68
- all_text += page.extractText()
69
- file_text = all_text
 
 
 
 
 
 
70
 
71
  return file_text, pdf_title
72
 
 
64
  pdf_title = pdfReader.getDocumentInfo().title
65
 
66
  for i in range(count):
67
+
68
+ try:
69
+ page = pdfReader.getPage(i)
70
+ all_text += page.extractText()
71
+
72
+ except:
73
+ continue
74
+
75
+ file_text = all_text
76
 
77
  return file_text, pdf_title
78