Spaces:
Sleeping
Sleeping
Omar ID EL MOUMEN
committed on
Commit
·
52717e9
1
Parent(s):
952bac3
Attempt at fix #2
Browse files
app.py
CHANGED
@@ -119,7 +119,7 @@ async def extract_pdf(pdf: PDF):
|
|
119 |
if pdf_req.status_code == 200:
|
120 |
pdf_data = BytesIO(pdf_req.content)
|
121 |
doc = fitz.open(stream=pdf_data, filetype="pdf")
|
122 |
-
pdf_text = " ".join([page.get_text("text") for page in range(
|
123 |
pdf_metadata = doc.metadata
|
124 |
print(pdf_metadata)
|
125 |
|
|
|
119 |
if pdf_req.status_code == 200:
|
120 |
pdf_data = BytesIO(pdf_req.content)
|
121 |
doc = fitz.open(stream=pdf_data, filetype="pdf")
|
122 |
+
pdf_text = " ".join([doc[page].get_text("text") for page in range(doc.page_count if pdf.page_num == -1 else pdf.page_num)])
|
123 |
pdf_metadata = doc.metadata
|
124 |
print(pdf_metadata)
|
125 |
|