Spaces:
Sleeping
Sleeping
File size: 334 Bytes
806d7c6 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 |
import pypdf
def read_pdf(filepath) -> list[str]:
    """Extract the text of every page in a PDF file.

    Args:
        filepath: Location of the PDF; handed straight to ``open`` in
            binary read mode.

    Returns:
        One entry per page, in the order the reader exposes its pages,
        each entry being the result of ``page.extract_text()``.
    """
    with open(filepath, 'rb') as pdf_file:
        # Extract inside the ``with`` block so the file handle is still
        # open while the reader walks the pages.
        return [page.extract_text() for page in pypdf.PdfReader(pdf_file).pages]
if __name__ == '__main__':
    # Script entry point: dump the per-page text of the sample PDF to stdout.
    print(read_pdf('data/109-411-2-PB.pdf'))
|