puppala13 committed on
Commit
c846977
·
verified ·
1 Parent(s): 6608f42

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -1,6 +1,7 @@
1
  import streamlit as st
2
  import PyPDF2
3
  import PyPDF2 as PDF
 
4
  from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
5
  from transformers import MBartForConditionalGeneration, MBart50TokenizerFast
6
 
@@ -35,11 +36,10 @@ def main():
35
  st.write(translated_text)
36
 
37
  def extract_text_from_pdf(pdf_file):
38
- pdf_reader = PyPDF2.PdfFileReader(pdf_file)
39
  text = ""
40
- for page_num in range(pdf_reader.numPages):
41
- page = pdf_reader.getPage(page_num)
42
- text += page.extractText()
43
  return text
44
 
45
  def translate_text(input_text, model, tokenizer):
 
1
  import streamlit as st
2
  import PyPDF2
3
  import PyPDF2 as PDF
4
+ from PyPDF2 import PdfReader
5
  from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
6
  from transformers import MBartForConditionalGeneration, MBart50TokenizerFast
7
 
 
36
  st.write(translated_text)
37
 
38
  def extract_text_from_pdf(pdf_file):
39
+ pdf_reader = PdfReader(pdf_file)
40
  text = ""
41
+ for page in pdf_reader.pages:
42
+ text += page.extract_text()
 
43
  return text
44
 
45
  def translate_text(input_text, model, tokenizer):