mrsk1883 committed on
Commit
e1ff374
·
1 Parent(s): 5cecb0e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +22 -22
app.py CHANGED
@@ -1,34 +1,34 @@
1
  import gradio as gr
2
- from PyPDF2 import PdfReader
3
  from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
4
 
5
- model_name = "ArtifactAI/led_large_16384_arxiv_summarization"
6
- model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
7
  tokenizer = AutoTokenizer.from_pretrained(model_name)
8
 
9
  def summarize_pdf_abstract(pdf_file):
10
 
11
- try:
12
- reader = PdfReader(pdf_file)
13
- abstract_text = ""
14
- for page in reader.pages:
15
- if "Abstract" in page.extract_text() or "Introduction" in page.extract_text():
16
- abstract_text = page.extract_text()
17
- break
18
-
19
- inputs = tokenizer(abstract_text, return_tensors="pt")
20
- outputs = model.generate(**inputs)
21
- summary = tokenizer.decode(outputs[0])
22
 
23
- return {"summary": summary}
24
-
25
- except Exception as e:
26
- raise Exception(str(e))
27
 
28
  interface = gr.Interface(
29
- fn=summarize_pdf_abstract,
30
- inputs=gr.inputs.File(label="Upload PDF"),
31
- outputs=gr.outputs.Textbox(label="Summary")
32
  )
33
 
34
- interface.launch(share=True)
 
1
  import gradio as gr
2
+ from PyPDF2 import PdfReader  
3
  from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
4
 
5
+ model_name = "ArtifactAI/led_large_16384_arxiv_summarization" 
6
+ model = AutoModelForSeq2SeqLM.from_pretrained(model_name)  
7
  tokenizer = AutoTokenizer.from_pretrained(model_name)
8
 
9
  def summarize_pdf_abstract(pdf_file):
10
 
11
+   try:
12
+     reader = PdfReader(pdf_file)  
13
+     abstract_text = ""  
14
+     for page in reader.pages:
15
+       if "Abstract" in page.extract_text() or "Introduction" in page.extract_text():
16
+         abstract_text = page.extract_text()
17
+         break
18
+          
19
+     inputs = tokenizer(abstract_text, return_tensors="pt")
20
+     outputs = model.generate(**inputs) 
21
+     summary = tokenizer.decode(outputs[0])      
22
 
23
+     return {"summary": summary}
24
+    
25
+   except Exception as e:
26
+     raise Exception(str(e))
27
 
28
  interface = gr.Interface(
29
+   fn=summarize_pdf_abstract,
30
+   inputs=[gr.File(label="Upload PDF")],
31
+   outputs=[gr.Textbox(label="Summary")]
32
  )
33
 
34
+ interface.launch(share=True)