mrsk1883 committed on
Commit
5db38c7
·
1 Parent(s): efced72

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -5
app.py CHANGED
@@ -2,23 +2,23 @@ import gradio as gr
2
  from PyPDF2 import PdfReader
3
  from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
4
 
5
- model_name = "ArtifactAI/led_large_16384_arxiv_summarization" 
6
- model = AutoModelForSeq2SeqLM.from_pretrained(model_name)  
7
  tokenizer = AutoTokenizer.from_pretrained(model_name)
8
 
9
  def summarize_pdf_abstract(pdf_file):
10
 
11
    try:
12
      reader = PdfReader(pdf_file)
13
-     abstract_text = ""  
14
      for page in reader.pages:
15
        if "Abstract" in page.extract_text() or "Introduction" in page.extract_text():
16
          abstract_text = page.extract_text()
17
          break
18
           
19
      inputs = tokenizer(abstract_text, return_tensors="pt")
20
-     outputs = model.generate(**inputs) 
21
-     summary = tokenizer.decode(outputs[0])      
22
 
23
      return {"summary": summary}
24
     
 
2
  from PyPDF2 import PdfReader
3
  from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
4
 
5
+ model_name = "ArtifactAI/led_large_16384_arxiv_summarization"
6
+ model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
7
  tokenizer = AutoTokenizer.from_pretrained(model_name)
8
 
9
  def summarize_pdf_abstract(pdf_file):
10
 
11
    try:
12
      reader = PdfReader(pdf_file)
13
+     abstract_text = ""
14
      for page in reader.pages:
15
        if "Abstract" in page.extract_text() or "Introduction" in page.extract_text():
16
          abstract_text = page.extract_text()
17
          break
18
           
19
      inputs = tokenizer(abstract_text, return_tensors="pt")
20
+     outputs = model.generate(**inputs)
21
+     summary = tokenizer.decode(outputs[0])    
22
 
23
      return {"summary": summary}
24