uartimcs committed on
Commit
e06eb7e
·
verified ·
1 Parent(s): 384caa2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -6
app.py CHANGED
@@ -3,16 +3,22 @@ import argparse
3
  import torch
4
  from donut import DonutModel
5
  from pdf2image import convert_from_path
 
6
 
7
  def demo_process(pdf_file):
 
 
 
 
 
 
 
 
8
 
9
- images = convert_from_path(pdf_file.name)
10
- # output = model.inference(image=input_img, prompt=task_prompt)["predictions"][0]
11
- return str(len([1,2,3,4,5]))
12
- # model = DonutModel.from_pretrained("uartimcs/donut-invoice-extract")
13
- # model.eval()
14
  task_name = "SGSInvoice"
15
  task_prompt = f"<s_{task_name}>"
16
 
17
- demo = gr.Interface(fn=demo_process,inputs=gr.File(label="Upload PDF"),outputs="text", title=f"Donut 🍩 demonstration for `{task_name}` task",)
18
  demo.launch()
 
3
  import torch
4
  from donut import DonutModel
5
  from pdf2image import convert_from_path
6
+ from poppler import load_from_file, PageRenderer
7
 
8
  def demo_process(pdf_file):
9
+ pdf_document = load_from_file(pdf_file.name)
10
+ page_1 = pdf_document.create_page(0)
11
+
12
+ renderer = PageRenderer()
13
+ image = renderer.render_page(page_1)
14
+ image_data = image.data
15
+ output = model.inference(image=image_data, prompt=task_prompt)["predictions"][0]
16
+ return output
17
 
18
+ model = DonutModel.from_pretrained("uartimcs/donut-invoice-extract")
19
+ model.eval()
 
 
 
20
  task_name = "SGSInvoice"
21
  task_prompt = f"<s_{task_name}>"
22
 
23
+ demo = gr.Interface(fn=demo_process,inputs=gr.File(label="Upload PDF"),outputs="json", title=f"Donut 🍩 demonstration for `{task_name}` task",)
24
  demo.launch()