Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -3,16 +3,22 @@ import argparse
|
|
3 |
import torch
|
4 |
from donut import DonutModel
|
5 |
from pdf2image import convert_from_path
|
|
|
6 |
|
7 |
def demo_process(pdf_file):
    """Placeholder handler: ignore the upload and return a fixed count.

    The argument is accepted only so the function matches the signature the
    Gradio interface calls; it is never read.

    Returns:
        The length of a hard-coded five-element list, as a string ("5").
    """
    placeholder_items = [1, 2, 3, 4, 5]
    item_count = len(placeholder_items)
    return str(item_count)
|
12 |
-
# model = DonutModel.from_pretrained("uartimcs/donut-invoice-extract")
|
13 |
-
# model.eval()
|
14 |
task_name = "SGSInvoice"
|
15 |
task_prompt = f"<s_{task_name}>"
|
16 |
|
17 |
-
demo = gr.Interface(fn=demo_process,inputs=gr.File(label="Upload PDF"),outputs="
|
18 |
demo.launch()
|
|
|
3 |
import torch
|
4 |
from donut import DonutModel
|
5 |
from pdf2image import convert_from_path
|
6 |
+
from poppler import load_from_file, PageRenderer
|
7 |
|
8 |
def demo_process(pdf_file):
    """Run the Donut model on the first page of an uploaded PDF.

    Args:
        pdf_file: The upload object handed over by the Gradio ``File`` input;
            only its ``name`` attribute (the path on disk) is read.

    Returns:
        The first entry of the ``"predictions"`` list returned by
        ``model.inference``.

    Raises:
        ValueError: If nothing was uploaded or the PDF yields no page.
    """
    if pdf_file is None:
        raise ValueError("No PDF file was uploaded.")

    # The previous version passed python-poppler's raw pixel buffer
    # (``image.data``, plain bytes) as ``image=``.  Rasterise with pdf2image
    # instead: it is already imported by this file and yields PIL images.
    # NOTE(review): DonutModel.inference is expected to take a PIL image --
    # confirm against the installed donut version.
    # Only page 1 is rendered, matching the original ``create_page(0)``.
    pages = convert_from_path(pdf_file.name, first_page=1, last_page=1)
    if not pages:
        raise ValueError("The uploaded PDF does not contain any pages.")

    result = model.inference(image=pages[0], prompt=task_prompt)
    return result["predictions"][0]
|
17 |
|
18 |
+
# Task identifier and the prompt token derived from it; demo_process reads
# task_prompt at call time.
task_name = "SGSInvoice"
task_prompt = f"<s_{task_name}>"

# Load the checkpoint once at import time and call eval() on it before any
# request is served.
model = DonutModel.from_pretrained("uartimcs/donut-invoice-extract")
model.eval()

# Single-input Gradio UI: a PDF upload goes in, demo_process output is shown
# through the "json" output component.
demo = gr.Interface(
    fn=demo_process,
    inputs=gr.File(label="Upload PDF"),
    outputs="json",
    title=f"Donut 🍩 demonstration for `{task_name}` task",
)
demo.launch()
|