Spaces:
Sleeping
Sleeping
app.py
Browse filesTest Image-Text to Text Models
app.py
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import streamlit as st
|
| 2 |
+
from transformers import AutoProcessor, UdopForConditionalGeneration
|
| 3 |
+
from datasets import load_dataset
|
| 4 |
+
|
| 5 |
+
@st.cache_resource
def _load_udop(checkpoint: str = "microsoft/udop-large"):
    """Load the UDOP processor and generation model for ``checkpoint`` once.

    Streamlit re-executes this script from the top on every rerun, so
    calling ``from_pretrained`` directly at module level would reload the
    checkpoint each time. ``st.cache_resource`` (Streamlit >= 1.18) keeps the
    returned objects alive and hands back the same instances on later reruns.

    Args:
        checkpoint: Hub model id or local path passed to ``from_pretrained``.

    Returns:
        A ``(processor, model)`` tuple. The processor is created with
        ``apply_ocr=True``.
    """
    loaded_processor = AutoProcessor.from_pretrained(checkpoint, apply_ocr=True)
    loaded_model = UdopForConditionalGeneration.from_pretrained(checkpoint)
    return loaded_processor, loaded_model


# Keep the original module-level names so the rest of the script is unchanged.
processor, model = _load_udop()
|
| 7 |
+
|
| 8 |
+
# encoding = processor(image, question, return_tensors="pt")  # apply_ocr=True: the processor runs OCR itself, so words/boxes must not be passed
|
| 9 |
+
|
| 10 |
+
# predicted_ids = model.generate(**encoding)
|
| 11 |
+
# print(processor.batch_decode(predicted_ids, skip_special_tokens=True)[0])
|