Spaces:
Sleeping
Sleeping
app.py
Browse filesTest Image-Text to Text Models
app.py
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import streamlit as st
|
2 |
+
from transformers import AutoProcessor, UdopForConditionalGeneration
|
3 |
+
from datasets import load_dataset
|
4 |
+
|
5 |
+
@st.cache_resource
def _load_processor():
    """Load the UDOP processor once and reuse it across Streamlit reruns.

    Streamlit re-executes this script from top to bottom on every user
    interaction; caching the loader keeps the processor from being rebuilt
    on each rerun.

    Returns:
        The processor for "microsoft/udop-large", created with
        ``apply_ocr=True``.
    """
    return AutoProcessor.from_pretrained("microsoft/udop-large", apply_ocr=True)


# Keep the module-level name so the rest of the script can use it unchanged.
processor = _load_processor()
|
6 |
+
@st.cache_resource
def _load_model():
    """Load the UDOP generation model once and reuse it across Streamlit reruns.

    Streamlit re-executes this script from top to bottom on every user
    interaction; without caching, the "microsoft/udop-large" weights would be
    loaded again on each rerun.

    Returns:
        The ``UdopForConditionalGeneration`` model for "microsoft/udop-large".
    """
    return UdopForConditionalGeneration.from_pretrained("microsoft/udop-large")


# Keep the module-level name so the rest of the script can use it unchanged.
model = _load_model()
|
7 |
+
|
8 |
+
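# encoding = processor(image, question, words, boxes=boxes, return_tensors="pt")  # NOTE(review): the processor is created with apply_ocr=True, so it runs OCR itself; drop words/boxes here or create it with apply_ocr=False - confirm against the UDOP docs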
|
9 |
+
|
10 |
+
# predicted_ids = model.generate(**encoding)
|
11 |
+
# print(processor.batch_decode(predicted_ids, skip_special_tokens=True)[0])
|