retrAIced / pages /Image to text.py
JavierGon12's picture
Insert all files
d8e07ba
raw
history blame
810 Bytes
from transformers import Pix2StructProcessor, Pix2StructForConditionalGeneration
import requests
from PIL import Image
import streamlit as st
@st.cache_resource
def _load_deplot():
    """Load the DePlot processor and model once per server process.

    Streamlit re-executes this script from top to bottom on every user
    interaction. Without caching, both ``from_pretrained`` calls would run
    again on each rerun; ``st.cache_resource`` keeps a single shared pair
    of objects alive across reruns and sessions.

    Returns:
        A ``(processor, model)`` tuple built from the ``google/deplot``
        checkpoint.
    """
    checkpoint = 'google/deplot'
    return (
        Pix2StructProcessor.from_pretrained(checkpoint),
        Pix2StructForConditionalGeneration.from_pretrained(checkpoint),
    )


# Keep the original module-level names so the rest of the page is unchanged.
processor, model = _load_deplot()
# Page flow: ask for a file, show it, then run the model with a prompt asking
# for the figure's underlying data table and print the decoded output.
document = st.file_uploader(
    label="Upload the document you want to explore",
    type=["png", "jpg", "jpeg", "pdf"],
)

if document is None:
    # Nothing uploaded yet (first render, or the user cleared the widget).
    st.write("Please upload the document in the box above")
else:
    try:
        image = Image.open(document)
    except OSError:
        # Pillow raises UnidentifiedImageError (an OSError subclass) for
        # files it cannot decode. The uploader admits PDFs, which Pillow
        # cannot read, so report the problem instead of crashing the page.
        st.error(
            "The uploaded file could not be read as an image. "
            "PDF files are not supported yet; please upload a PNG or JPEG."
        )
    else:
        # Second positional argument of st.image is the caption.
        st.image(image, "Document uploaded")
        inputs = processor(
            images=image,
            text="Generate underlying data table of the figure below:",
            return_tensors="pt",
        )
        predictions = model.generate(**inputs, max_new_tokens=512)
        # Only the first generated sequence is decoded and displayed.
        st.write(processor.decode(predictions[0], skip_special_tokens=True))