ArOCR-writting / app.py
gagan3012's picture
Update app.py
ba6396d
import pandas as pd
from PIL import Image
import streamlit as st
from streamlit_drawable_canvas import st_canvas
from transformers import TrOCRProcessor, VisionEncoderDecoderModel
processor = TrOCRProcessor.from_pretrained("UBC-NLP/ArOCR-Fonts-v2")
model = VisionEncoderDecoderModel.from_pretrained("UBC-NLP/ArOCR-Fonts-v2")
def predict(img):
# if img is None:
# _,generated_text=main(image)
# return generated_text
# else:
images = Image.fromarray(img).convert("RGB")
pixel_values = processor(images, return_tensors="pt").pixel_values
# PIL_image = Image.fromarray(np.uint8(pixel_values.squeeze()[0,:,:])).convert('RGB')
generated_ids = model.generate(pixel_values,max_length=512)
generated_text = processor.batch_decode(
generated_ids, skip_special_tokens=True)[0]
return generated_text
# Specify canvas parameters in application
stroke_width = st.sidebar.slider("Stroke width: ", 1, 25, 3)
stroke_color = st.sidebar.color_picker("Stroke color hex: ")
bg_color = st.sidebar.color_picker("Background color hex: ", "#eee")
bg_image = st.sidebar.file_uploader("Background image:", type=["png", "jpg"])
realtime_update = st.sidebar.checkbox("Update in realtime", True)
# Create a canvas component
canvas_result = st_canvas(
fill_color="rgba(255, 165, 0, 0.3)", # Fixed fill color with some opacity
stroke_width=stroke_width,
stroke_color=stroke_color,
background_color=bg_color,
background_image=Image.open(bg_image) if bg_image else None,
update_streamlit=realtime_update,
height=200,
drawing_mode="freedraw",
display_toolbar=st.sidebar.checkbox("Display toolbar", True),
key="full_app",
)
# Do something interesting with the image data and paths
if canvas_result.image_data is not None:
st.image(canvas_result.image_data)
st.text(predict(canvas_result.image_data))