"""Gradio demo app: upload a form image and view the processed result.

The heavy lifting is delegated to ``support.processor``; this module only
wires that function into a ``gr.Interface`` and launches it when run as a
script.
"""

import os
import subprocess
import sys

# Best-effort dependency bootstrap. This has to run BEFORE the third-party
# imports below: if a package were missing, those imports would raise before
# an install placed after them ever got a chance to run.
# ``sys.executable -m pip`` guarantees the packages land in the interpreter
# that is running this script; ``check=False`` keeps a failed install
# non-fatal, exactly like the unchecked ``os.system`` call it replaces.
if os.path.isfile("requirements.txt"):
    subprocess.run(
        [sys.executable, "-m", "pip", "install", "-r", "requirements.txt"],
        check=False,
    )

import gradio as gr  # noqa: E402  (must follow the dependency bootstrap)
from PIL import Image  # noqa: E402,F401  (kept: was imported by the original file)
from support import processor  # noqa: E402


def OCR_processor(input_image):
    """Run the project's ``processor`` on an uploaded image.

    Args:
        input_image: The uploaded image. The input component below is
            declared with ``type="pil"``, so Gradio already hands over a PIL
            image and no explicit ``Image.open`` call is needed here.

    Returns:
        Whatever ``support.processor`` returns. The output component is a
        PIL image component, so this is presumably an annotated PIL image
        (TODO confirm against ``support.processor``).
    """
    return processor(input_image)


# Sample inputs shown under the interface; paths are relative to the
# working directory the app is started from.
examples = [["eg1.png"], ["eg2.png"], ["eg3.png"]]

# NOTE(review): ``gr.inputs`` / ``gr.outputs`` and the ``theme`` / ``layout``
# keyword arguments belong to the older Gradio API. They are kept unchanged
# because the Gradio version pinned in requirements.txt is not visible here;
# confirm the pinned version before upgrading Gradio.
iface = gr.Interface(
    fn=OCR_processor,
    inputs=gr.inputs.Image(type="pil", label="Upload an Image"),
    outputs=gr.outputs.Image(type="pil", label="Processed Image"),
    title="Form understanding using Multimodal Transformers",
    examples=examples,
    description=(
        "Upload an image, and the app will process it using the LayoutLMV3 "
        "multimodal transformer. You can get all the OCR tags marked in the "
        "image as output."
    ),
    theme="huggingface",  # You can use "default", "compact", or "huggingface" themes
    layout="vertical",
    live=True,  # re-run the processor whenever the input changes
)

if __name__ == "__main__":
    iface.launch()