Spaces:

microsoft
/

document-image-transformer

Running

App Files Community

nielsr HF Staff committed on Mar 8, 2022

Commit

84b9078

1 Parent(s): 248dc7c

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -23

app.py CHANGED Viewed

@@ -1,29 +1,16 @@
-from transformers import AutoFeatureExtractor, AutoModelForImageClassification
 import gradio as gr
-import torch
-feature_extractor = AutoFeatureExtractor.from_pretrained("microsoft/dit-base-finetuned-rvlcdip")
-model = AutoModelForImageClassification.from_pretrained("microsoft/dit-base-finetuned-rvlcdip")
-def classify_image(image):
-   encoding = feature_extractor(image, return_tensors="pt")
-   with torch.no_grad():
-     outputs = model(**encoding)
-     logits = outputs.logits
-   predicted_class = model.config.id2label[logits.argmax(-1).item()]
-   return predicted_class
-image = gr.inputs.Image(type="pil")
-label = gr.outputs.Label(num_top_classes=3)
 title = "Document Image Transformer"
 description = "Gradio Demo for DiT, the Document Image Transformer pre-trained on IIT-CDIP, a dataset that includes 42 million document images and fine-tuned on RVL-CDIP, a dataset consisting of 400,000 grayscale images in 16 classes, with 25,000 images per class. To use it, simply add your image, or click one of the examples to load them. Read more at the links below."
 article = "<p style='text-align: center'><a href='https://huggingface.co/microsoft/dit-base-finetuned-rvlcdip' target='_blank'>Huggingface Model</a></p>"
-examples = [
-    ["coca_cola_advertisement.png"],
-    ["scientific_publication.png"]
-]
-gr.Interface(fn=classify_image, inputs=image, outputs=label, title=title, description=description, examples=examples, enable_queue=True).launch(debug=True)

 import gradio as gr
+from transformers import pipeline
 title = "Document Image Transformer"
 description = "Gradio Demo for DiT, the Document Image Transformer pre-trained on IIT-CDIP, a dataset that includes 42 million document images and fine-tuned on RVL-CDIP, a dataset consisting of 400,000 grayscale images in 16 classes, with 25,000 images per class. To use it, simply add your image, or click one of the examples to load them. Read more at the links below."
 article = "<p style='text-align: center'><a href='https://huggingface.co/microsoft/dit-base-finetuned-rvlcdip' target='_blank'>Huggingface Model</a></p>"
+pipe = pipeline(task="image-classification",
+                model="microsoft/dit-base-finetuned-rvlcdip")
+gr.Interface.from_pipeline(pipe,
+                           title=title,
+                           description=description,
+                           examples=['coca_cola_advertisement.png', 'scientific_publication.png',],
+                           article=article,
+                           enable_queue=True,
+                           ).launch()