nielsr HF staff committed on
Commit
b59fa62
1 Parent(s): 6d77d30

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -0
app.py CHANGED
@@ -26,5 +26,9 @@ question = gr.inputs.Textbox(label="Question")
26
  answer = gr.outputs.Textbox(label="Predicted answer")
27
  examples = [["cats.jpg", "How many cats are there?"], ["banana.png", "What is the mustache made of?"]]
28
 
 
 
 
 
29
  interface = gr.Interface(fn=answer_question, inputs=[image, question], outputs=answer, examples=examples, enable_queue=True)
30
  interface.launch(debug=True)
 
26
  answer = gr.outputs.Textbox(label="Predicted answer")
27
  examples = [["cats.jpg", "How many cats are there?"], ["banana.png", "What is the mustache made of?"]]
28
 
29
+ title = "Interactive demo: ViLT"
30
+ description = "Gradio Demo for Vision and Language Transformer (ViLT) model fine-tuned on VQAv2 To use it, simply upload your image and type a question and click 'submit', or click one of the examples to load them. Read more at the links below."
31
+ article = "<p style='text-align: center'><a href='https://arxiv.org/abs/2102.03334' target='_blank'>ViLT: Vision-and-Language Transformer Without Convolution or Region Supervision</a> | <a href='https://github.com/dandelin/ViLT' target='_blank'>Github Repo</a></p>"
32
+
33
  interface = gr.Interface(fn=answer_question, inputs=[image, question], outputs=answer, examples=examples, enable_queue=True)
34
  interface.launch(debug=True)