nitzanguetta
committed on
Commit
•
46b2dc4
1
Parent(s):
9a3bbfe
Add new leaderboard
Browse files- app.py +21 -0
- whoops_leaderboard_full.tsv +31 -0
app.py
ADDED
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import gradio as gr
|
2 |
+
import pandas as pd
|
3 |
+
|
4 |
+
|
5 |
+
df = pd.read_table("whoops_leaderboard_full.tsv")
|
6 |
+
headline = """# WHOOPS! Leaderboard Full
|
7 |
+
To submit your results to the leaderboard, please add a "predictions" column to [this csv](https://huggingface.co/datasets/nlphuji/whoops/blob/main/whoops_dataset.csv), and send it to [this mail](mailto:yonatanbitton1@gmail.com) or [this mail](mailto:whoops.benchmark@gmail.com).
|
8 |
+
"""
|
9 |
+
|
10 |
+
demo = gr.Blocks()
|
11 |
+
with demo:
|
12 |
+
with gr.Row():
|
13 |
+
gr.Markdown(headline)
|
14 |
+
|
15 |
+
with gr.Column():
|
16 |
+
leaderboard_df = gr.components.DataFrame(
|
17 |
+
value=df,
|
18 |
+
datatype=["markdown", "number", "number", "number", "number", "number", "number"]
|
19 |
+
)
|
20 |
+
|
21 |
+
demo.launch()
|
whoops_leaderboard_full.tsv
ADDED
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
Model Image Captioning Visual Question Answering Image-Text Matching Human Metric - Explanation of Violation Auto Metric - Explanation of Violation identify - Explanation of Violation
|
3 |
+
Humans 95 92
|
4 |
+
Ground-truth Caption _ GPT3 (Oracle) 68 62 74
|
5 |
+
BLIP2 FlanT5-XXL (Fine-tuned) 177 57 84 27 24 73
|
6 |
+
BLIP2 FlanT5-XL (Fine-tuned) 174 55 81 15 18 60
|
7 |
+
Predicted Caption _ GPT3 33 42 59
|
8 |
+
BLIP2 FlanT5-XXL (Zero-shot) 120 55 71 0 0 50
|
9 |
+
CLIP ViT-L/14 (Zero-shot) 70
|
10 |
+
OFA Large (Zero-shot) 0 38
|
11 |
+
CoCa ViT-L-14 MSCOCO (Zero-shot) 102 72
|
12 |
+
BLIP Large (Zero-shot) 65 39 77
|
13 |
+
BLIP2 FlanT5-XXL (Text only FT) 2 24 94
|
14 |
+
|
15 |
+
|
16 |
+
|
17 |
+
|
18 |
+
|
19 |
+
|
20 |
+
|
21 |
+
|
22 |
+
|
23 |
+
|
24 |
+
|
25 |
+
|
26 |
+
|
27 |
+
|
28 |
+
|
29 |
+
|
30 |
+
|
31 |
+
|