nitzanguetta committed on
Commit
46b2dc4
1 Parent(s): 9a3bbfe

Add new leaderboard

Browse files
Files changed (2) hide show
  1. app.py +21 -0
  2. whoops_leaderboard_full.tsv +31 -0
app.py ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
"""Gradio app that displays the WHOOPS! full leaderboard loaded from a TSV file."""
import gradio as gr
import pandas as pd


# Leaderboard table; the path is resolved relative to the working directory.
df = pd.read_table("whoops_leaderboard_full.tsv")

# Markdown rendered above the table: page title plus submission instructions.
headline = """# WHOOPS! Leaderboard Full
To submit your results to the leaderboard, please add a "predictions" column to [this csv](https://huggingface.co/datasets/nlphuji/whoops/blob/main/whoops_dataset.csv), and send to [this mail](mailto:yonatanbitton1@gmail.com) or [this mail](mailto:whoops.benchmark@gmail.com).
"""

demo = gr.Blocks()
with demo:
    with gr.Row():
        gr.Markdown(headline)

    # NOTE(review): nesting was reconstructed from a flattened diff; the
    # Column is assumed to be a sibling of the Row above -- confirm.
    with gr.Column():
        leaderboard_df = gr.components.DataFrame(
            value=df,
            # First column is rendered as markdown, the other six as numbers.
            datatype=["markdown", "number", "number", "number", "number", "number", "number"],
        )

demo.launch()
whoops_leaderboard_full.tsv ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ Model Image Captioning Visual Question Answering Image-Text Matching Human Metric - Explanation of Violation Auto Metric - Explanation of Violation identify - Explanation of Violation
3
+ Humans 95 92
4
+ Ground-truth Caption _ GPT3 (Oracle) 68 62 74
5
+ BLIP2 FlanT5-XXL (Fine-tuned) 177 57 84 27 24 73
6
+ BLIP2 FlanT5-XL (Fine-tuned) 174 55 81 15 18 60
7
+ Predicted Caption _ GPT3 33 42 59
8
+ BLIP2 FlanT5-XXL (Zero-shot) 120 55 71 0 0 50
9
+ CLIP ViT-L/14 (Zero-shot) 70
10
+ OFA Large (Zero-shot) 0 38
11
+ CoCa ViT-L-14 MSCOCO (Zero-shot) 102 72
12
+ BLIP Large (Zero-shot) 65 39 77
13
+ BLIP2 FlanT5-XXL (Text only FT) 2 24 94
14
+
15
+
16
+
17
+
18
+
19
+
20
+
21
+
22
+
23
+
24
+
25
+
26
+
27
+
28
+
29
+
30
+
31
+