nitzanguetta
committed on
Commit
·
46b2dc4
1
Parent(s):
9a3bbfe
Add new leaderboard
Browse files- app.py +21 -0
- whoops_leaderboard_full.tsv +31 -0
app.py
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import gradio as gr
|
| 2 |
+
import pandas as pd
|
| 3 |
+
|
| 4 |
+
|
| 5 |
+
# Leaderboard results, loaded once at start-up. `read_table` parses the file
# as tab-separated by default.
df = pd.read_table("whoops_leaderboard_full.tsv")

# Markdown rendered above the table: page title plus submission instructions.
headline = """# WHOOPS! Leaderboard Full
To submit your results to the leaderboard, please add a "predictions" column to [this csv](https://huggingface.co/datasets/nlphuji/whoops/blob/main/whoops_dataset.csv), and send to [this mail](mailto:[email protected]) or [this mail](mailto:[email protected]).
"""

# NOTE(review): Row and Column are laid out as siblings inside the Blocks
# context — confirm against the intended page layout.
demo = gr.Blocks()
with demo:
    with gr.Row():
        gr.Markdown(headline)

    with gr.Column():
        leaderboard_df = gr.components.DataFrame(
            value=df,
            # One entry per displayed column: the first is rendered as
            # markdown, the remaining six as numbers.
            datatype=["markdown", "number", "number", "number", "number", "number", "number"],
        )

# Start the Gradio server for this app.
demo.launch()
|
whoops_leaderboard_full.tsv
ADDED
|
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
|
| 2 |
+
Model Image Captioning Visual Question Answering Image-Text Matching Human Metric - Explanation of Violation Auto Metric - Explanation of Violation identify - Explanation of Violation
|
| 3 |
+
Humans 95 92
|
| 4 |
+
Ground-truth Caption _ GPT3 (Oracle) 68 62 74
|
| 5 |
+
BLIP2 FlanT5-XXL (Fine-tuned) 177 57 84 27 24 73
|
| 6 |
+
BLIP2 FlanT5-XL (Fine-tuned) 174 55 81 15 18 60
|
| 7 |
+
Predicted Caption _ GPT3 33 42 59
|
| 8 |
+
BLIP2 FlanT5-XXL (Zero-shot) 120 55 71 0 0 50
|
| 9 |
+
CLIP ViT-L/14 (Zero-shot) 70
|
| 10 |
+
OFA Large (Zero-shot) 0 38
|
| 11 |
+
CoCa ViT-L-14 MSCOCO (Zero-shot) 102 72
|
| 12 |
+
BLIP Large (Zero-shot) 65 39 77
|
| 13 |
+
BLIP2 FlanT5-XXL (Text only FT) 2 24 94
|
| 14 |
+
|
| 15 |
+
|
| 16 |
+
|
| 17 |
+
|
| 18 |
+
|
| 19 |
+
|
| 20 |
+
|
| 21 |
+
|
| 22 |
+
|
| 23 |
+
|
| 24 |
+
|
| 25 |
+
|
| 26 |
+
|
| 27 |
+
|
| 28 |
+
|
| 29 |
+
|
| 30 |
+
|
| 31 |
+
|