Spaces:
Running
on
Zero
Running
on
Zero
Init
#5
by
yuanshengni
- opened
This view is limited to 50 files because it contains too many changes.
See the raw diff here.
- .gitignore +0 -175
- .gitmodules +3 -0
- .idea/.gitignore +0 -8
- .idea/GenAI-Arena.iml +0 -15
- .idea/inspectionProfiles/profiles_settings.xml +0 -6
- .idea/modules.xml +0 -8
- .idea/vcs.xml +0 -6
- README.md +3 -37
- app.py +9 -27
- arena_elo/edition_model_info.json +37 -0
- arena_elo/elo_rating/clean_battle_data.py +134 -131
- arena_elo/elo_rating/elo_analysis.py +5 -40
- arena_elo/elo_rating/generate_leaderboard.py +17 -14
- arena_elo/elo_rating/model_registry.py +578 -0
- arena_elo/elo_rating/upload_battle_data.py +122 -97
- arena_elo/elo_rating/utils.py +4 -12
- arena_elo/generation_model_info.json +42 -0
- arena_elo/results/20240315/elo_results_image_editing.pkl +2 -2
- arena_elo/results/20240327/clean_battle_t2i_generation.json +0 -0
- arena_elo/results/20240327/elo_results_t2i_generation.pkl +2 -2
- arena_elo/results/20240327/t2i_generation_leaderboard.csv +10 -9
- arena_elo/results/20240328/clean_battle_image_editing.json +0 -890
- arena_elo/results/20240328/elo_results_image_editing.pkl +0 -3
- arena_elo/results/20240328/image_editing_leaderboard.csv +0 -8
- arena_elo/results/20240330/elo_results_t2i_generation.pkl +0 -3
- arena_elo/results/20240330/t2i_generation_leaderboard.csv +0 -10
- arena_elo/results/20240408/clean_battle_t2i_generation.json +0 -0
- arena_elo/results/20240408/elo_results_t2i_generation.pkl +0 -3
- arena_elo/results/20240408/t2i_generation_leaderboard.csv +0 -10
- arena_elo/results/20240411/clean_battle_image_editing.json +0 -906
- arena_elo/results/20240411/clean_battle_t2i_generation.json +0 -0
- arena_elo/results/20240411/elo_results_image_editing.pkl +0 -3
- arena_elo/results/20240411/elo_results_t2i_generation.pkl +0 -3
- arena_elo/results/20240411/image_editing_leaderboard.csv +0 -8
- arena_elo/results/20240411/t2i_generation_leaderboard.csv +0 -10
- arena_elo/results/20240428/elo_results_image_editing.pkl +0 -3
- arena_elo/results/20240428/image_editing_leaderboard.csv +0 -8
- arena_elo/results/20240501/clean_battle_t2i_generation.json +0 -0
- arena_elo/results/20240501/elo_results_t2i_generation.pkl +0 -3
- arena_elo/results/20240501/t2i_generation_leaderboard.csv +0 -11
- arena_elo/results/20240516/clean_battle_image_editing.json +0 -1578
- arena_elo/results/20240516/elo_results_image_editing.pkl +0 -3
- arena_elo/results/20240516/image_editing_leaderboard.csv +0 -10
- arena_elo/results/20240517/clean_battle_t2i_generation.json +0 -0
- arena_elo/results/20240517/elo_results_t2i_generation.pkl +0 -3
- arena_elo/results/20240517/t2i_generation_leaderboard.csv +0 -12
- arena_elo/results/20240525/clean_battle_image_editing.json +0 -0
- arena_elo/results/20240525/clean_battle_t2i_generation.json +0 -0
- arena_elo/results/20240525/elo_results_image_editing.pkl +0 -3
- arena_elo/results/20240525/elo_results_t2i_generation.pkl +0 -3
.gitignore
DELETED
@@ -1,175 +0,0 @@
|
|
1 |
-
checkpoints/
|
2 |
-
|
3 |
-
# Byte-compiled / optimized / DLL files
|
4 |
-
__pycache__/
|
5 |
-
*.py[cod]
|
6 |
-
*$py.class
|
7 |
-
src/
|
8 |
-
# C extensions
|
9 |
-
*.so
|
10 |
-
temp
|
11 |
-
|
12 |
-
# Distribution / packaging
|
13 |
-
.Python
|
14 |
-
build/
|
15 |
-
develop-eggs/
|
16 |
-
dist/
|
17 |
-
downloads/
|
18 |
-
eggs/
|
19 |
-
.eggs/
|
20 |
-
lib/
|
21 |
-
lib64/
|
22 |
-
parts/
|
23 |
-
sdist/
|
24 |
-
var/
|
25 |
-
wheels/
|
26 |
-
share/python-wheels/
|
27 |
-
*.egg-info/
|
28 |
-
.installed.cfg
|
29 |
-
*.egg
|
30 |
-
MANIFEST
|
31 |
-
|
32 |
-
# PyInstaller
|
33 |
-
# Usually these files are written by a python script from a template
|
34 |
-
# before PyInstaller builds the exe, so as to inject date/other infos into it.
|
35 |
-
*.manifest
|
36 |
-
*.spec
|
37 |
-
|
38 |
-
# Installer logs
|
39 |
-
pip-log.txt
|
40 |
-
pip-delete-this-directory.txt
|
41 |
-
|
42 |
-
# Unit test / coverage reports
|
43 |
-
htmlcov/
|
44 |
-
.tox/
|
45 |
-
.nox/
|
46 |
-
.coverage
|
47 |
-
.coverage.*
|
48 |
-
.cache
|
49 |
-
nosetests.xml
|
50 |
-
coverage.xml
|
51 |
-
*.cover
|
52 |
-
*.py,cover
|
53 |
-
.hypothesis/
|
54 |
-
.pytest_cache/
|
55 |
-
cover/
|
56 |
-
|
57 |
-
# Translations
|
58 |
-
*.mo
|
59 |
-
*.pot
|
60 |
-
|
61 |
-
# Django stuff:
|
62 |
-
*.log
|
63 |
-
local_settings.py
|
64 |
-
db.sqlite3
|
65 |
-
db.sqlite3-journal
|
66 |
-
|
67 |
-
# Flask stuff:
|
68 |
-
instance/
|
69 |
-
.webassets-cache
|
70 |
-
|
71 |
-
# Scrapy stuff:
|
72 |
-
.scrapy
|
73 |
-
|
74 |
-
# Sphinx documentation
|
75 |
-
docs/_build/
|
76 |
-
|
77 |
-
# PyBuilder
|
78 |
-
.pybuilder/
|
79 |
-
target/
|
80 |
-
|
81 |
-
# Jupyter Notebook
|
82 |
-
.ipynb_checkpoints
|
83 |
-
|
84 |
-
# IPython
|
85 |
-
profile_default/
|
86 |
-
ipython_config.py
|
87 |
-
|
88 |
-
# pyenv
|
89 |
-
# For a library or package, you might want to ignore these files since the code is
|
90 |
-
# intended to run in multiple environments; otherwise, check them in:
|
91 |
-
# .python-version
|
92 |
-
|
93 |
-
# pipenv
|
94 |
-
# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
|
95 |
-
# However, in case of collaboration, if having platform-specific dependencies or dependencies
|
96 |
-
# having no cross-platform support, pipenv may install dependencies that don't work, or not
|
97 |
-
# install all needed dependencies.
|
98 |
-
#Pipfile.lock
|
99 |
-
|
100 |
-
# poetry
|
101 |
-
# Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
|
102 |
-
# This is especially recommended for binary packages to ensure reproducibility, and is more
|
103 |
-
# commonly ignored for libraries.
|
104 |
-
# https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
|
105 |
-
#poetry.lock
|
106 |
-
|
107 |
-
# pdm
|
108 |
-
# Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
|
109 |
-
#pdm.lock
|
110 |
-
# pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
|
111 |
-
# in version control.
|
112 |
-
# https://pdm.fming.dev/#use-with-ide
|
113 |
-
.pdm.toml
|
114 |
-
|
115 |
-
# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
|
116 |
-
__pypackages__/
|
117 |
-
|
118 |
-
# Celery stuff
|
119 |
-
celerybeat-schedule
|
120 |
-
celerybeat.pid
|
121 |
-
|
122 |
-
# SageMath parsed files
|
123 |
-
*.sage.py
|
124 |
-
|
125 |
-
# Environments
|
126 |
-
.env
|
127 |
-
.venv
|
128 |
-
env/
|
129 |
-
venv/
|
130 |
-
ENV/
|
131 |
-
env.bak/
|
132 |
-
venv.bak/
|
133 |
-
|
134 |
-
# Spyder project settings
|
135 |
-
.spyderproject
|
136 |
-
.spyproject
|
137 |
-
|
138 |
-
# Rope project settings
|
139 |
-
.ropeproject
|
140 |
-
|
141 |
-
# mkdocs documentation
|
142 |
-
/site
|
143 |
-
|
144 |
-
# mypy
|
145 |
-
.mypy_cache/
|
146 |
-
.dmypy.json
|
147 |
-
dmypy.json
|
148 |
-
|
149 |
-
# Pyre type checker
|
150 |
-
.pyre/
|
151 |
-
|
152 |
-
# pytype static type analyzer
|
153 |
-
.pytype/
|
154 |
-
|
155 |
-
# Cython debug symbols
|
156 |
-
cython_debug/
|
157 |
-
|
158 |
-
# PyCharm
|
159 |
-
# JetBrains specific template is maintained in a separate JetBrains.gitignore that can
|
160 |
-
# be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
|
161 |
-
# and can be added to the global gitignore or merged into this file. For a more nuclear
|
162 |
-
# option (not recommended) you can uncomment the following to ignore the entire idea folder.
|
163 |
-
#.idea/
|
164 |
-
/tmp
|
165 |
-
/logs
|
166 |
-
/*.json
|
167 |
-
/*.jpg
|
168 |
-
/*.ipynb
|
169 |
-
/GenAI-Arena-hf-logs
|
170 |
-
/3DGen-Arena-logs*
|
171 |
-
/tmp*
|
172 |
-
/arena_elo/results/**/*.jpg
|
173 |
-
/arena_elo/results/**/*.png
|
174 |
-
/arena_elo/6_04_log_results
|
175 |
-
/arena_elo/update_elo_rating_6_04.sh
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
.gitmodules
CHANGED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
[submodule "GenAI-Arena-hf-logs"]
|
2 |
+
path = GenAI-Arena-hf-logs
|
3 |
+
url = https://github.com/jdf-prog/GenAI-Arena-hf-logs.git
|
.idea/.gitignore
DELETED
@@ -1,8 +0,0 @@
|
|
1 |
-
# Default ignored files
|
2 |
-
/shelf/
|
3 |
-
/workspace.xml
|
4 |
-
# Editor-based HTTP Client requests
|
5 |
-
/httpRequests/
|
6 |
-
# Datasource local storage ignored files
|
7 |
-
/dataSources/
|
8 |
-
/dataSources.local.xml
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
.idea/GenAI-Arena.iml
DELETED
@@ -1,15 +0,0 @@
|
|
1 |
-
<?xml version="1.0" encoding="UTF-8"?>
|
2 |
-
<module type="PYTHON_MODULE" version="4">
|
3 |
-
<component name="NewModuleRootManager">
|
4 |
-
<content url="file://$MODULE_DIR$" />
|
5 |
-
<orderEntry type="inheritedJdk" />
|
6 |
-
<orderEntry type="sourceFolder" forTests="false" />
|
7 |
-
</component>
|
8 |
-
<component name="PyDocumentationSettings">
|
9 |
-
<option name="format" value="GOOGLE" />
|
10 |
-
<option name="myDocStringFormat" value="Google" />
|
11 |
-
</component>
|
12 |
-
<component name="TemplatesService">
|
13 |
-
<option name="TEMPLATE_CONFIGURATION" value="Jinja2" />
|
14 |
-
</component>
|
15 |
-
</module>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
.idea/inspectionProfiles/profiles_settings.xml
DELETED
@@ -1,6 +0,0 @@
|
|
1 |
-
<component name="InspectionProjectProfileManager">
|
2 |
-
<settings>
|
3 |
-
<option name="USE_PROJECT_PROFILE" value="false" />
|
4 |
-
<version value="1.0" />
|
5 |
-
</settings>
|
6 |
-
</component>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
.idea/modules.xml
DELETED
@@ -1,8 +0,0 @@
|
|
1 |
-
<?xml version="1.0" encoding="UTF-8"?>
|
2 |
-
<project version="4">
|
3 |
-
<component name="ProjectModuleManager">
|
4 |
-
<modules>
|
5 |
-
<module fileurl="file://$PROJECT_DIR$/.idea/GenAI-Arena.iml" filepath="$PROJECT_DIR$/.idea/GenAI-Arena.iml" />
|
6 |
-
</modules>
|
7 |
-
</component>
|
8 |
-
</project>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
.idea/vcs.xml
DELETED
@@ -1,6 +0,0 @@
|
|
1 |
-
<?xml version="1.0" encoding="UTF-8"?>
|
2 |
-
<project version="4">
|
3 |
-
<component name="VcsDirectoryMappings">
|
4 |
-
<mapping directory="" vcs="Git" />
|
5 |
-
</component>
|
6 |
-
</project>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
README.md
CHANGED
@@ -4,44 +4,10 @@ emoji: 📈
|
|
4 |
colorFrom: purple
|
5 |
colorTo: pink
|
6 |
sdk: gradio
|
7 |
-
sdk_version: 4.
|
8 |
-
python_version: 3.12
|
9 |
app_file: app.py
|
10 |
-
pinned:
|
11 |
license: mit
|
12 |
-
tags:
|
13 |
-
- arena
|
14 |
-
- leaderboard
|
15 |
-
short_description: Realtime Image/Video Gen AI Arena
|
16 |
---
|
17 |
|
18 |
-
|
19 |
-
|
20 |
-
- for cuda 11.8
|
21 |
-
```bash
|
22 |
-
conda install pytorch torchvision torchaudio pytorch-cuda=11.8 -c pytorch -c nvidia
|
23 |
-
pip3 install -U xformers --index-url https://download.pytorch.org/whl/cu118
|
24 |
-
pip install -r requirements.txt
|
25 |
-
```
|
26 |
-
- for cuda 12.1
|
27 |
-
```bash
|
28 |
-
conda install pytorch torchvision torchaudio pytorch-cuda=12.1 -c pytorch -c nvidia
|
29 |
-
pip install -r requirements.txt
|
30 |
-
```
|
31 |
-
|
32 |
-
## Start Hugging Face UI
|
33 |
-
```bash
|
34 |
-
python app.py
|
35 |
-
```
|
36 |
-
|
37 |
-
## Start Log server
|
38 |
-
```bash
|
39 |
-
uvicorn serve.log_server:app --reload --port 22005 --host 0.0.0.0
|
40 |
-
```
|
41 |
-
|
42 |
-
## Update leaderboard
|
43 |
-
```bash
|
44 |
-
cd arena_elo && bash update_leaderboard.sh
|
45 |
-
```
|
46 |
-
|
47 |
-
Paper: arxiv.org/abs/2406.04485
|
|
|
4 |
colorFrom: purple
|
5 |
colorTo: pink
|
6 |
sdk: gradio
|
7 |
+
sdk_version: 4.21.0
|
|
|
8 |
app_file: app.py
|
9 |
+
pinned: false
|
10 |
license: mit
|
|
|
|
|
|
|
|
|
11 |
---
|
12 |
|
13 |
+
Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
app.py
CHANGED
@@ -2,7 +2,6 @@ import gradio as gr
|
|
2 |
import os
|
3 |
from serve.gradio_web import *
|
4 |
from serve.gradio_web_image_editing import *
|
5 |
-
from serve.gradio_web_video_generation import *
|
6 |
from serve.leaderboard import build_leaderboard_tab
|
7 |
from model.model_manager import ModelManager
|
8 |
from pathlib import Path
|
@@ -24,11 +23,13 @@ def build_combine_demo(models, elo_results_file, leaderboard_table_file):
|
|
24 |
with gr.Tab("Generation Arena (side-by-side)", id=1):
|
25 |
build_side_by_side_ui_named(models)
|
26 |
|
27 |
-
with gr.Tab("Generation
|
28 |
build_single_model_ui(models, add_promotion_links=True)
|
29 |
if elo_results_file:
|
30 |
with gr.Tab("Generation Leaderboard", id=3):
|
31 |
build_leaderboard_tab(elo_results_file['t2i_generation'], leaderboard_table_file['t2i_generation'])
|
|
|
|
|
32 |
|
33 |
with gr.Tab("Image Edition", id=5):
|
34 |
with gr.Tabs() as tabs_ie:
|
@@ -38,27 +39,13 @@ def build_combine_demo(models, elo_results_file, leaderboard_table_file):
|
|
38 |
with gr.Tab("Edition Arena (side-by-side)", id=6):
|
39 |
build_side_by_side_ui_named_ie(models)
|
40 |
|
41 |
-
with gr.Tab("Edition
|
42 |
build_single_model_ui_ie(models, add_promotion_links=True)
|
43 |
if elo_results_file:
|
44 |
with gr.Tab("Edition Leaderboard", id=8):
|
45 |
build_leaderboard_tab(elo_results_file['image_editing'], leaderboard_table_file['image_editing'])
|
46 |
-
|
47 |
-
|
48 |
-
with gr.Tabs() as tabs_vg:
|
49 |
-
with gr.Tab("Video Generation Arena (battle)", id=10):
|
50 |
-
build_side_by_side_ui_anony_vg(models)
|
51 |
-
|
52 |
-
with gr.Tab("Video Generation Arena (side-by-side)", id=11):
|
53 |
-
build_side_by_side_ui_named_vg(models)
|
54 |
-
|
55 |
-
with gr.Tab("Video Generation Playground", id=12): #Direct Chat
|
56 |
-
build_single_model_ui_vg(models, add_promotion_links=True)
|
57 |
-
if elo_results_file and 'video_generation' in elo_results_file:
|
58 |
-
with gr.Tab("Video Generation Leaderboard", id=13):
|
59 |
-
build_leaderboard_tab(elo_results_file['video_generation'], leaderboard_table_file['video_generation'])
|
60 |
-
with gr.Tab("About Us", id=4):
|
61 |
-
build_about()
|
62 |
|
63 |
return demo
|
64 |
|
@@ -76,8 +63,6 @@ def load_elo_results(elo_results_dir):
|
|
76 |
elo_results_file['t2i_generation'] = file
|
77 |
elif 'image_editing' in file.name:
|
78 |
elo_results_file['image_editing'] = file
|
79 |
-
elif 'video_generation' in file.name:
|
80 |
-
elo_results_file['video_generation'] = file
|
81 |
else:
|
82 |
raise ValueError(f"Unknown file name: {file.name}")
|
83 |
for file in elo_results_dir.glob('*_leaderboard.csv'):
|
@@ -85,20 +70,17 @@ def load_elo_results(elo_results_dir):
|
|
85 |
leaderboard_table_file['t2i_generation'] = file
|
86 |
elif 'image_editing' in file.name:
|
87 |
leaderboard_table_file['image_editing'] = file
|
88 |
-
elif 'video_generation' in file.name:
|
89 |
-
leaderboard_table_file['video_generation'] = file
|
90 |
else:
|
91 |
raise ValueError(f"Unknown file name: {file.name}")
|
92 |
|
93 |
return elo_results_file, leaderboard_table_file
|
94 |
|
95 |
if __name__ == "__main__":
|
96 |
-
server_port =
|
97 |
root_path = ROOT_PATH
|
98 |
elo_results_dir = ELO_RESULTS_DIR
|
99 |
-
models = ModelManager(
|
100 |
-
# models = ModelManager(enable_nsfw=False, do_pre_download=False, do_debug_packages=False)
|
101 |
|
102 |
elo_results_file, leaderboard_table_file = load_elo_results(elo_results_dir)
|
103 |
demo = build_combine_demo(models, elo_results_file, leaderboard_table_file)
|
104 |
-
demo.queue(max_size=20).launch(server_port=server_port, root_path=ROOT_PATH)
|
|
|
2 |
import os
|
3 |
from serve.gradio_web import *
|
4 |
from serve.gradio_web_image_editing import *
|
|
|
5 |
from serve.leaderboard import build_leaderboard_tab
|
6 |
from model.model_manager import ModelManager
|
7 |
from pathlib import Path
|
|
|
23 |
with gr.Tab("Generation Arena (side-by-side)", id=1):
|
24 |
build_side_by_side_ui_named(models)
|
25 |
|
26 |
+
with gr.Tab("Generation Direct Chat", id=2):
|
27 |
build_single_model_ui(models, add_promotion_links=True)
|
28 |
if elo_results_file:
|
29 |
with gr.Tab("Generation Leaderboard", id=3):
|
30 |
build_leaderboard_tab(elo_results_file['t2i_generation'], leaderboard_table_file['t2i_generation'])
|
31 |
+
with gr.Tab("About Us", id=4):
|
32 |
+
build_about()
|
33 |
|
34 |
with gr.Tab("Image Edition", id=5):
|
35 |
with gr.Tabs() as tabs_ie:
|
|
|
39 |
with gr.Tab("Edition Arena (side-by-side)", id=6):
|
40 |
build_side_by_side_ui_named_ie(models)
|
41 |
|
42 |
+
with gr.Tab("Edition Direct Chat", id=7):
|
43 |
build_single_model_ui_ie(models, add_promotion_links=True)
|
44 |
if elo_results_file:
|
45 |
with gr.Tab("Edition Leaderboard", id=8):
|
46 |
build_leaderboard_tab(elo_results_file['image_editing'], leaderboard_table_file['image_editing'])
|
47 |
+
with gr.Tab("About Us", id=9):
|
48 |
+
build_about()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
49 |
|
50 |
return demo
|
51 |
|
|
|
63 |
elo_results_file['t2i_generation'] = file
|
64 |
elif 'image_editing' in file.name:
|
65 |
elo_results_file['image_editing'] = file
|
|
|
|
|
66 |
else:
|
67 |
raise ValueError(f"Unknown file name: {file.name}")
|
68 |
for file in elo_results_dir.glob('*_leaderboard.csv'):
|
|
|
70 |
leaderboard_table_file['t2i_generation'] = file
|
71 |
elif 'image_editing' in file.name:
|
72 |
leaderboard_table_file['image_editing'] = file
|
|
|
|
|
73 |
else:
|
74 |
raise ValueError(f"Unknown file name: {file.name}")
|
75 |
|
76 |
return elo_results_file, leaderboard_table_file
|
77 |
|
78 |
if __name__ == "__main__":
|
79 |
+
server_port = SERVER_PORT
|
80 |
root_path = ROOT_PATH
|
81 |
elo_results_dir = ELO_RESULTS_DIR
|
82 |
+
models = ModelManager()
|
|
|
83 |
|
84 |
elo_results_file, leaderboard_table_file = load_elo_results(elo_results_dir)
|
85 |
demo = build_combine_demo(models, elo_results_file, leaderboard_table_file)
|
86 |
+
demo.queue(max_size=20).launch(server_port=server_port, root_path=ROOT_PATH)
|
arena_elo/edition_model_info.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"CycleDiffusion": {
|
3 |
+
"Link": "https://github.com/ChenWu98/cycle-diffusion",
|
4 |
+
"License": "X11",
|
5 |
+
"Organization": "Carnegie Mellon University"
|
6 |
+
},
|
7 |
+
"PNP": {
|
8 |
+
"Link": "https://github.com/MichalGeyer/plug-and-play",
|
9 |
+
"License": "-",
|
10 |
+
"Organization": "Weizmann Institute of Science"
|
11 |
+
},
|
12 |
+
"InstructPix2Pix": {
|
13 |
+
"Link": "https://www.timothybrooks.com/instruct-pix2pix",
|
14 |
+
"License": "Copyright 2023 Timothy Brooks, Aleksander Holynski, Alexei A. Efros",
|
15 |
+
"Organization": "University of California, Berkeley"
|
16 |
+
},
|
17 |
+
"Pix2PixZero": {
|
18 |
+
"Link": "https://pix2pixzero.github.io",
|
19 |
+
"License": "MIT License",
|
20 |
+
"Organization": "Carnegie Mellon University, Adobe Research"
|
21 |
+
},
|
22 |
+
"MagicBrush": {
|
23 |
+
"Link": "https://osu-nlp-group.github.io/MagicBrush",
|
24 |
+
"License": "CC-BY-4.0",
|
25 |
+
"Organization": "The Ohio State University, University of Waterloo"
|
26 |
+
},
|
27 |
+
"Prompt2prompt": {
|
28 |
+
"Link": "https://prompt-to-prompt.github.io",
|
29 |
+
"License": "Apache-2.0",
|
30 |
+
"Organization": "Google, Tel Aviv University"
|
31 |
+
},
|
32 |
+
"SDEdit": {
|
33 |
+
"Link": "https://sde-image-editing.github.io",
|
34 |
+
"License": "MIT License",
|
35 |
+
"Organization": "Stanford University"
|
36 |
+
}
|
37 |
+
}
|
arena_elo/elo_rating/clean_battle_data.py
CHANGED
@@ -18,13 +18,46 @@ ImageFile.LOAD_TRUNCATED_IMAGES = True
|
|
18 |
from tqdm import tqdm
|
19 |
|
20 |
from .basic_stats import get_log_files, NUM_SERVERS, LOG_ROOT_DIR
|
21 |
-
from .utils import detect_language, get_time_stamp_from_date
|
22 |
|
23 |
VOTES = ["tievote", "leftvote", "rightvote", "bothbad_vote"]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
24 |
|
25 |
-
def parse_model_name(model_name):
|
26 |
-
return NotImplementedError()
|
27 |
-
return model_source, model_name, model_type
|
28 |
|
29 |
def remove_html(raw):
|
30 |
if raw.startswith("<h3>"):
|
@@ -44,19 +77,19 @@ def to_openai_format(messages):
|
|
44 |
|
45 |
def replace_model_name(old_name, tstamp):
|
46 |
replace_dict = {
|
47 |
-
"
|
48 |
-
"
|
49 |
-
"
|
50 |
-
"
|
51 |
-
"
|
52 |
}
|
|
|
|
|
|
|
|
|
|
|
53 |
if old_name in replace_dict:
|
54 |
-
|
55 |
-
if "Flux" in old_name:
|
56 |
-
print(f"Invalid model names: {old_name}")
|
57 |
-
exit(1)
|
58 |
-
model_info = get_model_info(old_name)
|
59 |
-
old_name = model_info.simple_name
|
60 |
return old_name
|
61 |
|
62 |
|
@@ -72,27 +105,18 @@ def read_file(filename):
|
|
72 |
break
|
73 |
except FileNotFoundError:
|
74 |
time.sleep(2)
|
75 |
-
except json.JSONDecodeError:
|
76 |
-
print(f"Error in reading {filename}")
|
77 |
-
print(row)
|
78 |
-
exit(0)
|
79 |
return data
|
80 |
|
81 |
|
82 |
def read_file_parallel(log_files, num_threads=16):
|
83 |
data_all = []
|
84 |
-
|
85 |
-
|
86 |
-
|
87 |
-
|
88 |
-
|
89 |
-
|
90 |
-
|
91 |
-
with Pool(num_threads) as p:
|
92 |
-
ret_all = list(tqdm(p.imap(read_file, log_files), total=len(log_files)))
|
93 |
-
for ret in ret_all:
|
94 |
-
data_all.extend(ret)
|
95 |
-
return data_all
|
96 |
|
97 |
def load_image(image_path):
|
98 |
try:
|
@@ -103,7 +127,7 @@ def load_image(image_path):
|
|
103 |
def clean_battle_data(
|
104 |
log_files, exclude_model_names, ban_ip_list=None, sanitize_ip=False, mode="simple", task_name="image_editing"
|
105 |
):
|
106 |
-
data = read_file_parallel(log_files, num_threads=
|
107 |
|
108 |
convert_type = {
|
109 |
"leftvote": "model_a",
|
@@ -121,7 +145,6 @@ def clean_battle_data(
|
|
121 |
battles = []
|
122 |
for row in tqdm(data, desc="Cleaning"):
|
123 |
if row["models"][0] is None or row["models"][1] is None:
|
124 |
-
print(f"Invalid model names: {row['models']}")
|
125 |
continue
|
126 |
|
127 |
# Resolve model names
|
@@ -140,7 +163,6 @@ def clean_battle_data(
|
|
140 |
models_public[1] == "" and models_public[0] != ""
|
141 |
):
|
142 |
ct_invalid += 1
|
143 |
-
print(f"Invalid model names: {models_public}")
|
144 |
continue
|
145 |
|
146 |
if models_public[0] == "" or models_public[0] == "Model A":
|
@@ -151,82 +173,71 @@ def clean_battle_data(
|
|
151 |
anony = False
|
152 |
models = models_public
|
153 |
if not models_public == models_hidden:
|
154 |
-
print(f"Model names mismatch: {models_public} vs {models_hidden}")
|
155 |
ct_invalid += 1
|
156 |
continue
|
157 |
-
|
158 |
-
|
159 |
-
|
160 |
-
|
161 |
-
|
162 |
-
|
163 |
-
|
164 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
165 |
|
166 |
# Replace bard with palm
|
|
|
167 |
if task_name == "image_editing":
|
168 |
-
|
169 |
-
|
170 |
-
try:
|
171 |
-
platform, model_name, task = _model.split("_")
|
172 |
-
except ValueError:
|
173 |
-
valid = False
|
174 |
-
break
|
175 |
-
if not (platform in ["playground", "imagenhub"] and task == "edition"):
|
176 |
-
valid = False
|
177 |
-
break
|
178 |
-
if not valid:
|
179 |
ct_invalid += 1
|
180 |
continue
|
181 |
-
for
|
182 |
-
platform, model_name, task = _model.split("_")
|
183 |
-
models[i] = model_name
|
184 |
-
|
185 |
elif task_name == "t2i_generation":
|
186 |
-
|
187 |
-
|
188 |
-
try:
|
189 |
-
platform, model_name, task = _model.split("_")
|
190 |
-
except ValueError:
|
191 |
-
valid = False
|
192 |
-
break
|
193 |
-
if not (platform.lower() in ["playground", "imagenhub", 'fal'] and (task == "generation" or task == "text2image")):
|
194 |
-
valid = False
|
195 |
-
break
|
196 |
-
if not valid:
|
197 |
ct_invalid += 1
|
198 |
continue
|
199 |
-
for
|
200 |
-
|
201 |
-
|
202 |
-
|
203 |
-
elif task_name == "video_generation":
|
204 |
-
valid = True
|
205 |
-
for _model in models:
|
206 |
-
try:
|
207 |
-
platform, model_name, task = _model.split("_")
|
208 |
-
except ValueError:
|
209 |
-
valid = False
|
210 |
-
break
|
211 |
-
if not (platform in ["videogenhub", "fal"] and task == "generation" or task == "text2video"):
|
212 |
-
valid = False
|
213 |
-
break
|
214 |
-
if not valid:
|
215 |
-
ct_invalid += 1
|
216 |
-
continue
|
217 |
-
for i, _model in enumerate(models):
|
218 |
-
platform, model_name, task = _model.split("_")
|
219 |
-
models[i] = model_name
|
220 |
|
221 |
else:
|
222 |
raise ValueError(f"Invalid task_name: {task_name}")
|
223 |
|
224 |
-
models = [replace_model_name(m, row["tstamp"]) for m in models]
|
225 |
-
|
226 |
# Exclude certain models
|
227 |
if exclude_model_names and any(x in exclude_model_names for x in models):
|
228 |
ct_invalid += 1
|
229 |
continue
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
230 |
|
231 |
if mode == "conv_release":
|
232 |
# assert the two images are the same
|
@@ -251,6 +262,14 @@ def clean_battle_data(
|
|
251 |
continue
|
252 |
|
253 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
254 |
ip = row["ip"]
|
255 |
if ip not in all_ips:
|
256 |
all_ips[ip] = {"ip": ip, "count": 0, "sanitized_id": len(all_ips)}
|
@@ -262,45 +281,21 @@ def clean_battle_data(
|
|
262 |
|
263 |
if ban_ip_list is not None and ip in ban_ip_list:
|
264 |
ct_banned += 1
|
265 |
-
print(f"User {user_id} is banned")
|
266 |
continue
|
267 |
-
|
268 |
-
"image_editing": ["source_prompt", "target_prompt", "instruct_prompt"],
|
269 |
-
"t2i_generation": ["prompt"],
|
270 |
-
"video_generation": ["prompt"]
|
271 |
-
}
|
272 |
-
|
273 |
-
model_a_inputs = row["states"][0].copy()
|
274 |
-
# pop conv_id and model_name
|
275 |
-
model_a_inputs.pop("conv_id")
|
276 |
-
model_a_inputs.pop("model_name")
|
277 |
-
model_b_inputs = row["states"][1].copy()
|
278 |
-
model_b_inputs.pop("conv_id")
|
279 |
-
model_b_inputs.pop("model_name")
|
280 |
-
for key in model_a_inputs:
|
281 |
-
if not (key in model_b_inputs and model_a_inputs[key] == model_b_inputs[key]):
|
282 |
-
print(f"Inconsistent inputs: {model_a_inputs} vs {model_b_inputs}")
|
283 |
-
ct_invalid += 1
|
284 |
-
continue
|
285 |
-
if mode == "conv_release":
|
286 |
-
if any(key not in model_a_inputs for key in required_keys_each_task[task_name]):
|
287 |
-
print(f"Missing required keys: {model_a_inputs}, {required_keys_each_task[task_name]}")
|
288 |
-
ct_invalid += 1
|
289 |
-
continue
|
290 |
-
|
291 |
-
inputs = model_a_inputs
|
292 |
# Save the results
|
293 |
battles.append(
|
294 |
dict(
|
295 |
-
|
296 |
-
model_b_conv_id=row["states"][1]["conv_id"],
|
297 |
-
inputs=inputs,
|
298 |
model_a=models[0],
|
299 |
model_b=models[1],
|
300 |
-
vote_type=row["type"],
|
301 |
winner=convert_type[row["type"]],
|
302 |
judge=f"arena_user_{user_id}",
|
|
|
|
|
|
|
303 |
anony=anony,
|
|
|
304 |
tstamp=row["tstamp"],
|
305 |
)
|
306 |
)
|
@@ -337,7 +332,7 @@ if __name__ == "__main__":
|
|
337 |
parser.add_argument(
|
338 |
"--mode", type=str, choices=["simple", "conv_release"], default="simple"
|
339 |
)
|
340 |
-
parser.add_argument("--task_name", type=str, default="image_editing", choices=["image_editing", "t2i_generation"
|
341 |
parser.add_argument("--exclude-model-names", type=str, nargs="+")
|
342 |
parser.add_argument("--ban-ip-file", type=str)
|
343 |
parser.add_argument("--sanitize-ip", action="store_true", default=False)
|
@@ -355,19 +350,27 @@ if __name__ == "__main__":
|
|
355 |
).strftime("%Y%m%d")
|
356 |
|
357 |
if args.mode == "simple":
|
358 |
-
|
359 |
-
|
360 |
-
|
361 |
-
|
362 |
-
|
363 |
-
|
364 |
-
|
365 |
-
|
366 |
print("Samples:")
|
367 |
for i in range(min(4, len(battles))):
|
368 |
print(battles[i])
|
369 |
output = f"clean_battle_{args.task_name}_{cutoff_date}.json"
|
370 |
elif args.mode == "conv_release":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
371 |
output = f"clean_battle_{args.task_name}_conv_{cutoff_date}.json"
|
372 |
|
373 |
with open(output, "w") as fout:
|
|
|
18 |
from tqdm import tqdm
|
19 |
|
20 |
from .basic_stats import get_log_files, NUM_SERVERS, LOG_ROOT_DIR
|
21 |
+
from .utils import detect_language, get_time_stamp_from_date
|
22 |
|
23 |
VOTES = ["tievote", "leftvote", "rightvote", "bothbad_vote"]
|
24 |
+
IDENTITY_WORDS = [
|
25 |
+
"vicuna",
|
26 |
+
"lmsys",
|
27 |
+
"koala",
|
28 |
+
"uc berkeley",
|
29 |
+
"open assistant",
|
30 |
+
"laion",
|
31 |
+
"chatglm",
|
32 |
+
"chatgpt",
|
33 |
+
"gpt-4",
|
34 |
+
"openai",
|
35 |
+
"anthropic",
|
36 |
+
"claude",
|
37 |
+
"bard",
|
38 |
+
"palm",
|
39 |
+
"lamda",
|
40 |
+
"google",
|
41 |
+
"llama",
|
42 |
+
"qianwan",
|
43 |
+
"alibaba",
|
44 |
+
"mistral",
|
45 |
+
"zhipu",
|
46 |
+
"KEG lab",
|
47 |
+
"01.AI",
|
48 |
+
"AI2",
|
49 |
+
"Tülu",
|
50 |
+
"Tulu",
|
51 |
+
"NETWORK ERROR DUE TO HIGH TRAFFIC. PLEASE REGENERATE OR REFRESH THIS PAGE.",
|
52 |
+
"$MODERATION$ YOUR INPUT VIOLATES OUR CONTENT MODERATION GUIDELINES.",
|
53 |
+
"API REQUEST ERROR. Please increase the number of max tokens.",
|
54 |
+
"**API REQUEST ERROR** Reason: The response was blocked.",
|
55 |
+
"**API REQUEST ERROR**",
|
56 |
+
]
|
57 |
+
|
58 |
+
for i in range(len(IDENTITY_WORDS)):
|
59 |
+
IDENTITY_WORDS[i] = IDENTITY_WORDS[i].lower()
|
60 |
|
|
|
|
|
|
|
61 |
|
62 |
def remove_html(raw):
|
63 |
if raw.startswith("<h3>"):
|
|
|
77 |
|
78 |
def replace_model_name(old_name, tstamp):
|
79 |
replace_dict = {
|
80 |
+
"bard": "palm-2",
|
81 |
+
"claude-v1": "claude-1",
|
82 |
+
"claude-instant-v1": "claude-instant-1",
|
83 |
+
"oasst-sft-1-pythia-12b": "oasst-pythia-12b",
|
84 |
+
"claude-2": "claude-2.0",
|
85 |
}
|
86 |
+
if old_name in ["gpt-4", "gpt-3.5-turbo"]:
|
87 |
+
if tstamp > 1687849200:
|
88 |
+
return old_name + "-0613"
|
89 |
+
else:
|
90 |
+
return old_name + "-0314"
|
91 |
if old_name in replace_dict:
|
92 |
+
return replace_dict[old_name]
|
|
|
|
|
|
|
|
|
|
|
93 |
return old_name
|
94 |
|
95 |
|
|
|
105 |
break
|
106 |
except FileNotFoundError:
|
107 |
time.sleep(2)
|
|
|
|
|
|
|
|
|
108 |
return data
|
109 |
|
110 |
|
111 |
def read_file_parallel(log_files, num_threads=16):
|
112 |
data_all = []
|
113 |
+
from multiprocessing import Pool
|
114 |
+
|
115 |
+
with Pool(num_threads) as p:
|
116 |
+
ret_all = list(tqdm(p.imap(read_file, log_files), total=len(log_files)))
|
117 |
+
for ret in ret_all:
|
118 |
+
data_all.extend(ret)
|
119 |
+
return data_all
|
|
|
|
|
|
|
|
|
|
|
120 |
|
121 |
def load_image(image_path):
|
122 |
try:
|
|
|
127 |
def clean_battle_data(
|
128 |
log_files, exclude_model_names, ban_ip_list=None, sanitize_ip=False, mode="simple", task_name="image_editing"
|
129 |
):
|
130 |
+
data = read_file_parallel(log_files, num_threads=16)
|
131 |
|
132 |
convert_type = {
|
133 |
"leftvote": "model_a",
|
|
|
145 |
battles = []
|
146 |
for row in tqdm(data, desc="Cleaning"):
|
147 |
if row["models"][0] is None or row["models"][1] is None:
|
|
|
148 |
continue
|
149 |
|
150 |
# Resolve model names
|
|
|
163 |
models_public[1] == "" and models_public[0] != ""
|
164 |
):
|
165 |
ct_invalid += 1
|
|
|
166 |
continue
|
167 |
|
168 |
if models_public[0] == "" or models_public[0] == "Model A":
|
|
|
173 |
anony = False
|
174 |
models = models_public
|
175 |
if not models_public == models_hidden:
|
|
|
176 |
ct_invalid += 1
|
177 |
continue
|
178 |
+
|
179 |
+
# # Detect langauge
|
180 |
+
# state = row["states"][0]
|
181 |
+
# if state["offset"] >= len(state["messages"]):
|
182 |
+
# ct_invalid += 1
|
183 |
+
# continue
|
184 |
+
# lang_code = detect_language(state["messages"][state["offset"]][1])
|
185 |
+
|
186 |
+
# # Drop conversations if the model names are leaked
|
187 |
+
# leaked_identity = False
|
188 |
+
# messages = ""
|
189 |
+
# for i in range(2):
|
190 |
+
# state = row["states"][i]
|
191 |
+
# for turn_idx, (role, msg) in enumerate(
|
192 |
+
# state["messages"][state["offset"] :]
|
193 |
+
# ):
|
194 |
+
# if msg:
|
195 |
+
# messages += msg.lower()
|
196 |
+
# for word in IDENTITY_WORDS:
|
197 |
+
# if word in messages:
|
198 |
+
# leaked_identity = True
|
199 |
+
# break
|
200 |
+
|
201 |
+
# if leaked_identity:
|
202 |
+
# ct_leaked_identity += 1
|
203 |
+
# continue
|
204 |
|
205 |
# Replace bard with palm
|
206 |
+
models = [replace_model_name(m, row["tstamp"]) for m in models]
|
207 |
if task_name == "image_editing":
|
208 |
+
if not all(x.startswith("imagenhub_") and x.endswith("_edition") for x in models):
|
209 |
+
# print(f"Invalid model names: {models}")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
210 |
ct_invalid += 1
|
211 |
continue
|
212 |
+
models = [x[len("imagenhub_"):-len("_edition")] for x in models]
|
|
|
|
|
|
|
213 |
elif task_name == "t2i_generation":
|
214 |
+
if not all("playground" in x.lower() or (x.startswith("imagenhub_") and x.endswith("_generation")) for x in models):
|
215 |
+
# print(f"Invalid model names: {models}")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
216 |
ct_invalid += 1
|
217 |
continue
|
218 |
+
# models = [x[len("imagenhub_"):-len("_generation")] for x in models]
|
219 |
+
for i, model_name in enumerate(models):
|
220 |
+
if model_name.startswith("imagenhub_"):
|
221 |
+
models[i] = model_name[len("imagenhub_"):-len("_generation")]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
222 |
|
223 |
else:
|
224 |
raise ValueError(f"Invalid task_name: {task_name}")
|
225 |
|
|
|
|
|
226 |
# Exclude certain models
|
227 |
if exclude_model_names and any(x in exclude_model_names for x in models):
|
228 |
ct_invalid += 1
|
229 |
continue
|
230 |
+
|
231 |
+
# if models[0] not in model_infos or models[1] not in model_infos:
|
232 |
+
# continue
|
233 |
+
|
234 |
+
# # Exclude votes before the starting date
|
235 |
+
# if model_infos and (model_infos[models[0]]["starting_from"] > row["tstamp"] or model_infos[models[1]]["starting_from"] > row["tstamp"]):
|
236 |
+
# print(f"Invalid vote before the valid starting date for {models[0]} and {models[1]}")
|
237 |
+
# ct_invalid += 1
|
238 |
+
# continue
|
239 |
+
|
240 |
+
|
241 |
|
242 |
if mode == "conv_release":
|
243 |
# assert the two images are the same
|
|
|
262 |
continue
|
263 |
|
264 |
|
265 |
+
question_id = row["states"][0]["conv_id"]
|
266 |
+
# conversation_a = to_openai_format(
|
267 |
+
# row["states"][0]["messages"][row["states"][0]["offset"] :]
|
268 |
+
# )
|
269 |
+
# conversation_b = to_openai_format(
|
270 |
+
# row["states"][1]["messages"][row["states"][1]["offset"] :]
|
271 |
+
# )
|
272 |
+
|
273 |
ip = row["ip"]
|
274 |
if ip not in all_ips:
|
275 |
all_ips[ip] = {"ip": ip, "count": 0, "sanitized_id": len(all_ips)}
|
|
|
281 |
|
282 |
if ban_ip_list is not None and ip in ban_ip_list:
|
283 |
ct_banned += 1
|
|
|
284 |
continue
|
285 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
286 |
# Save the results
|
287 |
battles.append(
|
288 |
dict(
|
289 |
+
question_id=question_id,
|
|
|
|
|
290 |
model_a=models[0],
|
291 |
model_b=models[1],
|
|
|
292 |
winner=convert_type[row["type"]],
|
293 |
judge=f"arena_user_{user_id}",
|
294 |
+
# conversation_a=conversation_a,
|
295 |
+
# conversation_b=conversation_b,
|
296 |
+
# turn=len(conversation_a) // 2,
|
297 |
anony=anony,
|
298 |
+
# language=lang_code,
|
299 |
tstamp=row["tstamp"],
|
300 |
)
|
301 |
)
|
|
|
332 |
parser.add_argument(
|
333 |
"--mode", type=str, choices=["simple", "conv_release"], default="simple"
|
334 |
)
|
335 |
+
parser.add_argument("--task_name", type=str, default="image_editing", choices=["image_editing", "t2i_generation"])
|
336 |
parser.add_argument("--exclude-model-names", type=str, nargs="+")
|
337 |
parser.add_argument("--ban-ip-file", type=str)
|
338 |
parser.add_argument("--sanitize-ip", action="store_true", default=False)
|
|
|
350 |
).strftime("%Y%m%d")
|
351 |
|
352 |
if args.mode == "simple":
|
353 |
+
for x in battles:
|
354 |
+
for key in [
|
355 |
+
"conversation_a",
|
356 |
+
"conversation_b",
|
357 |
+
"question_id",
|
358 |
+
]:
|
359 |
+
if key in x:
|
360 |
+
del x[key]
|
361 |
print("Samples:")
|
362 |
for i in range(min(4, len(battles))):
|
363 |
print(battles[i])
|
364 |
output = f"clean_battle_{args.task_name}_{cutoff_date}.json"
|
365 |
elif args.mode == "conv_release":
|
366 |
+
# new_battles = []
|
367 |
+
# for x in battles:
|
368 |
+
# if not x["anony"]:
|
369 |
+
# continue
|
370 |
+
# for key in []:
|
371 |
+
# del x[key]
|
372 |
+
# new_battles.append(x)
|
373 |
+
# battles = new_battles
|
374 |
output = f"clean_battle_{args.task_name}_conv_{cutoff_date}.json"
|
375 |
|
376 |
with open(output, "w") as fout:
|
arena_elo/elo_rating/elo_analysis.py
CHANGED
@@ -11,9 +11,9 @@ import pandas as pd
|
|
11 |
import plotly.express as px
|
12 |
from tqdm import tqdm
|
13 |
|
|
|
14 |
from .basic_stats import get_log_files
|
15 |
from .clean_battle_data import clean_battle_data
|
16 |
-
from .utils import get_model_info
|
17 |
|
18 |
pd.options.display.float_format = "{:.2f}".format
|
19 |
|
@@ -214,9 +214,8 @@ def visualize_average_win_rate(battles, limit_show_number):
|
|
214 |
width=700,
|
215 |
)
|
216 |
fig.update_layout(
|
217 |
-
yaxis_title="Average Win Rate", xaxis_title="Model", showlegend=False
|
218 |
)
|
219 |
-
fig.update_traces(textfont_size=16)
|
220 |
return fig
|
221 |
|
222 |
|
@@ -247,7 +246,6 @@ def visualize_bootstrap_elo_rating(df, df_final, limit_show_number):
|
|
247 |
width=700,
|
248 |
)
|
249 |
fig.update_layout(xaxis_title="Model", yaxis_title="Rating")
|
250 |
-
fig.update_traces(textfont_size=16)
|
251 |
return fig
|
252 |
|
253 |
|
@@ -340,7 +338,6 @@ if __name__ == "__main__":
|
|
340 |
"--rating-system", type=str, choices=["bt", "elo"], default="bt"
|
341 |
)
|
342 |
parser.add_argument("--exclude-tie", action="store_true", default=False)
|
343 |
-
parser.add_argument("--min_num_battles_per_model", type=int, default=25)
|
344 |
args = parser.parse_args()
|
345 |
|
346 |
np.random.seed(42)
|
@@ -352,23 +349,7 @@ if __name__ == "__main__":
|
|
352 |
# Read data from all log files
|
353 |
log_files = get_log_files(args.max_num_files)
|
354 |
battles = clean_battle_data(log_files)
|
355 |
-
|
356 |
-
if args.min_num_battles_per_model:
|
357 |
-
num_battles_per_model = defaultdict(int)
|
358 |
-
# use pd
|
359 |
-
for _, battle in battles.iterrows():
|
360 |
-
num_battles_per_model[battle["model_a"]] += 1
|
361 |
-
num_battles_per_model[battle["model_b"]] += 1
|
362 |
-
to_remove_models = [
|
363 |
-
model for model, num_battles in num_battles_per_model.items() if num_battles < args.min_num_battles_per_model
|
364 |
-
]
|
365 |
-
battles_with_enough_battles = battles[
|
366 |
-
~battles["model_a"].isin(to_remove_models) & ~battles["model_b"].isin(to_remove_models)
|
367 |
-
]
|
368 |
-
print(f"Remove models with less than {args.min_num_battles_per_model} battles: {to_remove_models}")
|
369 |
-
print(f"Number of battles: {len(battles)} -> {len(battles_with_enough_battles)}")
|
370 |
-
battles = battles_with_enough_battles
|
371 |
-
|
372 |
anony_results = report_elo_analysis_results(
|
373 |
battles, rating_system=args.rating_system, num_bootstrap=args.num_bootstrap, anony_only=True
|
374 |
)
|
@@ -381,22 +362,9 @@ if __name__ == "__main__":
|
|
381 |
pretty_print_elo_rating(anony_results["elo_rating_online"])
|
382 |
print("# Median")
|
383 |
pretty_print_elo_rating(anony_results["elo_rating_final"])
|
384 |
-
print(f"
|
385 |
-
print(f"Full last update : {full_results['last_updated_datetime']}")
|
386 |
-
|
387 |
-
|
388 |
-
# # save heatmap results in the same directory of the cleaned battle file
|
389 |
-
win_fraction_heatmap_file = args.clean_battle_file.replace(".json", "_win_fraction_heatmap.jpg")
|
390 |
-
battle_count_heatmap_file = args.clean_battle_file.replace(".json", "_battle_count_heatmap.jpg")
|
391 |
-
average_win_rate_bar_file = args.clean_battle_file.replace(".json", "_average_win_rate_bar.jpg")
|
392 |
-
bootstrap_elo_rating_file = args.clean_battle_file.replace(".json", "_bootstrap_elo_rating.jpg")
|
393 |
-
anony_results["win_fraction_heatmap"].write_image(win_fraction_heatmap_file)
|
394 |
-
anony_results["battle_count_heatmap"].write_image(battle_count_heatmap_file)
|
395 |
-
anony_results["average_win_rate_bar"].write_image(average_win_rate_bar_file)
|
396 |
-
anony_results["bootstrap_elo_rating"].write_image(bootstrap_elo_rating_file)
|
397 |
-
|
398 |
|
399 |
-
last_updated_tstamp =
|
400 |
cutoff_date = datetime.datetime.fromtimestamp(
|
401 |
last_updated_tstamp, tz=timezone("US/Pacific")
|
402 |
).strftime("%Y%m%d")
|
@@ -408,6 +376,3 @@ if __name__ == "__main__":
|
|
408 |
}
|
409 |
with open(f"elo_results_{cutoff_date}.pkl", "wb") as fout:
|
410 |
pickle.dump(results, fout)
|
411 |
-
|
412 |
-
with open("cut_off_date.txt", "w") as fout:
|
413 |
-
fout.write(cutoff_date)
|
|
|
11 |
import plotly.express as px
|
12 |
from tqdm import tqdm
|
13 |
|
14 |
+
from .model_registry import get_model_info
|
15 |
from .basic_stats import get_log_files
|
16 |
from .clean_battle_data import clean_battle_data
|
|
|
17 |
|
18 |
pd.options.display.float_format = "{:.2f}".format
|
19 |
|
|
|
214 |
width=700,
|
215 |
)
|
216 |
fig.update_layout(
|
217 |
+
yaxis_title="Average Win Rate", xaxis_title="Model", showlegend=False
|
218 |
)
|
|
|
219 |
return fig
|
220 |
|
221 |
|
|
|
246 |
width=700,
|
247 |
)
|
248 |
fig.update_layout(xaxis_title="Model", yaxis_title="Rating")
|
|
|
249 |
return fig
|
250 |
|
251 |
|
|
|
338 |
"--rating-system", type=str, choices=["bt", "elo"], default="bt"
|
339 |
)
|
340 |
parser.add_argument("--exclude-tie", action="store_true", default=False)
|
|
|
341 |
args = parser.parse_args()
|
342 |
|
343 |
np.random.seed(42)
|
|
|
349 |
# Read data from all log files
|
350 |
log_files = get_log_files(args.max_num_files)
|
351 |
battles = clean_battle_data(log_files)
|
352 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
353 |
anony_results = report_elo_analysis_results(
|
354 |
battles, rating_system=args.rating_system, num_bootstrap=args.num_bootstrap, anony_only=True
|
355 |
)
|
|
|
362 |
pretty_print_elo_rating(anony_results["elo_rating_online"])
|
363 |
print("# Median")
|
364 |
pretty_print_elo_rating(anony_results["elo_rating_final"])
|
365 |
+
print(f"last update : {anony_results['last_updated_datetime']}")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
366 |
|
367 |
+
last_updated_tstamp = anony_results["last_updated_tstamp"]
|
368 |
cutoff_date = datetime.datetime.fromtimestamp(
|
369 |
last_updated_tstamp, tz=timezone("US/Pacific")
|
370 |
).strftime("%Y%m%d")
|
|
|
376 |
}
|
377 |
with open(f"elo_results_{cutoff_date}.pkl", "wb") as fout:
|
378 |
pickle.dump(results, fout)
|
|
|
|
|
|
arena_elo/elo_rating/generate_leaderboard.py
CHANGED
@@ -2,12 +2,15 @@ import fire
|
|
2 |
import json
|
3 |
import pandas as pd
|
4 |
import pickle
|
5 |
-
|
6 |
|
7 |
def main(
|
8 |
-
|
9 |
-
|
|
|
10 |
):
|
|
|
|
|
11 |
with open(elo_rating_pkl, "rb") as fin:
|
12 |
elo_rating_results = pickle.load(fin)
|
13 |
|
@@ -16,23 +19,19 @@ def main(
|
|
16 |
anony_leaderboard_data = anony_elo_rating_results["leaderboard_table_df"]
|
17 |
full_leaderboard_data = full_elo_rating_results["leaderboard_table_df"]
|
18 |
|
19 |
-
print(anony_leaderboard_data)
|
20 |
# Model,MT-bench (score),Arena Elo rating,MMLU,License,Link
|
21 |
fields = ["key", "Model", "Arena Elo rating (anony)", "Arena Elo rating (full)", "License", "Organization", "Link"]
|
22 |
# set Organization and license to empty for now
|
23 |
all_models = anony_leaderboard_data.index.tolist()
|
24 |
|
25 |
-
model_info = {}
|
26 |
for model in all_models:
|
27 |
-
|
28 |
-
|
29 |
-
|
30 |
-
"
|
31 |
-
"
|
32 |
-
|
33 |
-
|
34 |
-
"Link": registered_model_info.link
|
35 |
-
}
|
36 |
|
37 |
if model in anony_leaderboard_data.index:
|
38 |
model_info[model]["Arena Elo rating (anony)"] = anony_leaderboard_data.loc[model, "rating"]
|
@@ -43,6 +42,10 @@ def main(
|
|
43 |
model_info[model]["Arena Elo rating (full)"] = full_leaderboard_data.loc[model, "rating"]
|
44 |
else:
|
45 |
model_info[model]["Arena Elo rating (full)"] = 0
|
|
|
|
|
|
|
|
|
46 |
|
47 |
final_model_info = {}
|
48 |
for model in model_info:
|
|
|
2 |
import json
|
3 |
import pandas as pd
|
4 |
import pickle
|
5 |
+
|
6 |
|
7 |
def main(
|
8 |
+
model_info_file: str,
|
9 |
+
elo_rating_pkl: str,
|
10 |
+
output_csv: str
|
11 |
):
|
12 |
+
model_info = json.load(open(model_info_file))
|
13 |
+
|
14 |
with open(elo_rating_pkl, "rb") as fin:
|
15 |
elo_rating_results = pickle.load(fin)
|
16 |
|
|
|
19 |
anony_leaderboard_data = anony_elo_rating_results["leaderboard_table_df"]
|
20 |
full_leaderboard_data = full_elo_rating_results["leaderboard_table_df"]
|
21 |
|
|
|
22 |
# Model,MT-bench (score),Arena Elo rating,MMLU,License,Link
|
23 |
fields = ["key", "Model", "Arena Elo rating (anony)", "Arena Elo rating (full)", "License", "Organization", "Link"]
|
24 |
# set Organization and license to empty for now
|
25 |
all_models = anony_leaderboard_data.index.tolist()
|
26 |
|
|
|
27 |
for model in all_models:
|
28 |
+
if not model in model_info:
|
29 |
+
model_info[model] = {}
|
30 |
+
model_info[model]["License"] = "N/A"
|
31 |
+
model_info[model]["Organization"] = "N/A"
|
32 |
+
model_info[model]["Link"] = "N/A"
|
33 |
+
model_info[model]["Model"] = model
|
34 |
+
model_info[model]["key"] = model
|
|
|
|
|
35 |
|
36 |
if model in anony_leaderboard_data.index:
|
37 |
model_info[model]["Arena Elo rating (anony)"] = anony_leaderboard_data.loc[model, "rating"]
|
|
|
42 |
model_info[model]["Arena Elo rating (full)"] = full_leaderboard_data.loc[model, "rating"]
|
43 |
else:
|
44 |
model_info[model]["Arena Elo rating (full)"] = 0
|
45 |
+
# if model in anony_leaderboard_data.index:
|
46 |
+
# model_info[model]["Arena Elo rating"] = anony_leaderboard_data.loc[model, "rating"]
|
47 |
+
# else:
|
48 |
+
# model_info[model]["Arena Elo rating"] = 0
|
49 |
|
50 |
final_model_info = {}
|
51 |
for model in model_info:
|
arena_elo/elo_rating/model_registry.py
ADDED
@@ -0,0 +1,578 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
"""Additional information of the models."""
|
2 |
+
from collections import namedtuple, OrderedDict
|
3 |
+
from typing import List
|
4 |
+
|
5 |
+
|
6 |
+
ModelInfo = namedtuple("ModelInfo", ["simple_name", "link", "description"])
|
7 |
+
|
8 |
+
|
9 |
+
model_info = OrderedDict()
|
10 |
+
|
11 |
+
|
12 |
+
def register_model_info(
|
13 |
+
full_names: List[str], simple_name: str, link: str, description: str
|
14 |
+
):
|
15 |
+
info = ModelInfo(simple_name, link, description)
|
16 |
+
|
17 |
+
for full_name in full_names:
|
18 |
+
model_info[full_name] = info
|
19 |
+
|
20 |
+
|
21 |
+
def get_model_info(name: str) -> ModelInfo:
|
22 |
+
if name in model_info:
|
23 |
+
return model_info[name]
|
24 |
+
else:
|
25 |
+
# To fix this, please use `register_model_info` to register your model
|
26 |
+
return ModelInfo(
|
27 |
+
name, "", "Register the description at arena.model/model_registry.py"
|
28 |
+
)
|
29 |
+
|
30 |
+
|
31 |
+
register_model_info(
|
32 |
+
[
|
33 |
+
"IEITYuan/Yuan2-2B-Janus-hf",
|
34 |
+
"IEITYuan/Yuan2-2B-hf",
|
35 |
+
"IEITYuan/Yuan2-51B-hf",
|
36 |
+
"IEITYuan/Yuan2-102B-hf",
|
37 |
+
],
|
38 |
+
"IEIT-Yuan2",
|
39 |
+
"https://github.com/IEIT-Yuan/Yuan-2.0",
|
40 |
+
"Yuan2.0 is a new generation Fundamental Large Language Model developed by IEIT System.",
|
41 |
+
)
|
42 |
+
|
43 |
+
register_model_info(
|
44 |
+
["mixtral-8x7b-instruct-v0.1", "mistral-7b-instruct"],
|
45 |
+
"Mixtral of experts",
|
46 |
+
"https://mistral.ai/news/mixtral-of-experts/",
|
47 |
+
"A Mixture-of-Experts model by Mistral AI",
|
48 |
+
)
|
49 |
+
|
50 |
+
register_model_info(
|
51 |
+
["gemini-pro"],
|
52 |
+
"Gemini",
|
53 |
+
"https://blog.google/technology/ai/google-gemini-pro-imagen-duet-ai-update/",
|
54 |
+
"Gemini by Google",
|
55 |
+
)
|
56 |
+
|
57 |
+
register_model_info(
|
58 |
+
["gemini-pro-vision"],
|
59 |
+
"Gemini",
|
60 |
+
"https://blog.google/technology/ai/google-gemini-pro-imagen-duet-ai-update/",
|
61 |
+
"Gemini by Google",
|
62 |
+
)
|
63 |
+
|
64 |
+
register_model_info(
|
65 |
+
["solar-10.7b-instruct-v1.0"],
|
66 |
+
"SOLAR-10.7B-Instruct",
|
67 |
+
"https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0",
|
68 |
+
"A model trained using depth up-scaling by Upstage AI",
|
69 |
+
)
|
70 |
+
|
71 |
+
register_model_info(
|
72 |
+
["gpt-4-turbo"],
|
73 |
+
"GPT-4-Turbo",
|
74 |
+
"https://platform.openai.com/docs/models/gpt-4-and-gpt-4-turbo",
|
75 |
+
"GPT-4-Turbo by OpenAI",
|
76 |
+
)
|
77 |
+
|
78 |
+
register_model_info(
|
79 |
+
["gpt-4-vision-preview"],
|
80 |
+
"gpt-4-vision-preview",
|
81 |
+
"https://platform.openai.com/docs/models/gpt-4-and-gpt-4-turbo",
|
82 |
+
"GPT-4(V) by OpenAI",
|
83 |
+
)
|
84 |
+
|
85 |
+
register_model_info(
|
86 |
+
["gpt-3.5-turbo", "gpt-3.5-turbo-0314", "gpt-3.5-turbo-0613", "gpt-3.5-turbo-1106"],
|
87 |
+
"GPT-3.5",
|
88 |
+
"https://platform.openai.com/docs/models/gpt-3-5",
|
89 |
+
"GPT-3.5-Turbo by OpenAI",
|
90 |
+
)
|
91 |
+
|
92 |
+
register_model_info(
|
93 |
+
["gpt-4", "gpt-4-0314", "gpt-4-0613"],
|
94 |
+
"GPT-4",
|
95 |
+
"https://openai.com/research/gpt-4",
|
96 |
+
"GPT-4 by OpenAI",
|
97 |
+
)
|
98 |
+
|
99 |
+
register_model_info(
|
100 |
+
["claude-2.1", "claude-2.0"],
|
101 |
+
"Claude",
|
102 |
+
"https://www.anthropic.com/index/claude-2",
|
103 |
+
"Claude 2 by Anthropic",
|
104 |
+
)
|
105 |
+
|
106 |
+
register_model_info(
|
107 |
+
["claude-1"],
|
108 |
+
"Claude",
|
109 |
+
"https://www.anthropic.com/index/introducing-claude",
|
110 |
+
"Claude 1 by Anthropic",
|
111 |
+
)
|
112 |
+
|
113 |
+
register_model_info(
|
114 |
+
["claude-instant-1", "claude-instant-1.2"],
|
115 |
+
"Claude Instant",
|
116 |
+
"https://www.anthropic.com/index/introducing-claude",
|
117 |
+
"Claude Instant by Anthropic",
|
118 |
+
)
|
119 |
+
|
120 |
+
register_model_info(
|
121 |
+
["pplx-70b-online", "pplx-7b-online"],
|
122 |
+
"pplx-online-llms",
|
123 |
+
"https://blog.perplexity.ai/blog/introducing-pplx-online-llms",
|
124 |
+
"Online LLM API by Perplexity AI",
|
125 |
+
)
|
126 |
+
|
127 |
+
register_model_info(
|
128 |
+
["openhermes-2.5-mistral-7b"],
|
129 |
+
"OpenHermes-2.5-Mistral-7B",
|
130 |
+
"https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B",
|
131 |
+
"a mistral-based model fine-tuned on 1M GPT-4 outputs",
|
132 |
+
)
|
133 |
+
|
134 |
+
register_model_info(
|
135 |
+
["starling-lm-7b-alpha"],
|
136 |
+
"Starling-LM-7B-alpha",
|
137 |
+
"https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha",
|
138 |
+
"an open model trained using RLAIF by Berkeley",
|
139 |
+
)
|
140 |
+
|
141 |
+
register_model_info(
|
142 |
+
["tulu-2-dpo-70b"],
|
143 |
+
"Tulu 2",
|
144 |
+
"https://huggingface.co/allenai/tulu-2-dpo-70b",
|
145 |
+
"an instruction and RLHF model by UW/AllenAI",
|
146 |
+
)
|
147 |
+
|
148 |
+
register_model_info(
|
149 |
+
["yi-34b-chat", "yi-6b-chat"],
|
150 |
+
"Yi-Chat",
|
151 |
+
"https://huggingface.co/01-ai/Yi-34B-Chat",
|
152 |
+
"A large language model by 01 AI",
|
153 |
+
)
|
154 |
+
|
155 |
+
register_model_info(
|
156 |
+
["llama-2-70b-chat", "llama-2-34b-chat", "llama-2-13b-chat", "llama-2-7b-chat"],
|
157 |
+
"Llama 2",
|
158 |
+
"https://ai.meta.com/llama/",
|
159 |
+
"open foundation and fine-tuned chat models by Meta",
|
160 |
+
)
|
161 |
+
|
162 |
+
register_model_info(
|
163 |
+
[
|
164 |
+
"vicuna-33b",
|
165 |
+
"vicuna-33b-v1.3",
|
166 |
+
"vicuna-13b",
|
167 |
+
"vicuna-13b-v1.3",
|
168 |
+
"vicuna-7b",
|
169 |
+
"vicuna-7b-v1.3",
|
170 |
+
],
|
171 |
+
"Vicuna",
|
172 |
+
"https://lmsys.org/blog/2023-03-30-vicuna/",
|
173 |
+
"a chat assistant fine-tuned on user-shared conversations by LMSYS",
|
174 |
+
)
|
175 |
+
|
176 |
+
register_model_info(
|
177 |
+
["chatglm3-6b", "chatglm2-6b", "chatglm-6b"],
|
178 |
+
"ChatGLM",
|
179 |
+
"https://chatglm.cn/blog",
|
180 |
+
"an open bilingual dialogue language model by Tsinghua University",
|
181 |
+
)
|
182 |
+
|
183 |
+
register_model_info(
|
184 |
+
["openchat-3.5"],
|
185 |
+
"OpenChat 3.5",
|
186 |
+
"https://github.com/imoneoi/openchat",
|
187 |
+
"an open model fine-tuned on Mistral-7B using C-RLFT",
|
188 |
+
)
|
189 |
+
|
190 |
+
register_model_info(
|
191 |
+
["tenyxchat-7b-v1"],
|
192 |
+
"TenyxChat-7B",
|
193 |
+
"https://huggingface.co/tenyx/TenyxChat-7B-v1",
|
194 |
+
"an open model DPO trained on top of OpenChat-3.5 using Tenyx fine-tuning",
|
195 |
+
)
|
196 |
+
|
197 |
+
register_model_info(
|
198 |
+
["zephyr-7b-beta", "zephyr-7b-alpha"],
|
199 |
+
"Zephyr",
|
200 |
+
"https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha",
|
201 |
+
"a chatbot fine-tuned from Mistral by Hugging Face",
|
202 |
+
)
|
203 |
+
|
204 |
+
register_model_info(
|
205 |
+
["notus-7b-v1"],
|
206 |
+
"Notus",
|
207 |
+
"https://huggingface.co/argilla/notus-7b-v1",
|
208 |
+
"a chatbot fine-tuned from Zephyr SFT by Argilla",
|
209 |
+
)
|
210 |
+
|
211 |
+
register_model_info(
|
212 |
+
["catppt"],
|
213 |
+
"CatPPT",
|
214 |
+
"https://huggingface.co/rishiraj/CatPPT",
|
215 |
+
"a chatbot fine-tuned from a SLERP merged model by Rishiraj Acharya",
|
216 |
+
)
|
217 |
+
|
218 |
+
register_model_info(
|
219 |
+
["TinyLlama"],
|
220 |
+
"TinyLlama",
|
221 |
+
"https://huggingface.co/TinyLlama/TinyLlama-1.1B-Chat-v1.0",
|
222 |
+
"The TinyLlama project is an open endeavor to pretrain a 1.1B Llama model on 3 trillion tokens.",
|
223 |
+
)
|
224 |
+
|
225 |
+
register_model_info(
|
226 |
+
["qwen-14b-chat"],
|
227 |
+
"Qwen",
|
228 |
+
"https://huggingface.co/Qwen/Qwen-14B-Chat",
|
229 |
+
"a large language model by Alibaba Cloud",
|
230 |
+
)
|
231 |
+
|
232 |
+
register_model_info(
|
233 |
+
["codellama-34b-instruct", "codellama-13b-instruct", "codellama-7b-instruct"],
|
234 |
+
"Code Llama",
|
235 |
+
"https://ai.meta.com/blog/code-llama-large-language-model-coding/",
|
236 |
+
"open foundation models for code by Meta",
|
237 |
+
)
|
238 |
+
|
239 |
+
register_model_info(
|
240 |
+
["wizardlm-70b", "wizardlm-30b", "wizardlm-13b"],
|
241 |
+
"WizardLM",
|
242 |
+
"https://github.com/nlpxucan/WizardLM",
|
243 |
+
"an instruction-following LLM using evol-instruct by Microsoft",
|
244 |
+
)
|
245 |
+
|
246 |
+
register_model_info(
|
247 |
+
["wizardcoder-15b-v1.0"],
|
248 |
+
"WizardLM",
|
249 |
+
"https://github.com/nlpxucan/WizardLM/tree/main/WizardCoder",
|
250 |
+
"Empowering Code Large Language Models with Evol-Instruct",
|
251 |
+
)
|
252 |
+
|
253 |
+
register_model_info(
|
254 |
+
["mpt-7b-chat", "mpt-30b-chat"],
|
255 |
+
"MPT-Chat",
|
256 |
+
"https://www.mosaicml.com/blog/mpt-30b",
|
257 |
+
"a chatbot fine-tuned from MPT by MosaicML",
|
258 |
+
)
|
259 |
+
|
260 |
+
register_model_info(
|
261 |
+
["guanaco-33b", "guanaco-65b"],
|
262 |
+
"Guanaco",
|
263 |
+
"https://github.com/artidoro/qlora",
|
264 |
+
"a model fine-tuned with QLoRA by UW",
|
265 |
+
)
|
266 |
+
|
267 |
+
register_model_info(
|
268 |
+
["gpt4all-13b-snoozy"],
|
269 |
+
"GPT4All-Snoozy",
|
270 |
+
"https://github.com/nomic-ai/gpt4all",
|
271 |
+
"a finetuned LLaMA model on assistant style data by Nomic AI",
|
272 |
+
)
|
273 |
+
|
274 |
+
register_model_info(
|
275 |
+
["koala-13b"],
|
276 |
+
"Koala",
|
277 |
+
"https://bair.berkeley.edu/blog/2023/04/03/koala",
|
278 |
+
"a dialogue model for academic research by BAIR",
|
279 |
+
)
|
280 |
+
|
281 |
+
register_model_info(
|
282 |
+
["RWKV-4-Raven-14B"],
|
283 |
+
"RWKV-4-Raven",
|
284 |
+
"https://huggingface.co/BlinkDL/rwkv-4-raven",
|
285 |
+
"an RNN with transformer-level LLM performance",
|
286 |
+
)
|
287 |
+
|
288 |
+
register_model_info(
|
289 |
+
["alpaca-13b"],
|
290 |
+
"Alpaca",
|
291 |
+
"https://crfm.stanford.edu/2023/03/13/alpaca.html",
|
292 |
+
"a model fine-tuned from LLaMA on instruction-following demonstrations by Stanford",
|
293 |
+
)
|
294 |
+
|
295 |
+
register_model_info(
|
296 |
+
["oasst-pythia-12b"],
|
297 |
+
"OpenAssistant (oasst)",
|
298 |
+
"https://open-assistant.io",
|
299 |
+
"an Open Assistant for everyone by LAION",
|
300 |
+
)
|
301 |
+
|
302 |
+
register_model_info(
|
303 |
+
["oasst-sft-7-llama-30b"],
|
304 |
+
"OpenAssistant (oasst)",
|
305 |
+
"https://open-assistant.io",
|
306 |
+
"an Open Assistant for everyone by LAION",
|
307 |
+
)
|
308 |
+
|
309 |
+
register_model_info(
|
310 |
+
["palm-2"],
|
311 |
+
"PaLM 2 Chat",
|
312 |
+
"https://cloud.google.com/vertex-ai/docs/release-notes#May_10_2023",
|
313 |
+
"PaLM 2 for Chat (chat-bison@001) by Google",
|
314 |
+
)
|
315 |
+
|
316 |
+
register_model_info(
|
317 |
+
["llama-7b", "llama-13b"],
|
318 |
+
"LLaMA",
|
319 |
+
"https://arxiv.org/abs/2302.13971",
|
320 |
+
"open and efficient foundation language models by Meta",
|
321 |
+
)
|
322 |
+
|
323 |
+
register_model_info(
|
324 |
+
["open-llama-7b-v2-open-instruct", "open-llama-7b-open-instruct"],
|
325 |
+
"Open LLaMa (Open Instruct)",
|
326 |
+
"https://medium.com/vmware-data-ml-blog/starter-llm-for-the-enterprise-instruction-tuning-openllama-7b-d05fc3bbaccc",
|
327 |
+
"Open LLaMa fine-tuned on instruction-following data by VMware",
|
328 |
+
)
|
329 |
+
|
330 |
+
register_model_info(
|
331 |
+
["dolly-v2-12b"],
|
332 |
+
"Dolly",
|
333 |
+
"https://www.databricks.com/blog/2023/04/12/dolly-first-open-commercially-viable-instruction-tuned-llm",
|
334 |
+
"an instruction-tuned open large language model by Databricks",
|
335 |
+
)
|
336 |
+
|
337 |
+
register_model_info(
|
338 |
+
["stablelm-tuned-alpha-7b"],
|
339 |
+
"StableLM",
|
340 |
+
"https://github.com/stability-AI/stableLM",
|
341 |
+
"Stability AI language models",
|
342 |
+
)
|
343 |
+
|
344 |
+
register_model_info(
|
345 |
+
["codet5p-6b"],
|
346 |
+
"CodeT5p-6b",
|
347 |
+
"https://huggingface.co/Salesforce/codet5p-6b",
|
348 |
+
"Code completion model released by Salesforce",
|
349 |
+
)
|
350 |
+
|
351 |
+
register_model_info(
|
352 |
+
["fastchat-t5-3b", "fastchat-t5-3b-v1.0"],
|
353 |
+
"FastChat-T5",
|
354 |
+
"https://huggingface.co/lmsys/fastchat-t5-3b-v1.0",
|
355 |
+
"a chat assistant fine-tuned from FLAN-T5 by LMSYS",
|
356 |
+
)
|
357 |
+
|
358 |
+
register_model_info(
|
359 |
+
["phoenix-inst-chat-7b"],
|
360 |
+
"Phoenix-7B",
|
361 |
+
"https://huggingface.co/FreedomIntelligence/phoenix-inst-chat-7b",
|
362 |
+
"a multilingual chat assistant fine-tuned from Bloomz to democratize ChatGPT across languages by CUHK(SZ)",
|
363 |
+
)
|
364 |
+
|
365 |
+
register_model_info(
|
366 |
+
["realm-7b-v1"],
|
367 |
+
"ReaLM",
|
368 |
+
"https://github.com/FreedomIntelligence/ReaLM",
|
369 |
+
"A chatbot fine-tuned from LLaMA2 with data generated via iterative calls to UserGPT and ChatGPT by CUHK(SZ) and SRIBD.",
|
370 |
+
)
|
371 |
+
|
372 |
+
register_model_info(
|
373 |
+
["billa-7b-sft"],
|
374 |
+
"BiLLa-7B-SFT",
|
375 |
+
"https://huggingface.co/Neutralzz/BiLLa-7B-SFT",
|
376 |
+
"an instruction-tuned bilingual LLaMA with enhanced reasoning ability by an independent researcher",
|
377 |
+
)
|
378 |
+
|
379 |
+
register_model_info(
|
380 |
+
["h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2"],
|
381 |
+
"h2oGPT-GM-7b",
|
382 |
+
"https://huggingface.co/h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2",
|
383 |
+
"an instruction-tuned OpenLLaMA with enhanced conversational ability by H2O.ai",
|
384 |
+
)
|
385 |
+
|
386 |
+
register_model_info(
|
387 |
+
["baize-v2-7b", "baize-v2-13b"],
|
388 |
+
"Baize v2",
|
389 |
+
"https://github.com/project-baize/baize-chatbot#v2",
|
390 |
+
"A chatbot fine-tuned from LLaMA with ChatGPT self-chat data and Self-Disillation with Feedback (SDF) by UCSD and SYSU.",
|
391 |
+
)
|
392 |
+
|
393 |
+
register_model_info(
|
394 |
+
[
|
395 |
+
"airoboros-l2-7b-2.1",
|
396 |
+
"airoboros-l2-13b-2.1",
|
397 |
+
"airoboros-c34b-2.1",
|
398 |
+
"airoboros-l2-70b-2.1",
|
399 |
+
],
|
400 |
+
"airoboros",
|
401 |
+
"https://huggingface.co/jondurbin/airoboros-l2-70b-2.1",
|
402 |
+
"an instruction-tuned LlaMa model tuned with 100% synthetic instruction-response pairs from GPT4",
|
403 |
+
)
|
404 |
+
|
405 |
+
register_model_info(
|
406 |
+
[
|
407 |
+
"spicyboros-7b-2.2",
|
408 |
+
"spicyboros-13b-2.2",
|
409 |
+
"spicyboros-70b-2.2",
|
410 |
+
],
|
411 |
+
"spicyboros",
|
412 |
+
"https://huggingface.co/jondurbin/spicyboros-70b-2.2",
|
413 |
+
"de-aligned versions of the airoboros models",
|
414 |
+
)
|
415 |
+
|
416 |
+
register_model_info(
|
417 |
+
["Robin-7b-v2", "Robin-13b-v2", "Robin-33b-v2"],
|
418 |
+
"Robin-v2",
|
419 |
+
"https://huggingface.co/OptimalScale/robin-7b-v2-delta",
|
420 |
+
"A chatbot fine-tuned from LLaMA-7b, achieving competitive performance on chitchat, commonsense reasoning and instruction-following tasks, by OptimalScale, HKUST.",
|
421 |
+
)
|
422 |
+
|
423 |
+
register_model_info(
|
424 |
+
["manticore-13b-chat"],
|
425 |
+
"Manticore 13B Chat",
|
426 |
+
"https://huggingface.co/openaccess-ai-collective/manticore-13b-chat-pyg",
|
427 |
+
"A chatbot fine-tuned from LlaMa across several CoT and chat datasets.",
|
428 |
+
)
|
429 |
+
|
430 |
+
register_model_info(
|
431 |
+
["redpajama-incite-7b-chat"],
|
432 |
+
"RedPajama-INCITE-7B-Chat",
|
433 |
+
"https://huggingface.co/togethercomputer/RedPajama-INCITE-7B-Chat",
|
434 |
+
"A chatbot fine-tuned from RedPajama-INCITE-7B-Base by Together",
|
435 |
+
)
|
436 |
+
|
437 |
+
register_model_info(
|
438 |
+
[
|
439 |
+
"falcon-7b",
|
440 |
+
"falcon-7b-instruct",
|
441 |
+
"falcon-40b",
|
442 |
+
"falcon-40b-instruct",
|
443 |
+
"falcon-180b",
|
444 |
+
"falcon-180b-chat",
|
445 |
+
],
|
446 |
+
"Falcon",
|
447 |
+
"https://huggingface.co/tiiuae/falcon-180B",
|
448 |
+
"TII's flagship series of large language models",
|
449 |
+
)
|
450 |
+
|
451 |
+
register_model_info(
|
452 |
+
["tigerbot-7b-sft"],
|
453 |
+
"Tigerbot",
|
454 |
+
"https://huggingface.co/TigerResearch/tigerbot-7b-sft",
|
455 |
+
"TigerBot is a large-scale language model (LLM) with multiple languages and tasks.",
|
456 |
+
)
|
457 |
+
|
458 |
+
register_model_info(
|
459 |
+
["internlm-chat-7b", "internlm-chat-7b-8k"],
|
460 |
+
"InternLM",
|
461 |
+
"https://huggingface.co/internlm/internlm-chat-7b",
|
462 |
+
"InternLM is a multi-language large-scale language model (LLM), developed by SHLAB.",
|
463 |
+
)
|
464 |
+
|
465 |
+
register_model_info(
|
466 |
+
["Qwen-7B-Chat"],
|
467 |
+
"Qwen",
|
468 |
+
"https://huggingface.co/Qwen/Qwen-7B-Chat",
|
469 |
+
"Qwen is a multi-language large-scale language model (LLM), developed by Damo Academy.",
|
470 |
+
)
|
471 |
+
|
472 |
+
register_model_info(
|
473 |
+
["Llama2-Chinese-13b-Chat", "LLama2-Chinese-13B"],
|
474 |
+
"Llama2-Chinese",
|
475 |
+
"https://huggingface.co/FlagAlpha/Llama2-Chinese-13b-Chat",
|
476 |
+
"Llama2-Chinese is a multi-language large-scale language model (LLM), developed by FlagAlpha.",
|
477 |
+
)
|
478 |
+
|
479 |
+
register_model_info(
|
480 |
+
["Chinese-Alpaca-2-7B", "Chinese-Alpaca-2-13B"],
|
481 |
+
"Chinese-Alpaca",
|
482 |
+
"https://huggingface.co/hfl/chinese-alpaca-2-13b",
|
483 |
+
"New extended Chinese vocabulary beyond Llama-2, open-sourcing the Chinese LLaMA-2 and Alpaca-2 LLMs.",
|
484 |
+
)
|
485 |
+
|
486 |
+
register_model_info(
|
487 |
+
["Vigogne-2-7B-Instruct", "Vigogne-2-13B-Instruct"],
|
488 |
+
"Vigogne-Instruct",
|
489 |
+
"https://huggingface.co/bofenghuang/vigogne-2-7b-instruct",
|
490 |
+
"Vigogne-Instruct is a French large language model (LLM) optimized for instruction-following, developed by Bofeng Huang",
|
491 |
+
)
|
492 |
+
|
493 |
+
register_model_info(
|
494 |
+
["Vigogne-2-7B-Chat", "Vigogne-2-13B-Chat"],
|
495 |
+
"Vigogne-Chat",
|
496 |
+
"https://huggingface.co/bofenghuang/vigogne-2-7b-chat",
|
497 |
+
"Vigogne-Chat is a French large language model (LLM) optimized for instruction-following and multi-turn dialogues, developed by Bofeng Huang",
|
498 |
+
)
|
499 |
+
|
500 |
+
register_model_info(
|
501 |
+
["stable-vicuna-13B-HF"],
|
502 |
+
"stable-vicuna",
|
503 |
+
"https://huggingface.co/TheBloke/stable-vicuna-13B-HF",
|
504 |
+
"StableVicuna is a Vicuna model fine-tuned using RLHF via PPO on various conversational and instructional datasets.",
|
505 |
+
)
|
506 |
+
|
507 |
+
register_model_info(
|
508 |
+
["deluxe-chat-v1", "deluxe-chat-v1.1", "deluxe-chat-v1.2"],
|
509 |
+
"DeluxeChat",
|
510 |
+
"",
|
511 |
+
"Deluxe Chat",
|
512 |
+
)
|
513 |
+
|
514 |
+
register_model_info(
|
515 |
+
[
|
516 |
+
"Xwin-LM-7B-V0.1",
|
517 |
+
"Xwin-LM-13B-V0.1",
|
518 |
+
"Xwin-LM-70B-V0.1",
|
519 |
+
"Xwin-LM-7B-V0.2",
|
520 |
+
"Xwin-LM-13B-V0.2",
|
521 |
+
],
|
522 |
+
"Xwin-LM",
|
523 |
+
"https://github.com/Xwin-LM/Xwin-LM",
|
524 |
+
"Chat models developed by Xwin-LM team",
|
525 |
+
)
|
526 |
+
|
527 |
+
register_model_info(
|
528 |
+
["lemur-70b-chat"],
|
529 |
+
"Lemur-Chat",
|
530 |
+
"https://huggingface.co/OpenLemur/lemur-70b-chat-v1",
|
531 |
+
"an openly accessible language model optimized for both natural language and coding capabilities ",
|
532 |
+
)
|
533 |
+
|
534 |
+
register_model_info(
|
535 |
+
["Mistral-7B-OpenOrca"],
|
536 |
+
"Open-Orca",
|
537 |
+
"https://huggingface.co/Open-Orca/Mistral-7B-OpenOrca",
|
538 |
+
"A fine-tune of [Mistral 7B](https://huggingface.co/mistralai/Mistral-7B-v0.1) using [OpenOrca dataset](https://huggingface.co/datasets/Open-Orca/OpenOrca)",
|
539 |
+
)
|
540 |
+
|
541 |
+
register_model_info(
|
542 |
+
["dolphin-2.2.1-mistral-7b"],
|
543 |
+
"dolphin-mistral",
|
544 |
+
"https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b",
|
545 |
+
"An uncensored fine-tuned Mistral 7B",
|
546 |
+
)
|
547 |
+
|
548 |
+
register_model_info(
|
549 |
+
[
|
550 |
+
"AquilaChat-7B",
|
551 |
+
"AquilaChat2-7B",
|
552 |
+
"AquilaChat2-34B",
|
553 |
+
],
|
554 |
+
"Aquila-Chat",
|
555 |
+
"https://huggingface.co/BAAI/AquilaChat2-34B",
|
556 |
+
"Chat models developed by BAAI team",
|
557 |
+
)
|
558 |
+
|
559 |
+
register_model_info(
|
560 |
+
["xDAN-L1-Chat-RL-v1"],
|
561 |
+
"xDAN-L1-Chat",
|
562 |
+
"https://huggingface.co/xDAN-AI/xDAN-L1-Chat-RL-v1",
|
563 |
+
"A large language chat model created by xDAN-AI.",
|
564 |
+
)
|
565 |
+
|
566 |
+
register_model_info(
|
567 |
+
["MetaMath-70B-V1.0", "MetaMath-7B-V1.0"],
|
568 |
+
"MetaMath",
|
569 |
+
"https://huggingface.co/meta-math",
|
570 |
+
"MetaMath is a finetune of Llama2 on [MetaMathQA](https://huggingface.co/datasets/meta-math/MetaMathQA) that specializes in mathematical reasoning.",
|
571 |
+
)
|
572 |
+
|
573 |
+
register_model_info(
|
574 |
+
["Yuan2-2B-hf", "Yuan2-51B-hf", "Yuan2-102B-hf"],
|
575 |
+
"IEIYuan",
|
576 |
+
"https://huggingface.co/IEITYuan",
|
577 |
+
"Yuan2 is a Basemodel developed by IEI.",
|
578 |
+
)
|
arena_elo/elo_rating/upload_battle_data.py
CHANGED
@@ -2,36 +2,60 @@ import fire
|
|
2 |
import json
|
3 |
import os
|
4 |
import datasets
|
5 |
-
import random
|
6 |
import datetime
|
7 |
from pathlib import Path
|
8 |
from datetime import datetime
|
9 |
from PIL import Image
|
10 |
|
11 |
datasets.config.DEFAULT_MAX_BATCH_SIZE = 500
|
12 |
-
|
13 |
-
|
14 |
-
|
15 |
-
features
|
16 |
{
|
17 |
-
"
|
18 |
-
"
|
19 |
-
"
|
20 |
-
|
21 |
-
|
22 |
-
|
23 |
-
|
24 |
-
|
25 |
-
"
|
26 |
-
"
|
27 |
-
"
|
28 |
}
|
29 |
-
)
|
30 |
-
|
31 |
-
|
|
|
|
|
|
|
32 |
hf_dataset = datasets.Dataset.from_list(
|
33 |
data_file,
|
34 |
-
features=
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
35 |
split=split,
|
36 |
)
|
37 |
return hf_dataset
|
@@ -57,105 +81,106 @@ def get_date_from_time_stamp(unix_timestamp: int):
|
|
57 |
def load_battle_image(battle, log_dir):
|
58 |
image_path = Path(log_dir) / f"{get_date_from_time_stamp(battle['tstamp'])}-convinput_images" / f"input_image_{battle['question_id']}.png"
|
59 |
return load_image(image_path)
|
60 |
-
|
61 |
-
def find_media_path(conv_id, task_type, log_dir):
|
62 |
-
media_directory_map = {
|
63 |
-
"t2i_generation": "images/generation",
|
64 |
-
"image_edition": "images/edition",
|
65 |
-
"text2video": "videos/generation"
|
66 |
-
}
|
67 |
-
if task_type == "t2i_generation":
|
68 |
-
media_path = Path(log_dir) / media_directory_map[task_type] / f"{conv_id}.jpg"
|
69 |
-
else:
|
70 |
-
raise ValueError(f"Task type {task_type} not supported")
|
71 |
-
return media_path
|
72 |
|
73 |
|
74 |
def main(
|
75 |
-
|
76 |
-
|
77 |
-
|
78 |
-
|
79 |
-
|
80 |
-
config_name='battle',
|
81 |
-
split='test',
|
82 |
-
token = os.environ.get("HUGGINGFACE_TOKEN", None),
|
83 |
-
seed=42,
|
84 |
):
|
85 |
-
if data_file is None:
|
86 |
-
data_file = f"./results/latest/clean_battle_{task_type}.json"
|
87 |
-
if not os.path.exists(data_file):
|
88 |
-
raise ValueError(f"Data file {data_file} does not exist")
|
89 |
with open(data_file, "r") as f:
|
90 |
data = json.load(f)
|
91 |
|
92 |
-
# add index according to the tsamp
|
93 |
-
if seed is not None:
|
94 |
-
random.seed(seed)
|
95 |
|
96 |
|
97 |
-
|
98 |
-
|
99 |
-
"
|
100 |
-
"t2i_generation": ["prompt"],
|
101 |
-
"video_generation": ["prompt"]
|
102 |
}
|
103 |
-
|
104 |
-
|
105 |
-
|
106 |
-
|
107 |
-
|
108 |
-
|
109 |
-
|
110 |
-
|
111 |
-
|
112 |
-
|
113 |
-
|
114 |
-
|
115 |
-
|
116 |
-
|
117 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
118 |
|
119 |
-
|
120 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
121 |
for battle in data:
|
122 |
-
|
123 |
-
|
124 |
-
|
125 |
-
model_a_conv_id = battle['model_a_conv_id']
|
126 |
-
model_b_conv_id = battle['model_b_conv_id']
|
127 |
-
tstamp = battle['tstamp']
|
128 |
-
vote_type = battle['vote_type']
|
129 |
-
left_image_path = find_media_path(model_a_conv_id, task_type, log_dir)
|
130 |
-
right_image_path = find_media_path(model_b_conv_id, task_type, log_dir)
|
131 |
-
left_image = load_image(left_image_path)
|
132 |
-
right_image = load_image(right_image_path)
|
133 |
-
if left_image is None or right_image is None:
|
134 |
-
print(f"Skipping battle {battle['index']} due to missing images")
|
135 |
continue
|
|
|
136 |
new_data.append({
|
137 |
-
"
|
138 |
-
"
|
139 |
-
"
|
140 |
-
"
|
141 |
-
"
|
142 |
-
"
|
143 |
-
"
|
144 |
-
"
|
145 |
-
"
|
146 |
-
"anony": battle['anony'],
|
147 |
-
"judge": battle['judge'],
|
148 |
})
|
149 |
split = "test"
|
150 |
-
hf_dataset = create_hf_battle_dataset(new_data,
|
151 |
else:
|
152 |
-
raise ValueError(f"
|
153 |
|
|
|
154 |
print(hf_dataset)
|
155 |
print(f"Uploading to part {repo_id}:{split}...")
|
156 |
hf_dataset.push_to_hub(
|
157 |
repo_id=repo_id,
|
158 |
-
config_name=
|
159 |
split=split,
|
160 |
token=token,
|
161 |
commit_message=f"Add vision-arena {split} dataset",
|
|
|
2 |
import json
|
3 |
import os
|
4 |
import datasets
|
|
|
5 |
import datetime
|
6 |
from pathlib import Path
|
7 |
from datetime import datetime
|
8 |
from PIL import Image
|
9 |
|
10 |
datasets.config.DEFAULT_MAX_BATCH_SIZE = 500
|
11 |
+
def create_hf_dataset(data_file: str, split="test"):
|
12 |
+
hf_dataset = datasets.Dataset.from_list(
|
13 |
+
data_file,
|
14 |
+
features=datasets.Features(
|
15 |
{
|
16 |
+
"question_id": datasets.Value("string"),
|
17 |
+
"model": datasets.Value("string"),
|
18 |
+
"conversation": [
|
19 |
+
{
|
20 |
+
"role": datasets.Value("string"),
|
21 |
+
"content": datasets.Value("string"),
|
22 |
+
}
|
23 |
+
],
|
24 |
+
"language": datasets.Value("string"),
|
25 |
+
"image": datasets.Image(),
|
26 |
+
"turn": datasets.Value("int32"),
|
27 |
}
|
28 |
+
),
|
29 |
+
split=split,
|
30 |
+
)
|
31 |
+
return hf_dataset
|
32 |
+
|
33 |
+
def create_hf_battle_dataset(data_file: str, split="test"):
|
34 |
hf_dataset = datasets.Dataset.from_list(
|
35 |
data_file,
|
36 |
+
features=datasets.Features(
|
37 |
+
{
|
38 |
+
"question_id": datasets.Value("string"),
|
39 |
+
"model_a": datasets.Value("string"),
|
40 |
+
"model_b": datasets.Value("string"),
|
41 |
+
"conversation_a": [
|
42 |
+
{
|
43 |
+
"role": datasets.Value("string"),
|
44 |
+
"content": datasets.Value("string"),
|
45 |
+
}
|
46 |
+
],
|
47 |
+
"conversation_b": [
|
48 |
+
{
|
49 |
+
"role": datasets.Value("string"),
|
50 |
+
"content": datasets.Value("string"),
|
51 |
+
}
|
52 |
+
],
|
53 |
+
"language": datasets.Value("string"),
|
54 |
+
"image": datasets.Image(),
|
55 |
+
"turn": datasets.Value("int32"),
|
56 |
+
"anony": datasets.Value("bool"),
|
57 |
+
}
|
58 |
+
),
|
59 |
split=split,
|
60 |
)
|
61 |
return hf_dataset
|
|
|
81 |
def load_battle_image(battle, log_dir):
|
82 |
image_path = Path(log_dir) / f"{get_date_from_time_stamp(battle['tstamp'])}-convinput_images" / f"input_image_{battle['question_id']}.png"
|
83 |
return load_image(image_path)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
84 |
|
85 |
|
86 |
def main(
|
87 |
+
data_file: str = "./results/latest/clean_battle_conv.json",
|
88 |
+
repo_id: str = "DongfuTingle/wildvision-bench",
|
89 |
+
log_dir: str = os.getenv("LOGDIR", "./vision-arena-logs/"),
|
90 |
+
mode="battle",
|
91 |
+
token = os.environ.get("HUGGINGFACE_TOKEN", None)
|
|
|
|
|
|
|
|
|
92 |
):
|
|
|
|
|
|
|
|
|
93 |
with open(data_file, "r") as f:
|
94 |
data = json.load(f)
|
95 |
|
|
|
|
|
|
|
96 |
|
97 |
|
98 |
+
has_image_stats = {
|
99 |
+
"has_image": 0,
|
100 |
+
"no_image": 0,
|
|
|
|
|
101 |
}
|
102 |
+
if mode == "keep_bad_only":
|
103 |
+
# anony only
|
104 |
+
data = [d for d in data if d["anony"]]
|
105 |
+
|
106 |
+
new_data = []
|
107 |
+
for battle in data:
|
108 |
+
image = load_battle_image(battle, log_dir)
|
109 |
+
if image is None:
|
110 |
+
has_image_stats["no_image"] += 1
|
111 |
+
# we don't keep the data without image
|
112 |
+
continue
|
113 |
+
has_image_stats["has_image"] += 1
|
114 |
+
|
115 |
+
if battle["winner"] in ["model_a", "model_b"]:
|
116 |
+
if battle["winner"] == "model_a":
|
117 |
+
worse_model = "model_b"
|
118 |
+
worse_conv = "conversation_b"
|
119 |
+
if battle["winner"] == "model_b":
|
120 |
+
worse_model = "model_a"
|
121 |
+
worse_conv = "conversation_a"
|
122 |
+
|
123 |
+
new_data.append({
|
124 |
+
"question_id": battle["question_id"],
|
125 |
+
"model": battle[worse_model],
|
126 |
+
"conversation": battle[worse_conv],
|
127 |
+
"language": battle["language"],
|
128 |
+
"image": image,
|
129 |
+
"turn": battle["turn"],
|
130 |
+
})
|
131 |
+
elif battle["winner"] == "tie (bothbad)":
|
132 |
+
|
133 |
+
new_data.append({
|
134 |
+
"question_id": battle["question_id"],
|
135 |
+
"model": battle["model_a"],
|
136 |
+
"conversation": battle["conversation_a"],
|
137 |
+
"language": battle["language"],
|
138 |
+
"image": image,
|
139 |
+
"turn": battle["turn"],
|
140 |
+
})
|
141 |
|
142 |
+
new_data.append({
|
143 |
+
"question_id": battle["question_id"],
|
144 |
+
"model": battle["model_b"],
|
145 |
+
"conversation": battle["conversation_b"],
|
146 |
+
"language": battle["language"],
|
147 |
+
"image": image,
|
148 |
+
"turn": battle["turn"],
|
149 |
+
})
|
150 |
+
|
151 |
+
split = "test"
|
152 |
+
hf_dataset = create_hf_dataset(new_data, "test")
|
153 |
+
|
154 |
+
elif mode == "battle":
|
155 |
+
new_data = []
|
156 |
for battle in data:
|
157 |
+
image = load_battle_image(battle, log_dir)
|
158 |
+
if image is None:
|
159 |
+
has_image_stats["no_image"] += 1
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
160 |
continue
|
161 |
+
has_image_stats["has_image"] += 1
|
162 |
new_data.append({
|
163 |
+
"question_id": battle["question_id"],
|
164 |
+
"model_a": battle["model_a"],
|
165 |
+
"model_b": battle["model_b"],
|
166 |
+
"conversation_a": battle["conversation_a"],
|
167 |
+
"conversation_b": battle["conversation_b"],
|
168 |
+
"language": battle["language"],
|
169 |
+
"image": image,
|
170 |
+
"turn": battle["turn"],
|
171 |
+
"anony": battle["anony"],
|
|
|
|
|
172 |
})
|
173 |
split = "test"
|
174 |
+
hf_dataset = create_hf_battle_dataset(new_data, "test")
|
175 |
else:
|
176 |
+
raise ValueError(f"Invalid mode: {mode}")
|
177 |
|
178 |
+
print(f"Stats: {has_image_stats}")
|
179 |
print(hf_dataset)
|
180 |
print(f"Uploading to part {repo_id}:{split}...")
|
181 |
hf_dataset.push_to_hub(
|
182 |
repo_id=repo_id,
|
183 |
+
config_name=mode,
|
184 |
split=split,
|
185 |
token=token,
|
186 |
commit_message=f"Add vision-arena {split} dataset",
|
arena_elo/elo_rating/utils.py
CHANGED
@@ -3,20 +3,12 @@ import pytz
|
|
3 |
import PIL
|
4 |
import os
|
5 |
|
6 |
-
import sys
|
7 |
-
sys.path.append('../')
|
8 |
-
from model.model_registry import get_model_info
|
9 |
-
|
10 |
def detect_language(text: str) -> str:
|
11 |
"""Detect the langauge of a string."""
|
12 |
-
|
13 |
-
|
14 |
-
|
15 |
-
|
16 |
-
import pycld2
|
17 |
-
except ImportError as e:
|
18 |
-
print("Please install the required libraries: polyglot, pycld2: pip3 install polyglot pyicu pycld2")
|
19 |
-
exit(1)
|
20 |
|
21 |
polyglot_logger.setLevel("ERROR")
|
22 |
|
|
|
3 |
import PIL
|
4 |
import os
|
5 |
|
|
|
|
|
|
|
|
|
6 |
def detect_language(text: str) -> str:
|
7 |
"""Detect the langauge of a string."""
|
8 |
+
import polyglot # pip3 install polyglot pyicu pycld2
|
9 |
+
from polyglot.detect import Detector
|
10 |
+
from polyglot.detect.base import logger as polyglot_logger
|
11 |
+
import pycld2
|
|
|
|
|
|
|
|
|
12 |
|
13 |
polyglot_logger.setLevel("ERROR")
|
14 |
|
arena_elo/generation_model_info.json
ADDED
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"LCM": {
|
3 |
+
"Link": "https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7",
|
4 |
+
"License": "MIT License",
|
5 |
+
"Organization": "Tsinghua University"
|
6 |
+
},
|
7 |
+
"Playground v2": {
|
8 |
+
"Link": "https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic",
|
9 |
+
"License": "Playground v2 Community License",
|
10 |
+
"Organization": "Playground"
|
11 |
+
},
|
12 |
+
"OpenJourney": {
|
13 |
+
"Link": "https://huggingface.co/prompthero/openjourney",
|
14 |
+
"License": "creativeml-openrail-m",
|
15 |
+
"Organization": "PromptHero"
|
16 |
+
},
|
17 |
+
"SDXLTurbo": {
|
18 |
+
"Link": "https://huggingface.co/stabilityai/sdxl-turbo",
|
19 |
+
"License": "sai-nc-community (other)",
|
20 |
+
"Organization": "Stability AI"
|
21 |
+
},
|
22 |
+
"SDXL": {
|
23 |
+
"Link": "https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0",
|
24 |
+
"License": "openrail++",
|
25 |
+
"Organization": "Stability AI"
|
26 |
+
},
|
27 |
+
"PixArtAlpha": {
|
28 |
+
"Link": "https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS",
|
29 |
+
"License": "openrail++",
|
30 |
+
"Organization": "PixArt-alpha"
|
31 |
+
},
|
32 |
+
"SDXLLightning": {
|
33 |
+
"Link": "https://huggingface.co/ByteDance/SDXL-Lightning",
|
34 |
+
"License": "openrail++",
|
35 |
+
"Organization": "ByteDance"
|
36 |
+
},
|
37 |
+
"StableCascade": {
|
38 |
+
"Link": "https://huggingface.co/stabilityai/stable-cascade",
|
39 |
+
"License": "stable-cascade-nc-community (other)",
|
40 |
+
"Organization": "Stability AI"
|
41 |
+
}
|
42 |
+
}
|
arena_elo/results/20240315/elo_results_image_editing.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e528d30840c8a5787b0d2f08f27758b02f7eb718ccab695010b30df2127efe5e
|
3 |
+
size 57064
|
arena_elo/results/20240327/clean_battle_t2i_generation.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
arena_elo/results/20240327/elo_results_t2i_generation.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fec01fe5af62dce3990634cffd1d926330ccbf170ef0c3b5d2f07fb06c4cf149
|
3 |
+
size 65189
|
arena_elo/results/20240327/t2i_generation_leaderboard.csv
CHANGED
@@ -1,10 +1,11 @@
|
|
1 |
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
-
Playground v2.5,Playground v2.5,
|
3 |
-
StableCascade,StableCascade,
|
4 |
-
|
5 |
-
|
6 |
-
|
7 |
-
|
8 |
-
|
9 |
-
|
10 |
-
|
|
|
|
1 |
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
+
Playground v2.5,Playground v2.5,1212.4660228554317,1233.021110469063,N/A,N/A,N/A
|
3 |
+
StableCascade,StableCascade,1098.8180832734447,1081.4707812969855,stable-cascade-nc-community (other),Stability AI,https://huggingface.co/stabilityai/stable-cascade
|
4 |
+
PlayGroundV2,PlayGroundV2,1089.993871580802,1088.6262085724481,N/A,N/A,N/A
|
5 |
+
Playground v2,Playground v2,1049.6156124554975,1051.618375116693,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
|
6 |
+
SDXLLightning,SDXLLightning,1036.8582186059539,1039.3079223370821,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
|
7 |
+
PixArtAlpha,PixArtAlpha,1016.2085497703334,1002.5100184720693,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
|
8 |
+
SDXL,SDXL,960.5073412035289,965.3037978455568,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
|
9 |
+
SDXLTurbo,SDXLTurbo,907.997473382927,910.1644152252661,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
|
10 |
+
OpenJourney,OpenJourney,836.9689192463355,827.9470053715127,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
|
11 |
+
LCM,LCM,790.5659076257482,805.8155782210948,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
|
arena_elo/results/20240328/clean_battle_image_editing.json
DELETED
@@ -1,890 +0,0 @@
|
|
1 |
-
[
|
2 |
-
{
|
3 |
-
"model_a": "CycleDiffusion",
|
4 |
-
"model_b": "InstructPix2Pix",
|
5 |
-
"winner": "model_b",
|
6 |
-
"judge": "arena_user_::1",
|
7 |
-
"anony": true,
|
8 |
-
"tstamp": 1707712630.872
|
9 |
-
},
|
10 |
-
{
|
11 |
-
"model_a": "CycleDiffusion",
|
12 |
-
"model_b": "InstructPix2Pix",
|
13 |
-
"winner": "model_b",
|
14 |
-
"judge": "arena_user_::1",
|
15 |
-
"anony": false,
|
16 |
-
"tstamp": 1707712699.668
|
17 |
-
},
|
18 |
-
{
|
19 |
-
"model_a": "Pix2PixZero",
|
20 |
-
"model_b": "MagicBrush",
|
21 |
-
"winner": "model_a",
|
22 |
-
"judge": "arena_user_::1",
|
23 |
-
"anony": true,
|
24 |
-
"tstamp": 1707712896.0427
|
25 |
-
},
|
26 |
-
{
|
27 |
-
"model_a": "CycleDiffusion",
|
28 |
-
"model_b": "InstructPix2Pix",
|
29 |
-
"winner": "model_b",
|
30 |
-
"judge": "arena_user_::1",
|
31 |
-
"anony": false,
|
32 |
-
"tstamp": 1707712929.7061
|
33 |
-
},
|
34 |
-
{
|
35 |
-
"model_a": "CycleDiffusion",
|
36 |
-
"model_b": "InstructPix2Pix",
|
37 |
-
"winner": "model_b",
|
38 |
-
"judge": "arena_user_::1",
|
39 |
-
"anony": true,
|
40 |
-
"tstamp": 1707713147.0445
|
41 |
-
},
|
42 |
-
{
|
43 |
-
"model_a": "CycleDiffusion",
|
44 |
-
"model_b": "PNP",
|
45 |
-
"winner": "model_b",
|
46 |
-
"judge": "arena_user_::1",
|
47 |
-
"anony": true,
|
48 |
-
"tstamp": 1707713198.9284
|
49 |
-
},
|
50 |
-
{
|
51 |
-
"model_a": "CycleDiffusion",
|
52 |
-
"model_b": "Prompt2prompt",
|
53 |
-
"winner": "model_b",
|
54 |
-
"judge": "arena_user_::1",
|
55 |
-
"anony": true,
|
56 |
-
"tstamp": 1707713210.1306
|
57 |
-
},
|
58 |
-
{
|
59 |
-
"model_a": "Prompt2prompt",
|
60 |
-
"model_b": "SDEdit",
|
61 |
-
"winner": "model_a",
|
62 |
-
"judge": "arena_user_::1",
|
63 |
-
"anony": true,
|
64 |
-
"tstamp": 1707713747.5115
|
65 |
-
},
|
66 |
-
{
|
67 |
-
"model_a": "PNP",
|
68 |
-
"model_b": "Pix2PixZero",
|
69 |
-
"winner": "model_a",
|
70 |
-
"judge": "arena_user_::1",
|
71 |
-
"anony": true,
|
72 |
-
"tstamp": 1707715613.7226
|
73 |
-
},
|
74 |
-
{
|
75 |
-
"model_a": "CycleDiffusion",
|
76 |
-
"model_b": "MagicBrush",
|
77 |
-
"winner": "model_b",
|
78 |
-
"judge": "arena_user_::1",
|
79 |
-
"anony": true,
|
80 |
-
"tstamp": 1707765708.2644
|
81 |
-
},
|
82 |
-
{
|
83 |
-
"model_a": "PNP",
|
84 |
-
"model_b": "CycleDiffusion",
|
85 |
-
"winner": "model_a",
|
86 |
-
"judge": "arena_user_::1",
|
87 |
-
"anony": true,
|
88 |
-
"tstamp": 1707765861.2742
|
89 |
-
},
|
90 |
-
{
|
91 |
-
"model_a": "PNP",
|
92 |
-
"model_b": "CycleDiffusion",
|
93 |
-
"winner": "model_a",
|
94 |
-
"judge": "arena_user_::1",
|
95 |
-
"anony": false,
|
96 |
-
"tstamp": 1707765975.0206
|
97 |
-
},
|
98 |
-
{
|
99 |
-
"model_a": "PNP",
|
100 |
-
"model_b": "CycleDiffusion",
|
101 |
-
"winner": "model_a",
|
102 |
-
"judge": "arena_user_::1",
|
103 |
-
"anony": true,
|
104 |
-
"tstamp": 1707768866.9065
|
105 |
-
},
|
106 |
-
{
|
107 |
-
"model_a": "SDEdit",
|
108 |
-
"model_b": "MagicBrush",
|
109 |
-
"winner": "model_b",
|
110 |
-
"judge": "arena_user_::1",
|
111 |
-
"anony": true,
|
112 |
-
"tstamp": 1707771673.2989
|
113 |
-
},
|
114 |
-
{
|
115 |
-
"model_a": "SDEdit",
|
116 |
-
"model_b": "MagicBrush",
|
117 |
-
"winner": "model_b",
|
118 |
-
"judge": "arena_user_::1",
|
119 |
-
"anony": true,
|
120 |
-
"tstamp": 1707784377.6617
|
121 |
-
},
|
122 |
-
{
|
123 |
-
"model_a": "SDEdit",
|
124 |
-
"model_b": "MagicBrush",
|
125 |
-
"winner": "model_b",
|
126 |
-
"judge": "arena_user_::1",
|
127 |
-
"anony": true,
|
128 |
-
"tstamp": 1707784466.8915
|
129 |
-
},
|
130 |
-
{
|
131 |
-
"model_a": "CycleDiffusion",
|
132 |
-
"model_b": "PNP",
|
133 |
-
"winner": "model_b",
|
134 |
-
"judge": "arena_user_::1",
|
135 |
-
"anony": true,
|
136 |
-
"tstamp": 1707784983.9581
|
137 |
-
},
|
138 |
-
{
|
139 |
-
"model_a": "MagicBrush",
|
140 |
-
"model_b": "SDEdit",
|
141 |
-
"winner": "model_a",
|
142 |
-
"judge": "arena_user_::1",
|
143 |
-
"anony": true,
|
144 |
-
"tstamp": 1707785277.16
|
145 |
-
},
|
146 |
-
{
|
147 |
-
"model_a": "MagicBrush",
|
148 |
-
"model_b": "SDEdit",
|
149 |
-
"winner": "model_a",
|
150 |
-
"judge": "arena_user_::1",
|
151 |
-
"anony": true,
|
152 |
-
"tstamp": 1707795299.0619
|
153 |
-
},
|
154 |
-
{
|
155 |
-
"model_a": "MagicBrush",
|
156 |
-
"model_b": "SDEdit",
|
157 |
-
"winner": "tie (bothbad)",
|
158 |
-
"judge": "arena_user_::1",
|
159 |
-
"anony": true,
|
160 |
-
"tstamp": 1707795798.752
|
161 |
-
},
|
162 |
-
{
|
163 |
-
"model_a": "SDEdit",
|
164 |
-
"model_b": "Prompt2prompt",
|
165 |
-
"winner": "model_b",
|
166 |
-
"judge": "arena_user_::1",
|
167 |
-
"anony": false,
|
168 |
-
"tstamp": 1707796435.7996
|
169 |
-
},
|
170 |
-
{
|
171 |
-
"model_a": "SDEdit",
|
172 |
-
"model_b": "CycleDiffusion",
|
173 |
-
"winner": "model_b",
|
174 |
-
"judge": "arena_user_::1",
|
175 |
-
"anony": false,
|
176 |
-
"tstamp": 1707797278.7369
|
177 |
-
},
|
178 |
-
{
|
179 |
-
"model_a": "SDEdit",
|
180 |
-
"model_b": "CycleDiffusion",
|
181 |
-
"winner": "model_a",
|
182 |
-
"judge": "arena_user_::1",
|
183 |
-
"anony": false,
|
184 |
-
"tstamp": 1707797279.6004
|
185 |
-
},
|
186 |
-
{
|
187 |
-
"model_a": "SDEdit",
|
188 |
-
"model_b": "Prompt2prompt",
|
189 |
-
"winner": "model_b",
|
190 |
-
"judge": "arena_user_::1",
|
191 |
-
"anony": true,
|
192 |
-
"tstamp": 1707805086.9739
|
193 |
-
},
|
194 |
-
{
|
195 |
-
"model_a": "PNP",
|
196 |
-
"model_b": "SDEdit",
|
197 |
-
"winner": "model_a",
|
198 |
-
"judge": "arena_user_::1",
|
199 |
-
"anony": true,
|
200 |
-
"tstamp": 1707805220.3253
|
201 |
-
},
|
202 |
-
{
|
203 |
-
"model_a": "InstructPix2Pix",
|
204 |
-
"model_b": "CycleDiffusion",
|
205 |
-
"winner": "tie (bothbad)",
|
206 |
-
"judge": "arena_user_::1",
|
207 |
-
"anony": true,
|
208 |
-
"tstamp": 1707805332.6322
|
209 |
-
},
|
210 |
-
{
|
211 |
-
"model_a": "InstructPix2Pix",
|
212 |
-
"model_b": "Prompt2prompt",
|
213 |
-
"winner": "model_b",
|
214 |
-
"judge": "arena_user_::1",
|
215 |
-
"anony": true,
|
216 |
-
"tstamp": 1707805476.0509
|
217 |
-
},
|
218 |
-
{
|
219 |
-
"model_a": "InstructPix2Pix",
|
220 |
-
"model_b": "Prompt2prompt",
|
221 |
-
"winner": "model_b",
|
222 |
-
"judge": "arena_user_::1",
|
223 |
-
"anony": true,
|
224 |
-
"tstamp": 1707818374.3438
|
225 |
-
},
|
226 |
-
{
|
227 |
-
"model_a": "PNP",
|
228 |
-
"model_b": "Prompt2prompt",
|
229 |
-
"winner": "model_b",
|
230 |
-
"judge": "arena_user_::1",
|
231 |
-
"anony": true,
|
232 |
-
"tstamp": 1707834631.9088
|
233 |
-
},
|
234 |
-
{
|
235 |
-
"model_a": "InstructPix2Pix",
|
236 |
-
"model_b": "SDEdit",
|
237 |
-
"winner": "model_a",
|
238 |
-
"judge": "arena_user_::1",
|
239 |
-
"anony": true,
|
240 |
-
"tstamp": 1707834954.0147
|
241 |
-
},
|
242 |
-
{
|
243 |
-
"model_a": "Prompt2prompt",
|
244 |
-
"model_b": "Pix2PixZero",
|
245 |
-
"winner": "tie (bothbad)",
|
246 |
-
"judge": "arena_user_::1",
|
247 |
-
"anony": true,
|
248 |
-
"tstamp": 1707835366.544
|
249 |
-
},
|
250 |
-
{
|
251 |
-
"model_a": "PNP",
|
252 |
-
"model_b": "SDEdit",
|
253 |
-
"winner": "model_a",
|
254 |
-
"judge": "arena_user_::1",
|
255 |
-
"anony": true,
|
256 |
-
"tstamp": 1707835643.6178
|
257 |
-
},
|
258 |
-
{
|
259 |
-
"model_a": "MagicBrush",
|
260 |
-
"model_b": "InstructPix2Pix",
|
261 |
-
"winner": "tie (bothbad)",
|
262 |
-
"judge": "arena_user_::1",
|
263 |
-
"anony": true,
|
264 |
-
"tstamp": 1707835789.25
|
265 |
-
},
|
266 |
-
{
|
267 |
-
"model_a": "MagicBrush",
|
268 |
-
"model_b": "PNP",
|
269 |
-
"winner": "tie (bothbad)",
|
270 |
-
"judge": "arena_user_::1",
|
271 |
-
"anony": true,
|
272 |
-
"tstamp": 1707836852.671
|
273 |
-
},
|
274 |
-
{
|
275 |
-
"model_a": "MagicBrush",
|
276 |
-
"model_b": "InstructPix2Pix",
|
277 |
-
"winner": "model_a",
|
278 |
-
"judge": "arena_user_::1",
|
279 |
-
"anony": false,
|
280 |
-
"tstamp": 1707836952.6082
|
281 |
-
},
|
282 |
-
{
|
283 |
-
"model_a": "CycleDiffusion",
|
284 |
-
"model_b": "SDEdit",
|
285 |
-
"winner": "tie (bothbad)",
|
286 |
-
"judge": "arena_user_::1",
|
287 |
-
"anony": false,
|
288 |
-
"tstamp": 1707837020.7148
|
289 |
-
},
|
290 |
-
{
|
291 |
-
"model_a": "InstructPix2Pix",
|
292 |
-
"model_b": "PNP",
|
293 |
-
"winner": "model_a",
|
294 |
-
"judge": "arena_user_::1",
|
295 |
-
"anony": true,
|
296 |
-
"tstamp": 1707837226.2259
|
297 |
-
},
|
298 |
-
{
|
299 |
-
"model_a": "Prompt2prompt",
|
300 |
-
"model_b": "Pix2PixZero",
|
301 |
-
"winner": "model_a",
|
302 |
-
"judge": "arena_user_::1",
|
303 |
-
"anony": true,
|
304 |
-
"tstamp": 1707838166.1449
|
305 |
-
},
|
306 |
-
{
|
307 |
-
"model_a": "InstructPix2Pix",
|
308 |
-
"model_b": "MagicBrush",
|
309 |
-
"winner": "tie (bothbad)",
|
310 |
-
"judge": "arena_user_::1",
|
311 |
-
"anony": true,
|
312 |
-
"tstamp": 1707838405.0013
|
313 |
-
},
|
314 |
-
{
|
315 |
-
"model_a": "MagicBrush",
|
316 |
-
"model_b": "CycleDiffusion",
|
317 |
-
"winner": "model_a",
|
318 |
-
"judge": "arena_user_::1",
|
319 |
-
"anony": true,
|
320 |
-
"tstamp": 1707839133.3126
|
321 |
-
},
|
322 |
-
{
|
323 |
-
"model_a": "Prompt2prompt",
|
324 |
-
"model_b": "InstructPix2Pix",
|
325 |
-
"winner": "model_a",
|
326 |
-
"judge": "arena_user_::1",
|
327 |
-
"anony": true,
|
328 |
-
"tstamp": 1707839484.6824
|
329 |
-
},
|
330 |
-
{
|
331 |
-
"model_a": "PNP",
|
332 |
-
"model_b": "InstructPix2Pix",
|
333 |
-
"winner": "tie (bothbad)",
|
334 |
-
"judge": "arena_user_::1",
|
335 |
-
"anony": true,
|
336 |
-
"tstamp": 1707850104.2499
|
337 |
-
},
|
338 |
-
{
|
339 |
-
"model_a": "InstructPix2Pix",
|
340 |
-
"model_b": "Pix2PixZero",
|
341 |
-
"winner": "model_a",
|
342 |
-
"judge": "arena_user_::1",
|
343 |
-
"anony": true,
|
344 |
-
"tstamp": 1707851384.7689
|
345 |
-
},
|
346 |
-
{
|
347 |
-
"model_a": "PNP",
|
348 |
-
"model_b": "MagicBrush",
|
349 |
-
"winner": "model_b",
|
350 |
-
"judge": "arena_user_::1",
|
351 |
-
"anony": true,
|
352 |
-
"tstamp": 1707851936.9466
|
353 |
-
},
|
354 |
-
{
|
355 |
-
"model_a": "CycleDiffusion",
|
356 |
-
"model_b": "MagicBrush",
|
357 |
-
"winner": "tie (bothbad)",
|
358 |
-
"judge": "arena_user_::1",
|
359 |
-
"anony": true,
|
360 |
-
"tstamp": 1707852836.3291
|
361 |
-
},
|
362 |
-
{
|
363 |
-
"model_a": "CycleDiffusion",
|
364 |
-
"model_b": "MagicBrush",
|
365 |
-
"winner": "tie (bothbad)",
|
366 |
-
"judge": "arena_user_::1",
|
367 |
-
"anony": false,
|
368 |
-
"tstamp": 1707852878.673
|
369 |
-
},
|
370 |
-
{
|
371 |
-
"model_a": "Prompt2prompt",
|
372 |
-
"model_b": "InstructPix2Pix",
|
373 |
-
"winner": "model_a",
|
374 |
-
"judge": "arena_user_::1",
|
375 |
-
"anony": true,
|
376 |
-
"tstamp": 1707853008.1359
|
377 |
-
},
|
378 |
-
{
|
379 |
-
"model_a": "InstructPix2Pix",
|
380 |
-
"model_b": "Pix2PixZero",
|
381 |
-
"winner": "model_a",
|
382 |
-
"judge": "arena_user_::1",
|
383 |
-
"anony": false,
|
384 |
-
"tstamp": 1707856807.6229
|
385 |
-
},
|
386 |
-
{
|
387 |
-
"model_a": "MagicBrush",
|
388 |
-
"model_b": "Pix2PixZero",
|
389 |
-
"winner": "tie (bothbad)",
|
390 |
-
"judge": "arena_user_::1",
|
391 |
-
"anony": false,
|
392 |
-
"tstamp": 1707863740.3507
|
393 |
-
},
|
394 |
-
{
|
395 |
-
"model_a": "MagicBrush",
|
396 |
-
"model_b": "PNP",
|
397 |
-
"winner": "model_b",
|
398 |
-
"judge": "arena_user_::1",
|
399 |
-
"anony": true,
|
400 |
-
"tstamp": 1707866312.1118
|
401 |
-
},
|
402 |
-
{
|
403 |
-
"model_a": "Pix2PixZero",
|
404 |
-
"model_b": "Prompt2prompt",
|
405 |
-
"winner": "model_b",
|
406 |
-
"judge": "arena_user_::1",
|
407 |
-
"anony": true,
|
408 |
-
"tstamp": 1707883083.3533
|
409 |
-
},
|
410 |
-
{
|
411 |
-
"model_a": "Pix2PixZero",
|
412 |
-
"model_b": "InstructPix2Pix",
|
413 |
-
"winner": "model_b",
|
414 |
-
"judge": "arena_user_::1",
|
415 |
-
"anony": true,
|
416 |
-
"tstamp": 1707883181.1397
|
417 |
-
},
|
418 |
-
{
|
419 |
-
"model_a": "Pix2PixZero",
|
420 |
-
"model_b": "Prompt2prompt",
|
421 |
-
"winner": "model_b",
|
422 |
-
"judge": "arena_user_::1",
|
423 |
-
"anony": true,
|
424 |
-
"tstamp": 1707883187.9173
|
425 |
-
},
|
426 |
-
{
|
427 |
-
"model_a": "PNP",
|
428 |
-
"model_b": "Prompt2prompt",
|
429 |
-
"winner": "model_a",
|
430 |
-
"judge": "arena_user_::1",
|
431 |
-
"anony": true,
|
432 |
-
"tstamp": 1707883507.587
|
433 |
-
},
|
434 |
-
{
|
435 |
-
"model_a": "Prompt2prompt",
|
436 |
-
"model_b": "CycleDiffusion",
|
437 |
-
"winner": "model_a",
|
438 |
-
"judge": "arena_user_::1",
|
439 |
-
"anony": true,
|
440 |
-
"tstamp": 1707883939.6125
|
441 |
-
},
|
442 |
-
{
|
443 |
-
"model_a": "Prompt2prompt",
|
444 |
-
"model_b": "MagicBrush",
|
445 |
-
"winner": "model_b",
|
446 |
-
"judge": "arena_user_::1",
|
447 |
-
"anony": true,
|
448 |
-
"tstamp": 1707892689.4407
|
449 |
-
},
|
450 |
-
{
|
451 |
-
"model_a": "MagicBrush",
|
452 |
-
"model_b": "InstructPix2Pix",
|
453 |
-
"winner": "model_b",
|
454 |
-
"judge": "arena_user_::1",
|
455 |
-
"anony": true,
|
456 |
-
"tstamp": 1707908988.749
|
457 |
-
},
|
458 |
-
{
|
459 |
-
"model_a": "Prompt2prompt",
|
460 |
-
"model_b": "InstructPix2Pix",
|
461 |
-
"winner": "model_a",
|
462 |
-
"judge": "arena_user_::1",
|
463 |
-
"anony": true,
|
464 |
-
"tstamp": 1707912639.2701
|
465 |
-
},
|
466 |
-
{
|
467 |
-
"model_a": "MagicBrush",
|
468 |
-
"model_b": "Pix2PixZero",
|
469 |
-
"winner": "model_a",
|
470 |
-
"judge": "arena_user_::1",
|
471 |
-
"anony": false,
|
472 |
-
"tstamp": 1707917685.9574
|
473 |
-
},
|
474 |
-
{
|
475 |
-
"model_a": "MagicBrush",
|
476 |
-
"model_b": "InstructPix2Pix",
|
477 |
-
"winner": "tie (bothbad)",
|
478 |
-
"judge": "arena_user_::1",
|
479 |
-
"anony": false,
|
480 |
-
"tstamp": 1707919429.336
|
481 |
-
},
|
482 |
-
{
|
483 |
-
"model_a": "InstructPix2Pix",
|
484 |
-
"model_b": "CycleDiffusion",
|
485 |
-
"winner": "model_a",
|
486 |
-
"judge": "arena_user_::1",
|
487 |
-
"anony": true,
|
488 |
-
"tstamp": 1707932651.9192
|
489 |
-
},
|
490 |
-
{
|
491 |
-
"model_a": "MagicBrush",
|
492 |
-
"model_b": "InstructPix2Pix",
|
493 |
-
"winner": "model_a",
|
494 |
-
"judge": "arena_user_::1",
|
495 |
-
"anony": true,
|
496 |
-
"tstamp": 1707932749.3107
|
497 |
-
},
|
498 |
-
{
|
499 |
-
"model_a": "Prompt2prompt",
|
500 |
-
"model_b": "PNP",
|
501 |
-
"winner": "model_a",
|
502 |
-
"judge": "arena_user_::1",
|
503 |
-
"anony": true,
|
504 |
-
"tstamp": 1707933208.5797
|
505 |
-
},
|
506 |
-
{
|
507 |
-
"model_a": "MagicBrush",
|
508 |
-
"model_b": "Pix2PixZero",
|
509 |
-
"winner": "model_a",
|
510 |
-
"judge": "arena_user_::1",
|
511 |
-
"anony": false,
|
512 |
-
"tstamp": 1707945335.6341
|
513 |
-
},
|
514 |
-
{
|
515 |
-
"model_a": "MagicBrush",
|
516 |
-
"model_b": "PNP",
|
517 |
-
"winner": "model_a",
|
518 |
-
"judge": "arena_user_::1",
|
519 |
-
"anony": false,
|
520 |
-
"tstamp": 1708031168.6838
|
521 |
-
},
|
522 |
-
{
|
523 |
-
"model_a": "Pix2PixZero",
|
524 |
-
"model_b": "PNP",
|
525 |
-
"winner": "model_b",
|
526 |
-
"judge": "arena_user_::1",
|
527 |
-
"anony": false,
|
528 |
-
"tstamp": 1708038931.5388
|
529 |
-
},
|
530 |
-
{
|
531 |
-
"model_a": "Pix2PixZero",
|
532 |
-
"model_b": "CycleDiffusion",
|
533 |
-
"winner": "tie (bothbad)",
|
534 |
-
"judge": "arena_user_::1",
|
535 |
-
"anony": true,
|
536 |
-
"tstamp": 1708057382.78
|
537 |
-
},
|
538 |
-
{
|
539 |
-
"model_a": "PNP",
|
540 |
-
"model_b": "InstructPix2Pix",
|
541 |
-
"winner": "model_b",
|
542 |
-
"judge": "arena_user_::1",
|
543 |
-
"anony": true,
|
544 |
-
"tstamp": 1708093689.8237
|
545 |
-
},
|
546 |
-
{
|
547 |
-
"model_a": "MagicBrush",
|
548 |
-
"model_b": "PNP",
|
549 |
-
"winner": "model_b",
|
550 |
-
"judge": "arena_user_::1",
|
551 |
-
"anony": true,
|
552 |
-
"tstamp": 1708093910.4683
|
553 |
-
},
|
554 |
-
{
|
555 |
-
"model_a": "Pix2PixZero",
|
556 |
-
"model_b": "Prompt2prompt",
|
557 |
-
"winner": "model_b",
|
558 |
-
"judge": "arena_user_::1",
|
559 |
-
"anony": false,
|
560 |
-
"tstamp": 1708095090.8232
|
561 |
-
},
|
562 |
-
{
|
563 |
-
"model_a": "Pix2PixZero",
|
564 |
-
"model_b": "Prompt2prompt",
|
565 |
-
"winner": "model_a",
|
566 |
-
"judge": "arena_user_::1",
|
567 |
-
"anony": false,
|
568 |
-
"tstamp": 1708095305.4665
|
569 |
-
},
|
570 |
-
{
|
571 |
-
"model_a": "InstructPix2Pix",
|
572 |
-
"model_b": "Prompt2prompt",
|
573 |
-
"winner": "model_b",
|
574 |
-
"judge": "arena_user_::1",
|
575 |
-
"anony": true,
|
576 |
-
"tstamp": 1708140553.1694
|
577 |
-
},
|
578 |
-
{
|
579 |
-
"model_a": "MagicBrush",
|
580 |
-
"model_b": "Prompt2prompt",
|
581 |
-
"winner": "model_a",
|
582 |
-
"judge": "arena_user_::1",
|
583 |
-
"anony": true,
|
584 |
-
"tstamp": 1708145512.3656
|
585 |
-
},
|
586 |
-
{
|
587 |
-
"model_a": "Pix2PixZero",
|
588 |
-
"model_b": "Prompt2prompt",
|
589 |
-
"winner": "tie (bothbad)",
|
590 |
-
"judge": "arena_user_::1",
|
591 |
-
"anony": true,
|
592 |
-
"tstamp": 1708145724.4127
|
593 |
-
},
|
594 |
-
{
|
595 |
-
"model_a": "Pix2PixZero",
|
596 |
-
"model_b": "PNP",
|
597 |
-
"winner": "model_b",
|
598 |
-
"judge": "arena_user_::1",
|
599 |
-
"anony": true,
|
600 |
-
"tstamp": 1708146846.5098
|
601 |
-
},
|
602 |
-
{
|
603 |
-
"model_a": "PNP",
|
604 |
-
"model_b": "MagicBrush",
|
605 |
-
"winner": "model_a",
|
606 |
-
"judge": "arena_user_::1",
|
607 |
-
"anony": true,
|
608 |
-
"tstamp": 1708189738.4864
|
609 |
-
},
|
610 |
-
{
|
611 |
-
"model_a": "Prompt2prompt",
|
612 |
-
"model_b": "InstructPix2Pix",
|
613 |
-
"winner": "model_b",
|
614 |
-
"judge": "arena_user_::1",
|
615 |
-
"anony": true,
|
616 |
-
"tstamp": 1708235874.9246
|
617 |
-
},
|
618 |
-
{
|
619 |
-
"model_a": "Pix2PixZero",
|
620 |
-
"model_b": "PNP",
|
621 |
-
"winner": "model_b",
|
622 |
-
"judge": "arena_user_::1",
|
623 |
-
"anony": false,
|
624 |
-
"tstamp": 1708257619.7115
|
625 |
-
},
|
626 |
-
{
|
627 |
-
"model_a": "MagicBrush",
|
628 |
-
"model_b": "Pix2PixZero",
|
629 |
-
"winner": "tie (bothbad)",
|
630 |
-
"judge": "arena_user_::1",
|
631 |
-
"anony": true,
|
632 |
-
"tstamp": 1708341265.7655
|
633 |
-
},
|
634 |
-
{
|
635 |
-
"model_a": "MagicBrush",
|
636 |
-
"model_b": "InstructPix2Pix",
|
637 |
-
"winner": "model_b",
|
638 |
-
"judge": "arena_user_::1",
|
639 |
-
"anony": true,
|
640 |
-
"tstamp": 1708350183.3086
|
641 |
-
},
|
642 |
-
{
|
643 |
-
"model_a": "MagicBrush",
|
644 |
-
"model_b": "Pix2PixZero",
|
645 |
-
"winner": "tie (bothbad)",
|
646 |
-
"judge": "arena_user_::1",
|
647 |
-
"anony": true,
|
648 |
-
"tstamp": 1708399707.1681
|
649 |
-
},
|
650 |
-
{
|
651 |
-
"model_a": "PNP",
|
652 |
-
"model_b": "MagicBrush",
|
653 |
-
"winner": "model_a",
|
654 |
-
"judge": "arena_user_::1",
|
655 |
-
"anony": true,
|
656 |
-
"tstamp": 1708441502.4707
|
657 |
-
},
|
658 |
-
{
|
659 |
-
"model_a": "InstructPix2Pix",
|
660 |
-
"model_b": "MagicBrush",
|
661 |
-
"winner": "model_a",
|
662 |
-
"judge": "arena_user_::1",
|
663 |
-
"anony": true,
|
664 |
-
"tstamp": 1708441716.8195
|
665 |
-
},
|
666 |
-
{
|
667 |
-
"model_a": "InstructPix2Pix",
|
668 |
-
"model_b": "MagicBrush",
|
669 |
-
"winner": "model_b",
|
670 |
-
"judge": "arena_user_::1",
|
671 |
-
"anony": false,
|
672 |
-
"tstamp": 1708546759.2009
|
673 |
-
},
|
674 |
-
{
|
675 |
-
"model_a": "InstructPix2Pix",
|
676 |
-
"model_b": "MagicBrush",
|
677 |
-
"winner": "model_a",
|
678 |
-
"judge": "arena_user_::1",
|
679 |
-
"anony": false,
|
680 |
-
"tstamp": 1708546805.4892
|
681 |
-
},
|
682 |
-
{
|
683 |
-
"model_a": "Pix2PixZero",
|
684 |
-
"model_b": "CycleDiffusion",
|
685 |
-
"winner": "tie (bothbad)",
|
686 |
-
"judge": "arena_user_::1",
|
687 |
-
"anony": true,
|
688 |
-
"tstamp": 1708547082.7124
|
689 |
-
},
|
690 |
-
{
|
691 |
-
"model_a": "InstructPix2Pix",
|
692 |
-
"model_b": "MagicBrush",
|
693 |
-
"winner": "model_b",
|
694 |
-
"judge": "arena_user_::1",
|
695 |
-
"anony": false,
|
696 |
-
"tstamp": 1708547166.9685
|
697 |
-
},
|
698 |
-
{
|
699 |
-
"model_a": "InstructPix2Pix",
|
700 |
-
"model_b": "MagicBrush",
|
701 |
-
"winner": "model_b",
|
702 |
-
"judge": "arena_user_::1",
|
703 |
-
"anony": false,
|
704 |
-
"tstamp": 1708547293.7107
|
705 |
-
},
|
706 |
-
{
|
707 |
-
"model_a": "CycleDiffusion",
|
708 |
-
"model_b": "PNP",
|
709 |
-
"winner": "tie (bothbad)",
|
710 |
-
"judge": "arena_user_::1",
|
711 |
-
"anony": true,
|
712 |
-
"tstamp": 1708575046.0529
|
713 |
-
},
|
714 |
-
{
|
715 |
-
"model_a": "CycleDiffusion",
|
716 |
-
"model_b": "MagicBrush",
|
717 |
-
"winner": "tie (bothbad)",
|
718 |
-
"judge": "arena_user_::1",
|
719 |
-
"anony": true,
|
720 |
-
"tstamp": 1708615466.9264
|
721 |
-
},
|
722 |
-
{
|
723 |
-
"model_a": "CycleDiffusion",
|
724 |
-
"model_b": "MagicBrush",
|
725 |
-
"winner": "model_b",
|
726 |
-
"judge": "arena_user_::1",
|
727 |
-
"anony": false,
|
728 |
-
"tstamp": 1708615516.3341
|
729 |
-
},
|
730 |
-
{
|
731 |
-
"model_a": "InstructPix2Pix",
|
732 |
-
"model_b": "PNP",
|
733 |
-
"winner": "model_b",
|
734 |
-
"judge": "arena_user_::1",
|
735 |
-
"anony": false,
|
736 |
-
"tstamp": 1709205399.0098
|
737 |
-
},
|
738 |
-
{
|
739 |
-
"model_a": "InstructPix2Pix",
|
740 |
-
"model_b": "PNP",
|
741 |
-
"winner": "model_b",
|
742 |
-
"judge": "arena_user_::1",
|
743 |
-
"anony": false,
|
744 |
-
"tstamp": 1709205767.8923
|
745 |
-
},
|
746 |
-
{
|
747 |
-
"model_a": "PNP",
|
748 |
-
"model_b": "InstructPix2Pix",
|
749 |
-
"winner": "model_b",
|
750 |
-
"judge": "arena_user_::1",
|
751 |
-
"anony": true,
|
752 |
-
"tstamp": 1709443700.05
|
753 |
-
},
|
754 |
-
{
|
755 |
-
"model_a": "MagicBrush",
|
756 |
-
"model_b": "Pix2PixZero",
|
757 |
-
"winner": "model_a",
|
758 |
-
"judge": "arena_user_::1",
|
759 |
-
"anony": true,
|
760 |
-
"tstamp": 1709702898.9291
|
761 |
-
},
|
762 |
-
{
|
763 |
-
"model_a": "CycleDiffusion",
|
764 |
-
"model_b": "Prompt2prompt",
|
765 |
-
"winner": "tie (bothbad)",
|
766 |
-
"judge": "arena_user_::1",
|
767 |
-
"anony": true,
|
768 |
-
"tstamp": 1710091925.1861
|
769 |
-
},
|
770 |
-
{
|
771 |
-
"model_a": "MagicBrush",
|
772 |
-
"model_b": "InstructPix2Pix",
|
773 |
-
"winner": "tie (bothbad)",
|
774 |
-
"judge": "arena_user_::1",
|
775 |
-
"anony": true,
|
776 |
-
"tstamp": 1710517781.1525
|
777 |
-
},
|
778 |
-
{
|
779 |
-
"model_a": "MagicBrush",
|
780 |
-
"model_b": "InstructPix2Pix",
|
781 |
-
"winner": "tie (bothbad)",
|
782 |
-
"judge": "arena_user_::1",
|
783 |
-
"anony": false,
|
784 |
-
"tstamp": 1710517859.2942
|
785 |
-
},
|
786 |
-
{
|
787 |
-
"model_a": "Pix2PixZero",
|
788 |
-
"model_b": "CycleDiffusion",
|
789 |
-
"winner": "tie (bothbad)",
|
790 |
-
"judge": "arena_user_::1",
|
791 |
-
"anony": true,
|
792 |
-
"tstamp": 1710535672.9791
|
793 |
-
},
|
794 |
-
{
|
795 |
-
"model_a": "CycleDiffusion",
|
796 |
-
"model_b": "Pix2PixZero",
|
797 |
-
"winner": "model_b",
|
798 |
-
"judge": "arena_user_10.16.25.191",
|
799 |
-
"anony": false,
|
800 |
-
"tstamp": 1711610477.1213
|
801 |
-
},
|
802 |
-
{
|
803 |
-
"model_a": "CycleDiffusion",
|
804 |
-
"model_b": "Pix2PixZero",
|
805 |
-
"winner": "model_b",
|
806 |
-
"judge": "arena_user_10.16.7.189",
|
807 |
-
"anony": false,
|
808 |
-
"tstamp": 1711629129.3894
|
809 |
-
},
|
810 |
-
{
|
811 |
-
"model_a": "InstructPix2Pix",
|
812 |
-
"model_b": "CycleDiffusion",
|
813 |
-
"winner": "model_b",
|
814 |
-
"judge": "arena_user_10.16.7.189",
|
815 |
-
"anony": false,
|
816 |
-
"tstamp": 1711629705.2246
|
817 |
-
},
|
818 |
-
{
|
819 |
-
"model_a": "CycleDiffusion",
|
820 |
-
"model_b": "Pix2PixZero",
|
821 |
-
"winner": "model_b",
|
822 |
-
"judge": "arena_user_10.16.25.191",
|
823 |
-
"anony": false,
|
824 |
-
"tstamp": 1711630362.5575
|
825 |
-
},
|
826 |
-
{
|
827 |
-
"model_a": "MagicBrush",
|
828 |
-
"model_b": "SDEdit",
|
829 |
-
"winner": "model_a",
|
830 |
-
"judge": "arena_user_127.0.0.1",
|
831 |
-
"anony": false,
|
832 |
-
"tstamp": 1711631112.5207
|
833 |
-
},
|
834 |
-
{
|
835 |
-
"model_a": "Pix2PixZero",
|
836 |
-
"model_b": "Prompt2prompt",
|
837 |
-
"winner": "model_a",
|
838 |
-
"judge": "arena_user_10.16.41.118",
|
839 |
-
"anony": false,
|
840 |
-
"tstamp": 1711631690.5127
|
841 |
-
},
|
842 |
-
{
|
843 |
-
"model_a": "MagicBrush",
|
844 |
-
"model_b": "InstructPix2Pix",
|
845 |
-
"winner": "model_a",
|
846 |
-
"judge": "arena_user_127.0.0.1",
|
847 |
-
"anony": false,
|
848 |
-
"tstamp": 1711633200.2923
|
849 |
-
},
|
850 |
-
{
|
851 |
-
"model_a": "MagicBrush",
|
852 |
-
"model_b": "InstructPix2Pix",
|
853 |
-
"winner": "model_a",
|
854 |
-
"judge": "arena_user_127.0.0.1",
|
855 |
-
"anony": false,
|
856 |
-
"tstamp": 1711633594.9922
|
857 |
-
},
|
858 |
-
{
|
859 |
-
"model_a": "MagicBrush",
|
860 |
-
"model_b": "SDEdit",
|
861 |
-
"winner": "model_a",
|
862 |
-
"judge": "arena_user_10.16.7.189",
|
863 |
-
"anony": false,
|
864 |
-
"tstamp": 1711635443.3071
|
865 |
-
},
|
866 |
-
{
|
867 |
-
"model_a": "CycleDiffusion",
|
868 |
-
"model_b": "MagicBrush",
|
869 |
-
"winner": "model_b",
|
870 |
-
"judge": "arena_user_10.16.25.191",
|
871 |
-
"anony": false,
|
872 |
-
"tstamp": 1711635899.3088
|
873 |
-
},
|
874 |
-
{
|
875 |
-
"model_a": "SDEdit",
|
876 |
-
"model_b": "MagicBrush",
|
877 |
-
"winner": "model_b",
|
878 |
-
"judge": "arena_user_10.16.41.118",
|
879 |
-
"anony": false,
|
880 |
-
"tstamp": 1711639015.428
|
881 |
-
},
|
882 |
-
{
|
883 |
-
"model_a": "InstructPix2Pix",
|
884 |
-
"model_b": "MagicBrush",
|
885 |
-
"winner": "model_b",
|
886 |
-
"judge": "arena_user_10.16.7.189",
|
887 |
-
"anony": false,
|
888 |
-
"tstamp": 1711646372.1201
|
889 |
-
}
|
890 |
-
]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
arena_elo/results/20240328/elo_results_image_editing.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:1430e6703dd6fc1e5b8ce06b11bb3a47516763a33edaf99e4c8547da5d9a8516
|
3 |
-
size 57064
|
|
|
|
|
|
|
|
arena_elo/results/20240328/image_editing_leaderboard.csv
DELETED
@@ -1,8 +0,0 @@
|
|
1 |
-
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
-
Prompt2prompt,Prompt2prompt,1227.5508595026165,1158.5510681980204,Apache-2.0,"Google, Tel Aviv University",https://prompt-to-prompt.github.io
|
3 |
-
InstructPix2Pix,InstructPix2Pix,1160.2057367236093,1071.0628993075604,"Copyright 2023 Timothy Brooks, Aleksander Holynski, Alexei A. Efros","University of California, Berkeley",https://www.timothybrooks.com/instruct-pix2pix
|
4 |
-
PNP,PNP,1142.693603173293,1165.4957550490212,-,Weizmann Institute of Science,https://github.com/MichalGeyer/plug-and-play
|
5 |
-
MagicBrush,MagicBrush,1053.1728944865915,1130.5422054860635,CC-BY-4.0,"The Ohio State University, University of Waterloo",https://osu-nlp-group.github.io/MagicBrush
|
6 |
-
Pix2PixZero,Pix2PixZero,918.6047552604578,960.3217617445996,MIT License,"Carnegie Mellon University, Adobe Research",https://pix2pixzero.github.io
|
7 |
-
CycleDiffusion,CycleDiffusion,865.0529105743963,813.4794423328381,X11,Carnegie Mellon University,https://github.com/ChenWu98/cycle-diffusion
|
8 |
-
SDEdit,SDEdit,632.7192402790356,700.546867881897,MIT License,Stanford University,https://sde-image-editing.github.io
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
arena_elo/results/20240330/elo_results_t2i_generation.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:e963f9d4b66d29c2f05a3923eff56cebd1f09b07223ac069456e08dc6143cda8
|
3 |
-
size 66894
|
|
|
|
|
|
|
|
arena_elo/results/20240330/t2i_generation_leaderboard.csv
DELETED
@@ -1,10 +0,0 @@
|
|
1 |
-
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
-
Playground v2.5,Playground v2.5,1226.2872445351936,1236.5076527218755,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
|
3 |
-
StableCascade,StableCascade,1105.3322734027522,1062.0980902577003,stable-cascade-nc-community (other),Stability AI,https://huggingface.co/stabilityai/stable-cascade
|
4 |
-
Playground v2,Playground v2,1091.4371447234744,1087.3576445526567,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
|
5 |
-
SDXLLightning,SDXLLightning,1043.235902888147,1019.4526672266176,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
|
6 |
-
PixArtAlpha,PixArtAlpha,1020.6412075829058,1001.5090282446616,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
|
7 |
-
SDXL,SDXL,964.7626495363717,969.8928133531979,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
|
8 |
-
SDXLTurbo,SDXLTurbo,912.2113859675355,914.9478831930971,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
|
9 |
-
OpenJourney,OpenJourney,841.2224045541894,835.4563491411935,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
|
10 |
-
LCM,LCM,794.8697868094328,812.962889153237,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
arena_elo/results/20240408/clean_battle_t2i_generation.json
DELETED
The diff for this file is too large to render.
See raw diff
|
|
arena_elo/results/20240408/elo_results_t2i_generation.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:dd88783d1cf752a0977152f7e16e88b54759173cbb04fb55e9392703ff4819f5
|
3 |
-
size 66931
|
|
|
|
|
|
|
|
arena_elo/results/20240408/t2i_generation_leaderboard.csv
DELETED
@@ -1,10 +0,0 @@
|
|
1 |
-
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
-
Playground v2.5,Playground v2.5,1226.2872445351936,1233.8616648345985,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
|
3 |
-
StableCascade,StableCascade,1105.3322734027522,1031.1844458387527,stable-cascade-nc-community (other),Stability AI,https://huggingface.co/stabilityai/stable-cascade
|
4 |
-
Playground v2,Playground v2,1091.4371447234744,1093.6921447327898,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
|
5 |
-
SDXLLightning,SDXLLightning,1043.235902888147,1004.2360415152086,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
|
6 |
-
PixArtAlpha,PixArtAlpha,1020.6412075829058,999.6264863931511,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
|
7 |
-
SDXL,SDXL,964.7626495363717,975.3460583905047,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
|
8 |
-
SDXLTurbo,SDXLTurbo,912.2113859675355,927.1873122981513,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
|
9 |
-
OpenJourney,OpenJourney,841.2224045541894,848.6657236271969,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
|
10 |
-
LCM,LCM,794.8697868094328,828.5108951096241,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
arena_elo/results/20240411/clean_battle_image_editing.json
DELETED
@@ -1,906 +0,0 @@
|
|
1 |
-
[
|
2 |
-
{
|
3 |
-
"model_a": "CycleDiffusion",
|
4 |
-
"model_b": "InstructPix2Pix",
|
5 |
-
"winner": "model_b",
|
6 |
-
"judge": "arena_user_::1",
|
7 |
-
"anony": true,
|
8 |
-
"tstamp": 1707712630.872
|
9 |
-
},
|
10 |
-
{
|
11 |
-
"model_a": "CycleDiffusion",
|
12 |
-
"model_b": "InstructPix2Pix",
|
13 |
-
"winner": "model_b",
|
14 |
-
"judge": "arena_user_::1",
|
15 |
-
"anony": false,
|
16 |
-
"tstamp": 1707712699.668
|
17 |
-
},
|
18 |
-
{
|
19 |
-
"model_a": "Pix2PixZero",
|
20 |
-
"model_b": "MagicBrush",
|
21 |
-
"winner": "model_a",
|
22 |
-
"judge": "arena_user_::1",
|
23 |
-
"anony": true,
|
24 |
-
"tstamp": 1707712896.0427
|
25 |
-
},
|
26 |
-
{
|
27 |
-
"model_a": "CycleDiffusion",
|
28 |
-
"model_b": "InstructPix2Pix",
|
29 |
-
"winner": "model_b",
|
30 |
-
"judge": "arena_user_::1",
|
31 |
-
"anony": false,
|
32 |
-
"tstamp": 1707712929.7061
|
33 |
-
},
|
34 |
-
{
|
35 |
-
"model_a": "CycleDiffusion",
|
36 |
-
"model_b": "InstructPix2Pix",
|
37 |
-
"winner": "model_b",
|
38 |
-
"judge": "arena_user_::1",
|
39 |
-
"anony": true,
|
40 |
-
"tstamp": 1707713147.0445
|
41 |
-
},
|
42 |
-
{
|
43 |
-
"model_a": "CycleDiffusion",
|
44 |
-
"model_b": "PNP",
|
45 |
-
"winner": "model_b",
|
46 |
-
"judge": "arena_user_::1",
|
47 |
-
"anony": true,
|
48 |
-
"tstamp": 1707713198.9284
|
49 |
-
},
|
50 |
-
{
|
51 |
-
"model_a": "CycleDiffusion",
|
52 |
-
"model_b": "Prompt2prompt",
|
53 |
-
"winner": "model_b",
|
54 |
-
"judge": "arena_user_::1",
|
55 |
-
"anony": true,
|
56 |
-
"tstamp": 1707713210.1306
|
57 |
-
},
|
58 |
-
{
|
59 |
-
"model_a": "Prompt2prompt",
|
60 |
-
"model_b": "SDEdit",
|
61 |
-
"winner": "model_a",
|
62 |
-
"judge": "arena_user_::1",
|
63 |
-
"anony": true,
|
64 |
-
"tstamp": 1707713747.5115
|
65 |
-
},
|
66 |
-
{
|
67 |
-
"model_a": "PNP",
|
68 |
-
"model_b": "Pix2PixZero",
|
69 |
-
"winner": "model_a",
|
70 |
-
"judge": "arena_user_::1",
|
71 |
-
"anony": true,
|
72 |
-
"tstamp": 1707715613.7226
|
73 |
-
},
|
74 |
-
{
|
75 |
-
"model_a": "CycleDiffusion",
|
76 |
-
"model_b": "MagicBrush",
|
77 |
-
"winner": "model_b",
|
78 |
-
"judge": "arena_user_::1",
|
79 |
-
"anony": true,
|
80 |
-
"tstamp": 1707765708.2644
|
81 |
-
},
|
82 |
-
{
|
83 |
-
"model_a": "PNP",
|
84 |
-
"model_b": "CycleDiffusion",
|
85 |
-
"winner": "model_a",
|
86 |
-
"judge": "arena_user_::1",
|
87 |
-
"anony": true,
|
88 |
-
"tstamp": 1707765861.2742
|
89 |
-
},
|
90 |
-
{
|
91 |
-
"model_a": "PNP",
|
92 |
-
"model_b": "CycleDiffusion",
|
93 |
-
"winner": "model_a",
|
94 |
-
"judge": "arena_user_::1",
|
95 |
-
"anony": false,
|
96 |
-
"tstamp": 1707765975.0206
|
97 |
-
},
|
98 |
-
{
|
99 |
-
"model_a": "PNP",
|
100 |
-
"model_b": "CycleDiffusion",
|
101 |
-
"winner": "model_a",
|
102 |
-
"judge": "arena_user_::1",
|
103 |
-
"anony": true,
|
104 |
-
"tstamp": 1707768866.9065
|
105 |
-
},
|
106 |
-
{
|
107 |
-
"model_a": "SDEdit",
|
108 |
-
"model_b": "MagicBrush",
|
109 |
-
"winner": "model_b",
|
110 |
-
"judge": "arena_user_::1",
|
111 |
-
"anony": true,
|
112 |
-
"tstamp": 1707771673.2989
|
113 |
-
},
|
114 |
-
{
|
115 |
-
"model_a": "SDEdit",
|
116 |
-
"model_b": "MagicBrush",
|
117 |
-
"winner": "model_b",
|
118 |
-
"judge": "arena_user_::1",
|
119 |
-
"anony": true,
|
120 |
-
"tstamp": 1707784377.6617
|
121 |
-
},
|
122 |
-
{
|
123 |
-
"model_a": "SDEdit",
|
124 |
-
"model_b": "MagicBrush",
|
125 |
-
"winner": "model_b",
|
126 |
-
"judge": "arena_user_::1",
|
127 |
-
"anony": true,
|
128 |
-
"tstamp": 1707784466.8915
|
129 |
-
},
|
130 |
-
{
|
131 |
-
"model_a": "CycleDiffusion",
|
132 |
-
"model_b": "PNP",
|
133 |
-
"winner": "model_b",
|
134 |
-
"judge": "arena_user_::1",
|
135 |
-
"anony": true,
|
136 |
-
"tstamp": 1707784983.9581
|
137 |
-
},
|
138 |
-
{
|
139 |
-
"model_a": "MagicBrush",
|
140 |
-
"model_b": "SDEdit",
|
141 |
-
"winner": "model_a",
|
142 |
-
"judge": "arena_user_::1",
|
143 |
-
"anony": true,
|
144 |
-
"tstamp": 1707785277.16
|
145 |
-
},
|
146 |
-
{
|
147 |
-
"model_a": "MagicBrush",
|
148 |
-
"model_b": "SDEdit",
|
149 |
-
"winner": "model_a",
|
150 |
-
"judge": "arena_user_::1",
|
151 |
-
"anony": true,
|
152 |
-
"tstamp": 1707795299.0619
|
153 |
-
},
|
154 |
-
{
|
155 |
-
"model_a": "MagicBrush",
|
156 |
-
"model_b": "SDEdit",
|
157 |
-
"winner": "tie (bothbad)",
|
158 |
-
"judge": "arena_user_::1",
|
159 |
-
"anony": true,
|
160 |
-
"tstamp": 1707795798.752
|
161 |
-
},
|
162 |
-
{
|
163 |
-
"model_a": "SDEdit",
|
164 |
-
"model_b": "Prompt2prompt",
|
165 |
-
"winner": "model_b",
|
166 |
-
"judge": "arena_user_::1",
|
167 |
-
"anony": false,
|
168 |
-
"tstamp": 1707796435.7996
|
169 |
-
},
|
170 |
-
{
|
171 |
-
"model_a": "SDEdit",
|
172 |
-
"model_b": "CycleDiffusion",
|
173 |
-
"winner": "model_b",
|
174 |
-
"judge": "arena_user_::1",
|
175 |
-
"anony": false,
|
176 |
-
"tstamp": 1707797278.7369
|
177 |
-
},
|
178 |
-
{
|
179 |
-
"model_a": "SDEdit",
|
180 |
-
"model_b": "CycleDiffusion",
|
181 |
-
"winner": "model_a",
|
182 |
-
"judge": "arena_user_::1",
|
183 |
-
"anony": false,
|
184 |
-
"tstamp": 1707797279.6004
|
185 |
-
},
|
186 |
-
{
|
187 |
-
"model_a": "SDEdit",
|
188 |
-
"model_b": "Prompt2prompt",
|
189 |
-
"winner": "model_b",
|
190 |
-
"judge": "arena_user_::1",
|
191 |
-
"anony": true,
|
192 |
-
"tstamp": 1707805086.9739
|
193 |
-
},
|
194 |
-
{
|
195 |
-
"model_a": "PNP",
|
196 |
-
"model_b": "SDEdit",
|
197 |
-
"winner": "model_a",
|
198 |
-
"judge": "arena_user_::1",
|
199 |
-
"anony": true,
|
200 |
-
"tstamp": 1707805220.3253
|
201 |
-
},
|
202 |
-
{
|
203 |
-
"model_a": "InstructPix2Pix",
|
204 |
-
"model_b": "CycleDiffusion",
|
205 |
-
"winner": "tie (bothbad)",
|
206 |
-
"judge": "arena_user_::1",
|
207 |
-
"anony": true,
|
208 |
-
"tstamp": 1707805332.6322
|
209 |
-
},
|
210 |
-
{
|
211 |
-
"model_a": "InstructPix2Pix",
|
212 |
-
"model_b": "Prompt2prompt",
|
213 |
-
"winner": "model_b",
|
214 |
-
"judge": "arena_user_::1",
|
215 |
-
"anony": true,
|
216 |
-
"tstamp": 1707805476.0509
|
217 |
-
},
|
218 |
-
{
|
219 |
-
"model_a": "InstructPix2Pix",
|
220 |
-
"model_b": "Prompt2prompt",
|
221 |
-
"winner": "model_b",
|
222 |
-
"judge": "arena_user_::1",
|
223 |
-
"anony": true,
|
224 |
-
"tstamp": 1707818374.3438
|
225 |
-
},
|
226 |
-
{
|
227 |
-
"model_a": "PNP",
|
228 |
-
"model_b": "Prompt2prompt",
|
229 |
-
"winner": "model_b",
|
230 |
-
"judge": "arena_user_::1",
|
231 |
-
"anony": true,
|
232 |
-
"tstamp": 1707834631.9088
|
233 |
-
},
|
234 |
-
{
|
235 |
-
"model_a": "InstructPix2Pix",
|
236 |
-
"model_b": "SDEdit",
|
237 |
-
"winner": "model_a",
|
238 |
-
"judge": "arena_user_::1",
|
239 |
-
"anony": true,
|
240 |
-
"tstamp": 1707834954.0147
|
241 |
-
},
|
242 |
-
{
|
243 |
-
"model_a": "Prompt2prompt",
|
244 |
-
"model_b": "Pix2PixZero",
|
245 |
-
"winner": "tie (bothbad)",
|
246 |
-
"judge": "arena_user_::1",
|
247 |
-
"anony": true,
|
248 |
-
"tstamp": 1707835366.544
|
249 |
-
},
|
250 |
-
{
|
251 |
-
"model_a": "PNP",
|
252 |
-
"model_b": "SDEdit",
|
253 |
-
"winner": "model_a",
|
254 |
-
"judge": "arena_user_::1",
|
255 |
-
"anony": true,
|
256 |
-
"tstamp": 1707835643.6178
|
257 |
-
},
|
258 |
-
{
|
259 |
-
"model_a": "MagicBrush",
|
260 |
-
"model_b": "InstructPix2Pix",
|
261 |
-
"winner": "tie (bothbad)",
|
262 |
-
"judge": "arena_user_::1",
|
263 |
-
"anony": true,
|
264 |
-
"tstamp": 1707835789.25
|
265 |
-
},
|
266 |
-
{
|
267 |
-
"model_a": "MagicBrush",
|
268 |
-
"model_b": "PNP",
|
269 |
-
"winner": "tie (bothbad)",
|
270 |
-
"judge": "arena_user_::1",
|
271 |
-
"anony": true,
|
272 |
-
"tstamp": 1707836852.671
|
273 |
-
},
|
274 |
-
{
|
275 |
-
"model_a": "MagicBrush",
|
276 |
-
"model_b": "InstructPix2Pix",
|
277 |
-
"winner": "model_a",
|
278 |
-
"judge": "arena_user_::1",
|
279 |
-
"anony": false,
|
280 |
-
"tstamp": 1707836952.6082
|
281 |
-
},
|
282 |
-
{
|
283 |
-
"model_a": "CycleDiffusion",
|
284 |
-
"model_b": "SDEdit",
|
285 |
-
"winner": "tie (bothbad)",
|
286 |
-
"judge": "arena_user_::1",
|
287 |
-
"anony": false,
|
288 |
-
"tstamp": 1707837020.7148
|
289 |
-
},
|
290 |
-
{
|
291 |
-
"model_a": "InstructPix2Pix",
|
292 |
-
"model_b": "PNP",
|
293 |
-
"winner": "model_a",
|
294 |
-
"judge": "arena_user_::1",
|
295 |
-
"anony": true,
|
296 |
-
"tstamp": 1707837226.2259
|
297 |
-
},
|
298 |
-
{
|
299 |
-
"model_a": "Prompt2prompt",
|
300 |
-
"model_b": "Pix2PixZero",
|
301 |
-
"winner": "model_a",
|
302 |
-
"judge": "arena_user_::1",
|
303 |
-
"anony": true,
|
304 |
-
"tstamp": 1707838166.1449
|
305 |
-
},
|
306 |
-
{
|
307 |
-
"model_a": "InstructPix2Pix",
|
308 |
-
"model_b": "MagicBrush",
|
309 |
-
"winner": "tie (bothbad)",
|
310 |
-
"judge": "arena_user_::1",
|
311 |
-
"anony": true,
|
312 |
-
"tstamp": 1707838405.0013
|
313 |
-
},
|
314 |
-
{
|
315 |
-
"model_a": "MagicBrush",
|
316 |
-
"model_b": "CycleDiffusion",
|
317 |
-
"winner": "model_a",
|
318 |
-
"judge": "arena_user_::1",
|
319 |
-
"anony": true,
|
320 |
-
"tstamp": 1707839133.3126
|
321 |
-
},
|
322 |
-
{
|
323 |
-
"model_a": "Prompt2prompt",
|
324 |
-
"model_b": "InstructPix2Pix",
|
325 |
-
"winner": "model_a",
|
326 |
-
"judge": "arena_user_::1",
|
327 |
-
"anony": true,
|
328 |
-
"tstamp": 1707839484.6824
|
329 |
-
},
|
330 |
-
{
|
331 |
-
"model_a": "PNP",
|
332 |
-
"model_b": "InstructPix2Pix",
|
333 |
-
"winner": "tie (bothbad)",
|
334 |
-
"judge": "arena_user_::1",
|
335 |
-
"anony": true,
|
336 |
-
"tstamp": 1707850104.2499
|
337 |
-
},
|
338 |
-
{
|
339 |
-
"model_a": "InstructPix2Pix",
|
340 |
-
"model_b": "Pix2PixZero",
|
341 |
-
"winner": "model_a",
|
342 |
-
"judge": "arena_user_::1",
|
343 |
-
"anony": true,
|
344 |
-
"tstamp": 1707851384.7689
|
345 |
-
},
|
346 |
-
{
|
347 |
-
"model_a": "PNP",
|
348 |
-
"model_b": "MagicBrush",
|
349 |
-
"winner": "model_b",
|
350 |
-
"judge": "arena_user_::1",
|
351 |
-
"anony": true,
|
352 |
-
"tstamp": 1707851936.9466
|
353 |
-
},
|
354 |
-
{
|
355 |
-
"model_a": "CycleDiffusion",
|
356 |
-
"model_b": "MagicBrush",
|
357 |
-
"winner": "tie (bothbad)",
|
358 |
-
"judge": "arena_user_::1",
|
359 |
-
"anony": true,
|
360 |
-
"tstamp": 1707852836.3291
|
361 |
-
},
|
362 |
-
{
|
363 |
-
"model_a": "CycleDiffusion",
|
364 |
-
"model_b": "MagicBrush",
|
365 |
-
"winner": "tie (bothbad)",
|
366 |
-
"judge": "arena_user_::1",
|
367 |
-
"anony": false,
|
368 |
-
"tstamp": 1707852878.673
|
369 |
-
},
|
370 |
-
{
|
371 |
-
"model_a": "Prompt2prompt",
|
372 |
-
"model_b": "InstructPix2Pix",
|
373 |
-
"winner": "model_a",
|
374 |
-
"judge": "arena_user_::1",
|
375 |
-
"anony": true,
|
376 |
-
"tstamp": 1707853008.1359
|
377 |
-
},
|
378 |
-
{
|
379 |
-
"model_a": "InstructPix2Pix",
|
380 |
-
"model_b": "Pix2PixZero",
|
381 |
-
"winner": "model_a",
|
382 |
-
"judge": "arena_user_::1",
|
383 |
-
"anony": false,
|
384 |
-
"tstamp": 1707856807.6229
|
385 |
-
},
|
386 |
-
{
|
387 |
-
"model_a": "MagicBrush",
|
388 |
-
"model_b": "Pix2PixZero",
|
389 |
-
"winner": "tie (bothbad)",
|
390 |
-
"judge": "arena_user_::1",
|
391 |
-
"anony": false,
|
392 |
-
"tstamp": 1707863740.3507
|
393 |
-
},
|
394 |
-
{
|
395 |
-
"model_a": "MagicBrush",
|
396 |
-
"model_b": "PNP",
|
397 |
-
"winner": "model_b",
|
398 |
-
"judge": "arena_user_::1",
|
399 |
-
"anony": true,
|
400 |
-
"tstamp": 1707866312.1118
|
401 |
-
},
|
402 |
-
{
|
403 |
-
"model_a": "Pix2PixZero",
|
404 |
-
"model_b": "Prompt2prompt",
|
405 |
-
"winner": "model_b",
|
406 |
-
"judge": "arena_user_::1",
|
407 |
-
"anony": true,
|
408 |
-
"tstamp": 1707883083.3533
|
409 |
-
},
|
410 |
-
{
|
411 |
-
"model_a": "Pix2PixZero",
|
412 |
-
"model_b": "InstructPix2Pix",
|
413 |
-
"winner": "model_b",
|
414 |
-
"judge": "arena_user_::1",
|
415 |
-
"anony": true,
|
416 |
-
"tstamp": 1707883181.1397
|
417 |
-
},
|
418 |
-
{
|
419 |
-
"model_a": "Pix2PixZero",
|
420 |
-
"model_b": "Prompt2prompt",
|
421 |
-
"winner": "model_b",
|
422 |
-
"judge": "arena_user_::1",
|
423 |
-
"anony": true,
|
424 |
-
"tstamp": 1707883187.9173
|
425 |
-
},
|
426 |
-
{
|
427 |
-
"model_a": "PNP",
|
428 |
-
"model_b": "Prompt2prompt",
|
429 |
-
"winner": "model_a",
|
430 |
-
"judge": "arena_user_::1",
|
431 |
-
"anony": true,
|
432 |
-
"tstamp": 1707883507.587
|
433 |
-
},
|
434 |
-
{
|
435 |
-
"model_a": "Prompt2prompt",
|
436 |
-
"model_b": "CycleDiffusion",
|
437 |
-
"winner": "model_a",
|
438 |
-
"judge": "arena_user_::1",
|
439 |
-
"anony": true,
|
440 |
-
"tstamp": 1707883939.6125
|
441 |
-
},
|
442 |
-
{
|
443 |
-
"model_a": "Prompt2prompt",
|
444 |
-
"model_b": "MagicBrush",
|
445 |
-
"winner": "model_b",
|
446 |
-
"judge": "arena_user_::1",
|
447 |
-
"anony": true,
|
448 |
-
"tstamp": 1707892689.4407
|
449 |
-
},
|
450 |
-
{
|
451 |
-
"model_a": "MagicBrush",
|
452 |
-
"model_b": "InstructPix2Pix",
|
453 |
-
"winner": "model_b",
|
454 |
-
"judge": "arena_user_::1",
|
455 |
-
"anony": true,
|
456 |
-
"tstamp": 1707908988.749
|
457 |
-
},
|
458 |
-
{
|
459 |
-
"model_a": "Prompt2prompt",
|
460 |
-
"model_b": "InstructPix2Pix",
|
461 |
-
"winner": "model_a",
|
462 |
-
"judge": "arena_user_::1",
|
463 |
-
"anony": true,
|
464 |
-
"tstamp": 1707912639.2701
|
465 |
-
},
|
466 |
-
{
|
467 |
-
"model_a": "MagicBrush",
|
468 |
-
"model_b": "Pix2PixZero",
|
469 |
-
"winner": "model_a",
|
470 |
-
"judge": "arena_user_::1",
|
471 |
-
"anony": false,
|
472 |
-
"tstamp": 1707917685.9574
|
473 |
-
},
|
474 |
-
{
|
475 |
-
"model_a": "MagicBrush",
|
476 |
-
"model_b": "InstructPix2Pix",
|
477 |
-
"winner": "tie (bothbad)",
|
478 |
-
"judge": "arena_user_::1",
|
479 |
-
"anony": false,
|
480 |
-
"tstamp": 1707919429.336
|
481 |
-
},
|
482 |
-
{
|
483 |
-
"model_a": "InstructPix2Pix",
|
484 |
-
"model_b": "CycleDiffusion",
|
485 |
-
"winner": "model_a",
|
486 |
-
"judge": "arena_user_::1",
|
487 |
-
"anony": true,
|
488 |
-
"tstamp": 1707932651.9192
|
489 |
-
},
|
490 |
-
{
|
491 |
-
"model_a": "MagicBrush",
|
492 |
-
"model_b": "InstructPix2Pix",
|
493 |
-
"winner": "model_a",
|
494 |
-
"judge": "arena_user_::1",
|
495 |
-
"anony": true,
|
496 |
-
"tstamp": 1707932749.3107
|
497 |
-
},
|
498 |
-
{
|
499 |
-
"model_a": "Prompt2prompt",
|
500 |
-
"model_b": "PNP",
|
501 |
-
"winner": "model_a",
|
502 |
-
"judge": "arena_user_::1",
|
503 |
-
"anony": true,
|
504 |
-
"tstamp": 1707933208.5797
|
505 |
-
},
|
506 |
-
{
|
507 |
-
"model_a": "MagicBrush",
|
508 |
-
"model_b": "Pix2PixZero",
|
509 |
-
"winner": "model_a",
|
510 |
-
"judge": "arena_user_::1",
|
511 |
-
"anony": false,
|
512 |
-
"tstamp": 1707945335.6341
|
513 |
-
},
|
514 |
-
{
|
515 |
-
"model_a": "MagicBrush",
|
516 |
-
"model_b": "PNP",
|
517 |
-
"winner": "model_a",
|
518 |
-
"judge": "arena_user_::1",
|
519 |
-
"anony": false,
|
520 |
-
"tstamp": 1708031168.6838
|
521 |
-
},
|
522 |
-
{
|
523 |
-
"model_a": "Pix2PixZero",
|
524 |
-
"model_b": "PNP",
|
525 |
-
"winner": "model_b",
|
526 |
-
"judge": "arena_user_::1",
|
527 |
-
"anony": false,
|
528 |
-
"tstamp": 1708038931.5388
|
529 |
-
},
|
530 |
-
{
|
531 |
-
"model_a": "Pix2PixZero",
|
532 |
-
"model_b": "CycleDiffusion",
|
533 |
-
"winner": "tie (bothbad)",
|
534 |
-
"judge": "arena_user_::1",
|
535 |
-
"anony": true,
|
536 |
-
"tstamp": 1708057382.78
|
537 |
-
},
|
538 |
-
{
|
539 |
-
"model_a": "PNP",
|
540 |
-
"model_b": "InstructPix2Pix",
|
541 |
-
"winner": "model_b",
|
542 |
-
"judge": "arena_user_::1",
|
543 |
-
"anony": true,
|
544 |
-
"tstamp": 1708093689.8237
|
545 |
-
},
|
546 |
-
{
|
547 |
-
"model_a": "MagicBrush",
|
548 |
-
"model_b": "PNP",
|
549 |
-
"winner": "model_b",
|
550 |
-
"judge": "arena_user_::1",
|
551 |
-
"anony": true,
|
552 |
-
"tstamp": 1708093910.4683
|
553 |
-
},
|
554 |
-
{
|
555 |
-
"model_a": "Pix2PixZero",
|
556 |
-
"model_b": "Prompt2prompt",
|
557 |
-
"winner": "model_b",
|
558 |
-
"judge": "arena_user_::1",
|
559 |
-
"anony": false,
|
560 |
-
"tstamp": 1708095090.8232
|
561 |
-
},
|
562 |
-
{
|
563 |
-
"model_a": "Pix2PixZero",
|
564 |
-
"model_b": "Prompt2prompt",
|
565 |
-
"winner": "model_a",
|
566 |
-
"judge": "arena_user_::1",
|
567 |
-
"anony": false,
|
568 |
-
"tstamp": 1708095305.4665
|
569 |
-
},
|
570 |
-
{
|
571 |
-
"model_a": "InstructPix2Pix",
|
572 |
-
"model_b": "Prompt2prompt",
|
573 |
-
"winner": "model_b",
|
574 |
-
"judge": "arena_user_::1",
|
575 |
-
"anony": true,
|
576 |
-
"tstamp": 1708140553.1694
|
577 |
-
},
|
578 |
-
{
|
579 |
-
"model_a": "MagicBrush",
|
580 |
-
"model_b": "Prompt2prompt",
|
581 |
-
"winner": "model_a",
|
582 |
-
"judge": "arena_user_::1",
|
583 |
-
"anony": true,
|
584 |
-
"tstamp": 1708145512.3656
|
585 |
-
},
|
586 |
-
{
|
587 |
-
"model_a": "Pix2PixZero",
|
588 |
-
"model_b": "Prompt2prompt",
|
589 |
-
"winner": "tie (bothbad)",
|
590 |
-
"judge": "arena_user_::1",
|
591 |
-
"anony": true,
|
592 |
-
"tstamp": 1708145724.4127
|
593 |
-
},
|
594 |
-
{
|
595 |
-
"model_a": "Pix2PixZero",
|
596 |
-
"model_b": "PNP",
|
597 |
-
"winner": "model_b",
|
598 |
-
"judge": "arena_user_::1",
|
599 |
-
"anony": true,
|
600 |
-
"tstamp": 1708146846.5098
|
601 |
-
},
|
602 |
-
{
|
603 |
-
"model_a": "PNP",
|
604 |
-
"model_b": "MagicBrush",
|
605 |
-
"winner": "model_a",
|
606 |
-
"judge": "arena_user_::1",
|
607 |
-
"anony": true,
|
608 |
-
"tstamp": 1708189738.4864
|
609 |
-
},
|
610 |
-
{
|
611 |
-
"model_a": "Prompt2prompt",
|
612 |
-
"model_b": "InstructPix2Pix",
|
613 |
-
"winner": "model_b",
|
614 |
-
"judge": "arena_user_::1",
|
615 |
-
"anony": true,
|
616 |
-
"tstamp": 1708235874.9246
|
617 |
-
},
|
618 |
-
{
|
619 |
-
"model_a": "Pix2PixZero",
|
620 |
-
"model_b": "PNP",
|
621 |
-
"winner": "model_b",
|
622 |
-
"judge": "arena_user_::1",
|
623 |
-
"anony": false,
|
624 |
-
"tstamp": 1708257619.7115
|
625 |
-
},
|
626 |
-
{
|
627 |
-
"model_a": "MagicBrush",
|
628 |
-
"model_b": "Pix2PixZero",
|
629 |
-
"winner": "tie (bothbad)",
|
630 |
-
"judge": "arena_user_::1",
|
631 |
-
"anony": true,
|
632 |
-
"tstamp": 1708341265.7655
|
633 |
-
},
|
634 |
-
{
|
635 |
-
"model_a": "MagicBrush",
|
636 |
-
"model_b": "InstructPix2Pix",
|
637 |
-
"winner": "model_b",
|
638 |
-
"judge": "arena_user_::1",
|
639 |
-
"anony": true,
|
640 |
-
"tstamp": 1708350183.3086
|
641 |
-
},
|
642 |
-
{
|
643 |
-
"model_a": "MagicBrush",
|
644 |
-
"model_b": "Pix2PixZero",
|
645 |
-
"winner": "tie (bothbad)",
|
646 |
-
"judge": "arena_user_::1",
|
647 |
-
"anony": true,
|
648 |
-
"tstamp": 1708399707.1681
|
649 |
-
},
|
650 |
-
{
|
651 |
-
"model_a": "PNP",
|
652 |
-
"model_b": "MagicBrush",
|
653 |
-
"winner": "model_a",
|
654 |
-
"judge": "arena_user_::1",
|
655 |
-
"anony": true,
|
656 |
-
"tstamp": 1708441502.4707
|
657 |
-
},
|
658 |
-
{
|
659 |
-
"model_a": "InstructPix2Pix",
|
660 |
-
"model_b": "MagicBrush",
|
661 |
-
"winner": "model_a",
|
662 |
-
"judge": "arena_user_::1",
|
663 |
-
"anony": true,
|
664 |
-
"tstamp": 1708441716.8195
|
665 |
-
},
|
666 |
-
{
|
667 |
-
"model_a": "InstructPix2Pix",
|
668 |
-
"model_b": "MagicBrush",
|
669 |
-
"winner": "model_b",
|
670 |
-
"judge": "arena_user_::1",
|
671 |
-
"anony": false,
|
672 |
-
"tstamp": 1708546759.2009
|
673 |
-
},
|
674 |
-
{
|
675 |
-
"model_a": "InstructPix2Pix",
|
676 |
-
"model_b": "MagicBrush",
|
677 |
-
"winner": "model_a",
|
678 |
-
"judge": "arena_user_::1",
|
679 |
-
"anony": false,
|
680 |
-
"tstamp": 1708546805.4892
|
681 |
-
},
|
682 |
-
{
|
683 |
-
"model_a": "Pix2PixZero",
|
684 |
-
"model_b": "CycleDiffusion",
|
685 |
-
"winner": "tie (bothbad)",
|
686 |
-
"judge": "arena_user_::1",
|
687 |
-
"anony": true,
|
688 |
-
"tstamp": 1708547082.7124
|
689 |
-
},
|
690 |
-
{
|
691 |
-
"model_a": "InstructPix2Pix",
|
692 |
-
"model_b": "MagicBrush",
|
693 |
-
"winner": "model_b",
|
694 |
-
"judge": "arena_user_::1",
|
695 |
-
"anony": false,
|
696 |
-
"tstamp": 1708547166.9685
|
697 |
-
},
|
698 |
-
{
|
699 |
-
"model_a": "InstructPix2Pix",
|
700 |
-
"model_b": "MagicBrush",
|
701 |
-
"winner": "model_b",
|
702 |
-
"judge": "arena_user_::1",
|
703 |
-
"anony": false,
|
704 |
-
"tstamp": 1708547293.7107
|
705 |
-
},
|
706 |
-
{
|
707 |
-
"model_a": "CycleDiffusion",
|
708 |
-
"model_b": "PNP",
|
709 |
-
"winner": "tie (bothbad)",
|
710 |
-
"judge": "arena_user_::1",
|
711 |
-
"anony": true,
|
712 |
-
"tstamp": 1708575046.0529
|
713 |
-
},
|
714 |
-
{
|
715 |
-
"model_a": "CycleDiffusion",
|
716 |
-
"model_b": "MagicBrush",
|
717 |
-
"winner": "tie (bothbad)",
|
718 |
-
"judge": "arena_user_::1",
|
719 |
-
"anony": true,
|
720 |
-
"tstamp": 1708615466.9264
|
721 |
-
},
|
722 |
-
{
|
723 |
-
"model_a": "CycleDiffusion",
|
724 |
-
"model_b": "MagicBrush",
|
725 |
-
"winner": "model_b",
|
726 |
-
"judge": "arena_user_::1",
|
727 |
-
"anony": false,
|
728 |
-
"tstamp": 1708615516.3341
|
729 |
-
},
|
730 |
-
{
|
731 |
-
"model_a": "InstructPix2Pix",
|
732 |
-
"model_b": "PNP",
|
733 |
-
"winner": "model_b",
|
734 |
-
"judge": "arena_user_::1",
|
735 |
-
"anony": false,
|
736 |
-
"tstamp": 1709205399.0098
|
737 |
-
},
|
738 |
-
{
|
739 |
-
"model_a": "InstructPix2Pix",
|
740 |
-
"model_b": "PNP",
|
741 |
-
"winner": "model_b",
|
742 |
-
"judge": "arena_user_::1",
|
743 |
-
"anony": false,
|
744 |
-
"tstamp": 1709205767.8923
|
745 |
-
},
|
746 |
-
{
|
747 |
-
"model_a": "PNP",
|
748 |
-
"model_b": "InstructPix2Pix",
|
749 |
-
"winner": "model_b",
|
750 |
-
"judge": "arena_user_::1",
|
751 |
-
"anony": true,
|
752 |
-
"tstamp": 1709443700.05
|
753 |
-
},
|
754 |
-
{
|
755 |
-
"model_a": "MagicBrush",
|
756 |
-
"model_b": "Pix2PixZero",
|
757 |
-
"winner": "model_a",
|
758 |
-
"judge": "arena_user_::1",
|
759 |
-
"anony": true,
|
760 |
-
"tstamp": 1709702898.9291
|
761 |
-
},
|
762 |
-
{
|
763 |
-
"model_a": "CycleDiffusion",
|
764 |
-
"model_b": "Prompt2prompt",
|
765 |
-
"winner": "tie (bothbad)",
|
766 |
-
"judge": "arena_user_::1",
|
767 |
-
"anony": true,
|
768 |
-
"tstamp": 1710091925.1861
|
769 |
-
},
|
770 |
-
{
|
771 |
-
"model_a": "MagicBrush",
|
772 |
-
"model_b": "InstructPix2Pix",
|
773 |
-
"winner": "tie (bothbad)",
|
774 |
-
"judge": "arena_user_::1",
|
775 |
-
"anony": true,
|
776 |
-
"tstamp": 1710517781.1525
|
777 |
-
},
|
778 |
-
{
|
779 |
-
"model_a": "MagicBrush",
|
780 |
-
"model_b": "InstructPix2Pix",
|
781 |
-
"winner": "tie (bothbad)",
|
782 |
-
"judge": "arena_user_::1",
|
783 |
-
"anony": false,
|
784 |
-
"tstamp": 1710517859.2942
|
785 |
-
},
|
786 |
-
{
|
787 |
-
"model_a": "Pix2PixZero",
|
788 |
-
"model_b": "CycleDiffusion",
|
789 |
-
"winner": "tie (bothbad)",
|
790 |
-
"judge": "arena_user_::1",
|
791 |
-
"anony": true,
|
792 |
-
"tstamp": 1710535672.9791
|
793 |
-
},
|
794 |
-
{
|
795 |
-
"model_a": "CycleDiffusion",
|
796 |
-
"model_b": "Pix2PixZero",
|
797 |
-
"winner": "model_b",
|
798 |
-
"judge": "arena_user_10.16.25.191",
|
799 |
-
"anony": true,
|
800 |
-
"tstamp": 1711610477.1213
|
801 |
-
},
|
802 |
-
{
|
803 |
-
"model_a": "CycleDiffusion",
|
804 |
-
"model_b": "Pix2PixZero",
|
805 |
-
"winner": "model_b",
|
806 |
-
"judge": "arena_user_10.16.7.189",
|
807 |
-
"anony": true,
|
808 |
-
"tstamp": 1711629129.3894
|
809 |
-
},
|
810 |
-
{
|
811 |
-
"model_a": "InstructPix2Pix",
|
812 |
-
"model_b": "CycleDiffusion",
|
813 |
-
"winner": "model_b",
|
814 |
-
"judge": "arena_user_10.16.7.189",
|
815 |
-
"anony": true,
|
816 |
-
"tstamp": 1711629705.2246
|
817 |
-
},
|
818 |
-
{
|
819 |
-
"model_a": "CycleDiffusion",
|
820 |
-
"model_b": "Pix2PixZero",
|
821 |
-
"winner": "model_b",
|
822 |
-
"judge": "arena_user_10.16.25.191",
|
823 |
-
"anony": true,
|
824 |
-
"tstamp": 1711630362.5575
|
825 |
-
},
|
826 |
-
{
|
827 |
-
"model_a": "MagicBrush",
|
828 |
-
"model_b": "SDEdit",
|
829 |
-
"winner": "model_a",
|
830 |
-
"judge": "arena_user_127.0.0.1",
|
831 |
-
"anony": true,
|
832 |
-
"tstamp": 1711631112.5207
|
833 |
-
},
|
834 |
-
{
|
835 |
-
"model_a": "Pix2PixZero",
|
836 |
-
"model_b": "Prompt2prompt",
|
837 |
-
"winner": "model_a",
|
838 |
-
"judge": "arena_user_10.16.41.118",
|
839 |
-
"anony": true,
|
840 |
-
"tstamp": 1711631690.5127
|
841 |
-
},
|
842 |
-
{
|
843 |
-
"model_a": "MagicBrush",
|
844 |
-
"model_b": "InstructPix2Pix",
|
845 |
-
"winner": "model_a",
|
846 |
-
"judge": "arena_user_127.0.0.1",
|
847 |
-
"anony": true,
|
848 |
-
"tstamp": 1711633200.2923
|
849 |
-
},
|
850 |
-
{
|
851 |
-
"model_a": "MagicBrush",
|
852 |
-
"model_b": "InstructPix2Pix",
|
853 |
-
"winner": "model_a",
|
854 |
-
"judge": "arena_user_127.0.0.1",
|
855 |
-
"anony": true,
|
856 |
-
"tstamp": 1711633594.9922
|
857 |
-
},
|
858 |
-
{
|
859 |
-
"model_a": "MagicBrush",
|
860 |
-
"model_b": "SDEdit",
|
861 |
-
"winner": "model_a",
|
862 |
-
"judge": "arena_user_10.16.7.189",
|
863 |
-
"anony": true,
|
864 |
-
"tstamp": 1711635443.3071
|
865 |
-
},
|
866 |
-
{
|
867 |
-
"model_a": "CycleDiffusion",
|
868 |
-
"model_b": "MagicBrush",
|
869 |
-
"winner": "model_b",
|
870 |
-
"judge": "arena_user_10.16.25.191",
|
871 |
-
"anony": true,
|
872 |
-
"tstamp": 1711635899.3088
|
873 |
-
},
|
874 |
-
{
|
875 |
-
"model_a": "SDEdit",
|
876 |
-
"model_b": "MagicBrush",
|
877 |
-
"winner": "model_b",
|
878 |
-
"judge": "arena_user_10.16.41.118",
|
879 |
-
"anony": true,
|
880 |
-
"tstamp": 1711639015.428
|
881 |
-
},
|
882 |
-
{
|
883 |
-
"model_a": "InstructPix2Pix",
|
884 |
-
"model_b": "MagicBrush",
|
885 |
-
"winner": "model_b",
|
886 |
-
"judge": "arena_user_10.16.7.189",
|
887 |
-
"anony": true,
|
888 |
-
"tstamp": 1711646372.1201
|
889 |
-
},
|
890 |
-
{
|
891 |
-
"model_a": "Pix2PixZero",
|
892 |
-
"model_b": "Prompt2prompt",
|
893 |
-
"winner": "model_b",
|
894 |
-
"judge": "arena_user_10.16.17.217",
|
895 |
-
"anony": true,
|
896 |
-
"tstamp": 1712873850.0636
|
897 |
-
},
|
898 |
-
{
|
899 |
-
"model_a": "MagicBrush",
|
900 |
-
"model_b": "SDEdit",
|
901 |
-
"winner": "tie (bothbad)",
|
902 |
-
"judge": "arena_user_10.16.25.191",
|
903 |
-
"anony": true,
|
904 |
-
"tstamp": 1712876598.7667
|
905 |
-
}
|
906 |
-
]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
arena_elo/results/20240411/clean_battle_t2i_generation.json
DELETED
The diff for this file is too large to render.
See raw diff
|
|
arena_elo/results/20240411/elo_results_image_editing.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:d66a54af51d2ecf89f461dbb4e15090d084638596952d3541ce369798a525ff3
|
3 |
-
size 57096
|
|
|
|
|
|
|
|
arena_elo/results/20240411/elo_results_t2i_generation.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:caf98f560387fa9d6b8c233e9915807adad62315cfdd6d4a5e7c9fda30140eb8
|
3 |
-
size 62422
|
|
|
|
|
|
|
|
arena_elo/results/20240411/image_editing_leaderboard.csv
DELETED
@@ -1,8 +0,0 @@
|
|
1 |
-
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
-
Prompt2prompt,Prompt2prompt,1188.219371435949,1160.9021011448333,Apache-2.0,"Google, Tel Aviv University",https://prompt-to-prompt.github.io
|
3 |
-
PNP,PNP,1133.8594830307645,1160.2784411172045,-,Weizmann Institute of Science,https://github.com/MichalGeyer/plug-and-play
|
4 |
-
InstructPix2Pix,InstructPix2Pix,1086.6617653998492,1065.4343032662,"Copyright 2023 Timothy Brooks, Aleksander Holynski, Alexei A. Efros","University of California, Berkeley",https://www.timothybrooks.com/instruct-pix2pix
|
5 |
-
MagicBrush,MagicBrush,1084.8708678670623,1120.3917913590851,CC-BY-4.0,"The Ohio State University, University of Waterloo",https://osu-nlp-group.github.io/MagicBrush
|
6 |
-
Pix2PixZero,Pix2PixZero,983.9050014855375,949.5286840298457,MIT License,"Carnegie Mellon University, Adobe Research",https://pix2pixzero.github.io
|
7 |
-
CycleDiffusion,CycleDiffusion,847.634435323394,811.6166545238106,X11,Carnegie Mellon University,https://github.com/ChenWu98/cycle-diffusion
|
8 |
-
SDEdit,SDEdit,674.8490754574439,731.8480245590208,MIT License,Stanford University,https://sde-image-editing.github.io
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
arena_elo/results/20240411/t2i_generation_leaderboard.csv
DELETED
@@ -1,10 +0,0 @@
|
|
1 |
-
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
-
PlayGround V2,PlayGround V2,1096.7894880225679,1099.8051043857877,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
|
3 |
-
PlayGround V2.5,PlayGround V2.5,1087.8676967844767,1102.012177335679,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
|
4 |
-
StableCascade,StableCascade,1055.9173326915914,1059.3764815279687,stable-cascade-nc-community (other),Stability AI,https://huggingface.co/stabilityai/stable-cascade
|
5 |
-
PixArtAlpha,PixArtAlpha,1033.9990481857885,1022.7034421485712,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
|
6 |
-
SDXLLightning,SDXLLightning,1033.7993884424232,1038.4887196068619,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
|
7 |
-
SDXL,SDXL,1001.9345229118052,1000.9893451213411,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
|
8 |
-
SDXLTurbo,SDXLTurbo,954.8868434684313,951.3491425503697,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
|
9 |
-
OpenJourney,OpenJourney,888.3709717134242,873.7483257587076,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
|
10 |
-
LCM,LCM,846.4347077794937,852.2372365264126,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
arena_elo/results/20240428/elo_results_image_editing.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:c1b4f1daab3429c7656eb8b3b2128a127480fa8212b17a1a98207884d7ce7a9f
|
3 |
-
size 58442
|
|
|
|
|
|
|
|
arena_elo/results/20240428/image_editing_leaderboard.csv
DELETED
@@ -1,8 +0,0 @@
|
|
1 |
-
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
-
Prompt2prompt,Prompt2prompt,1224.5951620965877,1133.887231157847,Apache-2.0,"Google, Tel Aviv University",https://prompt-to-prompt.github.io
|
3 |
-
InstructPix2Pix,InstructPix2Pix,1162.3591990023222,1059.7394666236296,"Copyright 2023 Timothy Brooks, Aleksander Holynski, Alexei A. Efros","University of California, Berkeley",https://www.timothybrooks.com/instruct-pix2pix
|
4 |
-
PNP,PNP,1142.872221219748,1117.461082043853,-,Weizmann Institute of Science,https://github.com/MichalGeyer/plug-and-play
|
5 |
-
MagicBrush,MagicBrush,1053.6353139288728,1055.6074426532264,CC-BY-4.0,"The Ohio State University, University of Waterloo",https://osu-nlp-group.github.io/MagicBrush
|
6 |
-
Pix2PixZero,Pix2PixZero,918.4266240422415,853.535635519584,MIT License,"Carnegie Mellon University, Adobe Research",https://pix2pixzero.github.io
|
7 |
-
CycleDiffusion,CycleDiffusion,865.2495984976465,775.6226309361784,X11,Carnegie Mellon University,https://github.com/ChenWu98/cycle-diffusion
|
8 |
-
SDEdit,SDEdit,632.8618812125814,680.2047869803968,MIT License,Stanford University,https://sde-image-editing.github.io
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
arena_elo/results/20240501/clean_battle_t2i_generation.json
DELETED
The diff for this file is too large to render.
See raw diff
|
|
arena_elo/results/20240501/elo_results_t2i_generation.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:9b79d128ba01570bc59c5f48e1c0640f2541817ce1a77abb3e16131884288b1a
|
3 |
-
size 65313
|
|
|
|
|
|
|
|
arena_elo/results/20240501/t2i_generation_leaderboard.csv
DELETED
@@ -1,11 +0,0 @@
|
|
1 |
-
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
-
PlayGround V2.5,PlayGround V2.5,1157.785440865029,1197.7936802344343,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
|
3 |
-
StableCascade,StableCascade,1116.6696847615349,1116.9442071854512,stable-cascade-nc-community (other),Stability AI,https://huggingface.co/stabilityai/stable-cascade
|
4 |
-
PlayGround V2,PlayGround V2,1110.1291971452683,1120.6591618464581,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
|
5 |
-
PixArtAlpha,PixArtAlpha,1042.1316579959862,1040.3305680293547,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
|
6 |
-
SDXLLightning,SDXLLightning,1036.0784815928241,1056.600050803737,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
|
7 |
-
SDXL,SDXL,987.5686859787551,1003.0595102032345,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
|
8 |
-
PixArtSigma,PixArtSigma,948.0067582557859,961.4040676622378,N/A,N/A,N/A
|
9 |
-
SDXLTurbo,SDXLTurbo,931.094996526404,945.5610964234802,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
|
10 |
-
OpenJourney,OpenJourney,855.7449360962327,860.1159058283633,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
|
11 |
-
LCM,LCM,814.7901607821794,840.5627577743975,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
arena_elo/results/20240516/clean_battle_image_editing.json
DELETED
@@ -1,1578 +0,0 @@
|
|
1 |
-
[
|
2 |
-
{
|
3 |
-
"model_a": "CycleDiffusion",
|
4 |
-
"model_b": "InstructPix2Pix",
|
5 |
-
"winner": "model_b",
|
6 |
-
"judge": "arena_user_::1",
|
7 |
-
"anony": true,
|
8 |
-
"tstamp": 1707712630.872
|
9 |
-
},
|
10 |
-
{
|
11 |
-
"model_a": "CycleDiffusion",
|
12 |
-
"model_b": "InstructPix2Pix",
|
13 |
-
"winner": "model_b",
|
14 |
-
"judge": "arena_user_::1",
|
15 |
-
"anony": false,
|
16 |
-
"tstamp": 1707712699.668
|
17 |
-
},
|
18 |
-
{
|
19 |
-
"model_a": "Pix2PixZero",
|
20 |
-
"model_b": "MagicBrush",
|
21 |
-
"winner": "model_a",
|
22 |
-
"judge": "arena_user_::1",
|
23 |
-
"anony": true,
|
24 |
-
"tstamp": 1707712896.0427
|
25 |
-
},
|
26 |
-
{
|
27 |
-
"model_a": "CycleDiffusion",
|
28 |
-
"model_b": "InstructPix2Pix",
|
29 |
-
"winner": "model_b",
|
30 |
-
"judge": "arena_user_::1",
|
31 |
-
"anony": false,
|
32 |
-
"tstamp": 1707712929.7061
|
33 |
-
},
|
34 |
-
{
|
35 |
-
"model_a": "CycleDiffusion",
|
36 |
-
"model_b": "InstructPix2Pix",
|
37 |
-
"winner": "model_b",
|
38 |
-
"judge": "arena_user_::1",
|
39 |
-
"anony": true,
|
40 |
-
"tstamp": 1707713147.0445
|
41 |
-
},
|
42 |
-
{
|
43 |
-
"model_a": "CycleDiffusion",
|
44 |
-
"model_b": "PNP",
|
45 |
-
"winner": "model_b",
|
46 |
-
"judge": "arena_user_::1",
|
47 |
-
"anony": true,
|
48 |
-
"tstamp": 1707713198.9284
|
49 |
-
},
|
50 |
-
{
|
51 |
-
"model_a": "CycleDiffusion",
|
52 |
-
"model_b": "Prompt2prompt",
|
53 |
-
"winner": "model_b",
|
54 |
-
"judge": "arena_user_::1",
|
55 |
-
"anony": true,
|
56 |
-
"tstamp": 1707713210.1306
|
57 |
-
},
|
58 |
-
{
|
59 |
-
"model_a": "Prompt2prompt",
|
60 |
-
"model_b": "SDEdit",
|
61 |
-
"winner": "model_a",
|
62 |
-
"judge": "arena_user_::1",
|
63 |
-
"anony": true,
|
64 |
-
"tstamp": 1707713747.5115
|
65 |
-
},
|
66 |
-
{
|
67 |
-
"model_a": "PNP",
|
68 |
-
"model_b": "Pix2PixZero",
|
69 |
-
"winner": "model_a",
|
70 |
-
"judge": "arena_user_::1",
|
71 |
-
"anony": true,
|
72 |
-
"tstamp": 1707715613.7226
|
73 |
-
},
|
74 |
-
{
|
75 |
-
"model_a": "CycleDiffusion",
|
76 |
-
"model_b": "MagicBrush",
|
77 |
-
"winner": "model_b",
|
78 |
-
"judge": "arena_user_::1",
|
79 |
-
"anony": true,
|
80 |
-
"tstamp": 1707765708.2644
|
81 |
-
},
|
82 |
-
{
|
83 |
-
"model_a": "PNP",
|
84 |
-
"model_b": "CycleDiffusion",
|
85 |
-
"winner": "model_a",
|
86 |
-
"judge": "arena_user_::1",
|
87 |
-
"anony": true,
|
88 |
-
"tstamp": 1707765861.2742
|
89 |
-
},
|
90 |
-
{
|
91 |
-
"model_a": "PNP",
|
92 |
-
"model_b": "CycleDiffusion",
|
93 |
-
"winner": "model_a",
|
94 |
-
"judge": "arena_user_::1",
|
95 |
-
"anony": false,
|
96 |
-
"tstamp": 1707765975.0206
|
97 |
-
},
|
98 |
-
{
|
99 |
-
"model_a": "PNP",
|
100 |
-
"model_b": "CycleDiffusion",
|
101 |
-
"winner": "model_a",
|
102 |
-
"judge": "arena_user_::1",
|
103 |
-
"anony": true,
|
104 |
-
"tstamp": 1707768866.9065
|
105 |
-
},
|
106 |
-
{
|
107 |
-
"model_a": "SDEdit",
|
108 |
-
"model_b": "MagicBrush",
|
109 |
-
"winner": "model_b",
|
110 |
-
"judge": "arena_user_::1",
|
111 |
-
"anony": true,
|
112 |
-
"tstamp": 1707771673.2989
|
113 |
-
},
|
114 |
-
{
|
115 |
-
"model_a": "SDEdit",
|
116 |
-
"model_b": "MagicBrush",
|
117 |
-
"winner": "model_b",
|
118 |
-
"judge": "arena_user_::1",
|
119 |
-
"anony": true,
|
120 |
-
"tstamp": 1707784377.6617
|
121 |
-
},
|
122 |
-
{
|
123 |
-
"model_a": "SDEdit",
|
124 |
-
"model_b": "MagicBrush",
|
125 |
-
"winner": "model_b",
|
126 |
-
"judge": "arena_user_::1",
|
127 |
-
"anony": true,
|
128 |
-
"tstamp": 1707784466.8915
|
129 |
-
},
|
130 |
-
{
|
131 |
-
"model_a": "CycleDiffusion",
|
132 |
-
"model_b": "PNP",
|
133 |
-
"winner": "model_b",
|
134 |
-
"judge": "arena_user_::1",
|
135 |
-
"anony": true,
|
136 |
-
"tstamp": 1707784983.9581
|
137 |
-
},
|
138 |
-
{
|
139 |
-
"model_a": "MagicBrush",
|
140 |
-
"model_b": "SDEdit",
|
141 |
-
"winner": "model_a",
|
142 |
-
"judge": "arena_user_::1",
|
143 |
-
"anony": true,
|
144 |
-
"tstamp": 1707785277.16
|
145 |
-
},
|
146 |
-
{
|
147 |
-
"model_a": "MagicBrush",
|
148 |
-
"model_b": "SDEdit",
|
149 |
-
"winner": "model_a",
|
150 |
-
"judge": "arena_user_::1",
|
151 |
-
"anony": true,
|
152 |
-
"tstamp": 1707795299.0619
|
153 |
-
},
|
154 |
-
{
|
155 |
-
"model_a": "MagicBrush",
|
156 |
-
"model_b": "SDEdit",
|
157 |
-
"winner": "tie (bothbad)",
|
158 |
-
"judge": "arena_user_::1",
|
159 |
-
"anony": true,
|
160 |
-
"tstamp": 1707795798.752
|
161 |
-
},
|
162 |
-
{
|
163 |
-
"model_a": "SDEdit",
|
164 |
-
"model_b": "Prompt2prompt",
|
165 |
-
"winner": "model_b",
|
166 |
-
"judge": "arena_user_::1",
|
167 |
-
"anony": false,
|
168 |
-
"tstamp": 1707796435.7996
|
169 |
-
},
|
170 |
-
{
|
171 |
-
"model_a": "SDEdit",
|
172 |
-
"model_b": "CycleDiffusion",
|
173 |
-
"winner": "model_b",
|
174 |
-
"judge": "arena_user_::1",
|
175 |
-
"anony": false,
|
176 |
-
"tstamp": 1707797278.7369
|
177 |
-
},
|
178 |
-
{
|
179 |
-
"model_a": "SDEdit",
|
180 |
-
"model_b": "CycleDiffusion",
|
181 |
-
"winner": "model_a",
|
182 |
-
"judge": "arena_user_::1",
|
183 |
-
"anony": false,
|
184 |
-
"tstamp": 1707797279.6004
|
185 |
-
},
|
186 |
-
{
|
187 |
-
"model_a": "SDEdit",
|
188 |
-
"model_b": "Prompt2prompt",
|
189 |
-
"winner": "model_b",
|
190 |
-
"judge": "arena_user_::1",
|
191 |
-
"anony": true,
|
192 |
-
"tstamp": 1707805086.9739
|
193 |
-
},
|
194 |
-
{
|
195 |
-
"model_a": "PNP",
|
196 |
-
"model_b": "SDEdit",
|
197 |
-
"winner": "model_a",
|
198 |
-
"judge": "arena_user_::1",
|
199 |
-
"anony": true,
|
200 |
-
"tstamp": 1707805220.3253
|
201 |
-
},
|
202 |
-
{
|
203 |
-
"model_a": "InstructPix2Pix",
|
204 |
-
"model_b": "CycleDiffusion",
|
205 |
-
"winner": "tie (bothbad)",
|
206 |
-
"judge": "arena_user_::1",
|
207 |
-
"anony": true,
|
208 |
-
"tstamp": 1707805332.6322
|
209 |
-
},
|
210 |
-
{
|
211 |
-
"model_a": "InstructPix2Pix",
|
212 |
-
"model_b": "Prompt2prompt",
|
213 |
-
"winner": "model_b",
|
214 |
-
"judge": "arena_user_::1",
|
215 |
-
"anony": true,
|
216 |
-
"tstamp": 1707805476.0509
|
217 |
-
},
|
218 |
-
{
|
219 |
-
"model_a": "InstructPix2Pix",
|
220 |
-
"model_b": "Prompt2prompt",
|
221 |
-
"winner": "model_b",
|
222 |
-
"judge": "arena_user_::1",
|
223 |
-
"anony": true,
|
224 |
-
"tstamp": 1707818374.3438
|
225 |
-
},
|
226 |
-
{
|
227 |
-
"model_a": "PNP",
|
228 |
-
"model_b": "Prompt2prompt",
|
229 |
-
"winner": "model_b",
|
230 |
-
"judge": "arena_user_::1",
|
231 |
-
"anony": true,
|
232 |
-
"tstamp": 1707834631.9088
|
233 |
-
},
|
234 |
-
{
|
235 |
-
"model_a": "InstructPix2Pix",
|
236 |
-
"model_b": "SDEdit",
|
237 |
-
"winner": "model_a",
|
238 |
-
"judge": "arena_user_::1",
|
239 |
-
"anony": true,
|
240 |
-
"tstamp": 1707834954.0147
|
241 |
-
},
|
242 |
-
{
|
243 |
-
"model_a": "Prompt2prompt",
|
244 |
-
"model_b": "Pix2PixZero",
|
245 |
-
"winner": "tie (bothbad)",
|
246 |
-
"judge": "arena_user_::1",
|
247 |
-
"anony": true,
|
248 |
-
"tstamp": 1707835366.544
|
249 |
-
},
|
250 |
-
{
|
251 |
-
"model_a": "PNP",
|
252 |
-
"model_b": "SDEdit",
|
253 |
-
"winner": "model_a",
|
254 |
-
"judge": "arena_user_::1",
|
255 |
-
"anony": true,
|
256 |
-
"tstamp": 1707835643.6178
|
257 |
-
},
|
258 |
-
{
|
259 |
-
"model_a": "MagicBrush",
|
260 |
-
"model_b": "InstructPix2Pix",
|
261 |
-
"winner": "tie (bothbad)",
|
262 |
-
"judge": "arena_user_::1",
|
263 |
-
"anony": true,
|
264 |
-
"tstamp": 1707835789.25
|
265 |
-
},
|
266 |
-
{
|
267 |
-
"model_a": "MagicBrush",
|
268 |
-
"model_b": "PNP",
|
269 |
-
"winner": "tie (bothbad)",
|
270 |
-
"judge": "arena_user_::1",
|
271 |
-
"anony": true,
|
272 |
-
"tstamp": 1707836852.671
|
273 |
-
},
|
274 |
-
{
|
275 |
-
"model_a": "MagicBrush",
|
276 |
-
"model_b": "InstructPix2Pix",
|
277 |
-
"winner": "model_a",
|
278 |
-
"judge": "arena_user_::1",
|
279 |
-
"anony": false,
|
280 |
-
"tstamp": 1707836952.6082
|
281 |
-
},
|
282 |
-
{
|
283 |
-
"model_a": "CycleDiffusion",
|
284 |
-
"model_b": "SDEdit",
|
285 |
-
"winner": "tie (bothbad)",
|
286 |
-
"judge": "arena_user_::1",
|
287 |
-
"anony": false,
|
288 |
-
"tstamp": 1707837020.7148
|
289 |
-
},
|
290 |
-
{
|
291 |
-
"model_a": "InstructPix2Pix",
|
292 |
-
"model_b": "PNP",
|
293 |
-
"winner": "model_a",
|
294 |
-
"judge": "arena_user_::1",
|
295 |
-
"anony": true,
|
296 |
-
"tstamp": 1707837226.2259
|
297 |
-
},
|
298 |
-
{
|
299 |
-
"model_a": "Prompt2prompt",
|
300 |
-
"model_b": "Pix2PixZero",
|
301 |
-
"winner": "model_a",
|
302 |
-
"judge": "arena_user_::1",
|
303 |
-
"anony": true,
|
304 |
-
"tstamp": 1707838166.1449
|
305 |
-
},
|
306 |
-
{
|
307 |
-
"model_a": "InstructPix2Pix",
|
308 |
-
"model_b": "MagicBrush",
|
309 |
-
"winner": "tie (bothbad)",
|
310 |
-
"judge": "arena_user_::1",
|
311 |
-
"anony": true,
|
312 |
-
"tstamp": 1707838405.0013
|
313 |
-
},
|
314 |
-
{
|
315 |
-
"model_a": "MagicBrush",
|
316 |
-
"model_b": "CycleDiffusion",
|
317 |
-
"winner": "model_a",
|
318 |
-
"judge": "arena_user_::1",
|
319 |
-
"anony": true,
|
320 |
-
"tstamp": 1707839133.3126
|
321 |
-
},
|
322 |
-
{
|
323 |
-
"model_a": "Prompt2prompt",
|
324 |
-
"model_b": "InstructPix2Pix",
|
325 |
-
"winner": "model_a",
|
326 |
-
"judge": "arena_user_::1",
|
327 |
-
"anony": true,
|
328 |
-
"tstamp": 1707839484.6824
|
329 |
-
},
|
330 |
-
{
|
331 |
-
"model_a": "PNP",
|
332 |
-
"model_b": "InstructPix2Pix",
|
333 |
-
"winner": "tie (bothbad)",
|
334 |
-
"judge": "arena_user_::1",
|
335 |
-
"anony": true,
|
336 |
-
"tstamp": 1707850104.2499
|
337 |
-
},
|
338 |
-
{
|
339 |
-
"model_a": "InstructPix2Pix",
|
340 |
-
"model_b": "Pix2PixZero",
|
341 |
-
"winner": "model_a",
|
342 |
-
"judge": "arena_user_::1",
|
343 |
-
"anony": true,
|
344 |
-
"tstamp": 1707851384.7689
|
345 |
-
},
|
346 |
-
{
|
347 |
-
"model_a": "PNP",
|
348 |
-
"model_b": "MagicBrush",
|
349 |
-
"winner": "model_b",
|
350 |
-
"judge": "arena_user_::1",
|
351 |
-
"anony": true,
|
352 |
-
"tstamp": 1707851936.9466
|
353 |
-
},
|
354 |
-
{
|
355 |
-
"model_a": "CycleDiffusion",
|
356 |
-
"model_b": "MagicBrush",
|
357 |
-
"winner": "tie (bothbad)",
|
358 |
-
"judge": "arena_user_::1",
|
359 |
-
"anony": true,
|
360 |
-
"tstamp": 1707852836.3291
|
361 |
-
},
|
362 |
-
{
|
363 |
-
"model_a": "CycleDiffusion",
|
364 |
-
"model_b": "MagicBrush",
|
365 |
-
"winner": "tie (bothbad)",
|
366 |
-
"judge": "arena_user_::1",
|
367 |
-
"anony": false,
|
368 |
-
"tstamp": 1707852878.673
|
369 |
-
},
|
370 |
-
{
|
371 |
-
"model_a": "Prompt2prompt",
|
372 |
-
"model_b": "InstructPix2Pix",
|
373 |
-
"winner": "model_a",
|
374 |
-
"judge": "arena_user_::1",
|
375 |
-
"anony": true,
|
376 |
-
"tstamp": 1707853008.1359
|
377 |
-
},
|
378 |
-
{
|
379 |
-
"model_a": "InstructPix2Pix",
|
380 |
-
"model_b": "Pix2PixZero",
|
381 |
-
"winner": "model_a",
|
382 |
-
"judge": "arena_user_::1",
|
383 |
-
"anony": false,
|
384 |
-
"tstamp": 1707856807.6229
|
385 |
-
},
|
386 |
-
{
|
387 |
-
"model_a": "MagicBrush",
|
388 |
-
"model_b": "Pix2PixZero",
|
389 |
-
"winner": "tie (bothbad)",
|
390 |
-
"judge": "arena_user_::1",
|
391 |
-
"anony": false,
|
392 |
-
"tstamp": 1707863740.3507
|
393 |
-
},
|
394 |
-
{
|
395 |
-
"model_a": "MagicBrush",
|
396 |
-
"model_b": "PNP",
|
397 |
-
"winner": "model_b",
|
398 |
-
"judge": "arena_user_::1",
|
399 |
-
"anony": true,
|
400 |
-
"tstamp": 1707866312.1118
|
401 |
-
},
|
402 |
-
{
|
403 |
-
"model_a": "Pix2PixZero",
|
404 |
-
"model_b": "Prompt2prompt",
|
405 |
-
"winner": "model_b",
|
406 |
-
"judge": "arena_user_::1",
|
407 |
-
"anony": true,
|
408 |
-
"tstamp": 1707883083.3533
|
409 |
-
},
|
410 |
-
{
|
411 |
-
"model_a": "Pix2PixZero",
|
412 |
-
"model_b": "InstructPix2Pix",
|
413 |
-
"winner": "model_b",
|
414 |
-
"judge": "arena_user_::1",
|
415 |
-
"anony": true,
|
416 |
-
"tstamp": 1707883181.1397
|
417 |
-
},
|
418 |
-
{
|
419 |
-
"model_a": "Pix2PixZero",
|
420 |
-
"model_b": "Prompt2prompt",
|
421 |
-
"winner": "model_b",
|
422 |
-
"judge": "arena_user_::1",
|
423 |
-
"anony": true,
|
424 |
-
"tstamp": 1707883187.9173
|
425 |
-
},
|
426 |
-
{
|
427 |
-
"model_a": "PNP",
|
428 |
-
"model_b": "Prompt2prompt",
|
429 |
-
"winner": "model_a",
|
430 |
-
"judge": "arena_user_::1",
|
431 |
-
"anony": true,
|
432 |
-
"tstamp": 1707883507.587
|
433 |
-
},
|
434 |
-
{
|
435 |
-
"model_a": "Prompt2prompt",
|
436 |
-
"model_b": "CycleDiffusion",
|
437 |
-
"winner": "model_a",
|
438 |
-
"judge": "arena_user_::1",
|
439 |
-
"anony": true,
|
440 |
-
"tstamp": 1707883939.6125
|
441 |
-
},
|
442 |
-
{
|
443 |
-
"model_a": "Prompt2prompt",
|
444 |
-
"model_b": "MagicBrush",
|
445 |
-
"winner": "model_b",
|
446 |
-
"judge": "arena_user_::1",
|
447 |
-
"anony": true,
|
448 |
-
"tstamp": 1707892689.4407
|
449 |
-
},
|
450 |
-
{
|
451 |
-
"model_a": "MagicBrush",
|
452 |
-
"model_b": "InstructPix2Pix",
|
453 |
-
"winner": "model_b",
|
454 |
-
"judge": "arena_user_::1",
|
455 |
-
"anony": true,
|
456 |
-
"tstamp": 1707908988.749
|
457 |
-
},
|
458 |
-
{
|
459 |
-
"model_a": "Prompt2prompt",
|
460 |
-
"model_b": "InstructPix2Pix",
|
461 |
-
"winner": "model_a",
|
462 |
-
"judge": "arena_user_::1",
|
463 |
-
"anony": true,
|
464 |
-
"tstamp": 1707912639.2701
|
465 |
-
},
|
466 |
-
{
|
467 |
-
"model_a": "MagicBrush",
|
468 |
-
"model_b": "Pix2PixZero",
|
469 |
-
"winner": "model_a",
|
470 |
-
"judge": "arena_user_::1",
|
471 |
-
"anony": false,
|
472 |
-
"tstamp": 1707917685.9574
|
473 |
-
},
|
474 |
-
{
|
475 |
-
"model_a": "MagicBrush",
|
476 |
-
"model_b": "InstructPix2Pix",
|
477 |
-
"winner": "tie (bothbad)",
|
478 |
-
"judge": "arena_user_::1",
|
479 |
-
"anony": false,
|
480 |
-
"tstamp": 1707919429.336
|
481 |
-
},
|
482 |
-
{
|
483 |
-
"model_a": "InstructPix2Pix",
|
484 |
-
"model_b": "CycleDiffusion",
|
485 |
-
"winner": "model_a",
|
486 |
-
"judge": "arena_user_::1",
|
487 |
-
"anony": true,
|
488 |
-
"tstamp": 1707932651.9192
|
489 |
-
},
|
490 |
-
{
|
491 |
-
"model_a": "MagicBrush",
|
492 |
-
"model_b": "InstructPix2Pix",
|
493 |
-
"winner": "model_a",
|
494 |
-
"judge": "arena_user_::1",
|
495 |
-
"anony": true,
|
496 |
-
"tstamp": 1707932749.3107
|
497 |
-
},
|
498 |
-
{
|
499 |
-
"model_a": "Prompt2prompt",
|
500 |
-
"model_b": "PNP",
|
501 |
-
"winner": "model_a",
|
502 |
-
"judge": "arena_user_::1",
|
503 |
-
"anony": true,
|
504 |
-
"tstamp": 1707933208.5797
|
505 |
-
},
|
506 |
-
{
|
507 |
-
"model_a": "MagicBrush",
|
508 |
-
"model_b": "Pix2PixZero",
|
509 |
-
"winner": "model_a",
|
510 |
-
"judge": "arena_user_::1",
|
511 |
-
"anony": false,
|
512 |
-
"tstamp": 1707945335.6341
|
513 |
-
},
|
514 |
-
{
|
515 |
-
"model_a": "MagicBrush",
|
516 |
-
"model_b": "PNP",
|
517 |
-
"winner": "model_a",
|
518 |
-
"judge": "arena_user_::1",
|
519 |
-
"anony": false,
|
520 |
-
"tstamp": 1708031168.6838
|
521 |
-
},
|
522 |
-
{
|
523 |
-
"model_a": "Pix2PixZero",
|
524 |
-
"model_b": "PNP",
|
525 |
-
"winner": "model_b",
|
526 |
-
"judge": "arena_user_::1",
|
527 |
-
"anony": false,
|
528 |
-
"tstamp": 1708038931.5388
|
529 |
-
},
|
530 |
-
{
|
531 |
-
"model_a": "Pix2PixZero",
|
532 |
-
"model_b": "CycleDiffusion",
|
533 |
-
"winner": "tie (bothbad)",
|
534 |
-
"judge": "arena_user_::1",
|
535 |
-
"anony": true,
|
536 |
-
"tstamp": 1708057382.78
|
537 |
-
},
|
538 |
-
{
|
539 |
-
"model_a": "PNP",
|
540 |
-
"model_b": "InstructPix2Pix",
|
541 |
-
"winner": "model_b",
|
542 |
-
"judge": "arena_user_::1",
|
543 |
-
"anony": true,
|
544 |
-
"tstamp": 1708093689.8237
|
545 |
-
},
|
546 |
-
{
|
547 |
-
"model_a": "MagicBrush",
|
548 |
-
"model_b": "PNP",
|
549 |
-
"winner": "model_b",
|
550 |
-
"judge": "arena_user_::1",
|
551 |
-
"anony": true,
|
552 |
-
"tstamp": 1708093910.4683
|
553 |
-
},
|
554 |
-
{
|
555 |
-
"model_a": "Pix2PixZero",
|
556 |
-
"model_b": "Prompt2prompt",
|
557 |
-
"winner": "model_b",
|
558 |
-
"judge": "arena_user_::1",
|
559 |
-
"anony": false,
|
560 |
-
"tstamp": 1708095090.8232
|
561 |
-
},
|
562 |
-
{
|
563 |
-
"model_a": "Pix2PixZero",
|
564 |
-
"model_b": "Prompt2prompt",
|
565 |
-
"winner": "model_a",
|
566 |
-
"judge": "arena_user_::1",
|
567 |
-
"anony": false,
|
568 |
-
"tstamp": 1708095305.4665
|
569 |
-
},
|
570 |
-
{
|
571 |
-
"model_a": "InstructPix2Pix",
|
572 |
-
"model_b": "Prompt2prompt",
|
573 |
-
"winner": "model_b",
|
574 |
-
"judge": "arena_user_::1",
|
575 |
-
"anony": true,
|
576 |
-
"tstamp": 1708140553.1694
|
577 |
-
},
|
578 |
-
{
|
579 |
-
"model_a": "MagicBrush",
|
580 |
-
"model_b": "Prompt2prompt",
|
581 |
-
"winner": "model_a",
|
582 |
-
"judge": "arena_user_::1",
|
583 |
-
"anony": true,
|
584 |
-
"tstamp": 1708145512.3656
|
585 |
-
},
|
586 |
-
{
|
587 |
-
"model_a": "Pix2PixZero",
|
588 |
-
"model_b": "Prompt2prompt",
|
589 |
-
"winner": "tie (bothbad)",
|
590 |
-
"judge": "arena_user_::1",
|
591 |
-
"anony": true,
|
592 |
-
"tstamp": 1708145724.4127
|
593 |
-
},
|
594 |
-
{
|
595 |
-
"model_a": "Pix2PixZero",
|
596 |
-
"model_b": "PNP",
|
597 |
-
"winner": "model_b",
|
598 |
-
"judge": "arena_user_::1",
|
599 |
-
"anony": true,
|
600 |
-
"tstamp": 1708146846.5098
|
601 |
-
},
|
602 |
-
{
|
603 |
-
"model_a": "PNP",
|
604 |
-
"model_b": "MagicBrush",
|
605 |
-
"winner": "model_a",
|
606 |
-
"judge": "arena_user_::1",
|
607 |
-
"anony": true,
|
608 |
-
"tstamp": 1708189738.4864
|
609 |
-
},
|
610 |
-
{
|
611 |
-
"model_a": "Prompt2prompt",
|
612 |
-
"model_b": "InstructPix2Pix",
|
613 |
-
"winner": "model_b",
|
614 |
-
"judge": "arena_user_::1",
|
615 |
-
"anony": true,
|
616 |
-
"tstamp": 1708235874.9246
|
617 |
-
},
|
618 |
-
{
|
619 |
-
"model_a": "Pix2PixZero",
|
620 |
-
"model_b": "PNP",
|
621 |
-
"winner": "model_b",
|
622 |
-
"judge": "arena_user_::1",
|
623 |
-
"anony": false,
|
624 |
-
"tstamp": 1708257619.7115
|
625 |
-
},
|
626 |
-
{
|
627 |
-
"model_a": "MagicBrush",
|
628 |
-
"model_b": "Pix2PixZero",
|
629 |
-
"winner": "tie (bothbad)",
|
630 |
-
"judge": "arena_user_::1",
|
631 |
-
"anony": true,
|
632 |
-
"tstamp": 1708341265.7655
|
633 |
-
},
|
634 |
-
{
|
635 |
-
"model_a": "MagicBrush",
|
636 |
-
"model_b": "InstructPix2Pix",
|
637 |
-
"winner": "model_b",
|
638 |
-
"judge": "arena_user_::1",
|
639 |
-
"anony": true,
|
640 |
-
"tstamp": 1708350183.3086
|
641 |
-
},
|
642 |
-
{
|
643 |
-
"model_a": "MagicBrush",
|
644 |
-
"model_b": "Pix2PixZero",
|
645 |
-
"winner": "tie (bothbad)",
|
646 |
-
"judge": "arena_user_::1",
|
647 |
-
"anony": true,
|
648 |
-
"tstamp": 1708399707.1681
|
649 |
-
},
|
650 |
-
{
|
651 |
-
"model_a": "PNP",
|
652 |
-
"model_b": "MagicBrush",
|
653 |
-
"winner": "model_a",
|
654 |
-
"judge": "arena_user_::1",
|
655 |
-
"anony": true,
|
656 |
-
"tstamp": 1708441502.4707
|
657 |
-
},
|
658 |
-
{
|
659 |
-
"model_a": "InstructPix2Pix",
|
660 |
-
"model_b": "MagicBrush",
|
661 |
-
"winner": "model_a",
|
662 |
-
"judge": "arena_user_::1",
|
663 |
-
"anony": true,
|
664 |
-
"tstamp": 1708441716.8195
|
665 |
-
},
|
666 |
-
{
|
667 |
-
"model_a": "InstructPix2Pix",
|
668 |
-
"model_b": "MagicBrush",
|
669 |
-
"winner": "model_b",
|
670 |
-
"judge": "arena_user_::1",
|
671 |
-
"anony": false,
|
672 |
-
"tstamp": 1708546759.2009
|
673 |
-
},
|
674 |
-
{
|
675 |
-
"model_a": "InstructPix2Pix",
|
676 |
-
"model_b": "MagicBrush",
|
677 |
-
"winner": "model_a",
|
678 |
-
"judge": "arena_user_::1",
|
679 |
-
"anony": false,
|
680 |
-
"tstamp": 1708546805.4892
|
681 |
-
},
|
682 |
-
{
|
683 |
-
"model_a": "Pix2PixZero",
|
684 |
-
"model_b": "CycleDiffusion",
|
685 |
-
"winner": "tie (bothbad)",
|
686 |
-
"judge": "arena_user_::1",
|
687 |
-
"anony": true,
|
688 |
-
"tstamp": 1708547082.7124
|
689 |
-
},
|
690 |
-
{
|
691 |
-
"model_a": "InstructPix2Pix",
|
692 |
-
"model_b": "MagicBrush",
|
693 |
-
"winner": "model_b",
|
694 |
-
"judge": "arena_user_::1",
|
695 |
-
"anony": false,
|
696 |
-
"tstamp": 1708547166.9685
|
697 |
-
},
|
698 |
-
{
|
699 |
-
"model_a": "InstructPix2Pix",
|
700 |
-
"model_b": "MagicBrush",
|
701 |
-
"winner": "model_b",
|
702 |
-
"judge": "arena_user_::1",
|
703 |
-
"anony": false,
|
704 |
-
"tstamp": 1708547293.7107
|
705 |
-
},
|
706 |
-
{
|
707 |
-
"model_a": "CycleDiffusion",
|
708 |
-
"model_b": "PNP",
|
709 |
-
"winner": "tie (bothbad)",
|
710 |
-
"judge": "arena_user_::1",
|
711 |
-
"anony": true,
|
712 |
-
"tstamp": 1708575046.0529
|
713 |
-
},
|
714 |
-
{
|
715 |
-
"model_a": "CycleDiffusion",
|
716 |
-
"model_b": "MagicBrush",
|
717 |
-
"winner": "tie (bothbad)",
|
718 |
-
"judge": "arena_user_::1",
|
719 |
-
"anony": true,
|
720 |
-
"tstamp": 1708615466.9264
|
721 |
-
},
|
722 |
-
{
|
723 |
-
"model_a": "CycleDiffusion",
|
724 |
-
"model_b": "MagicBrush",
|
725 |
-
"winner": "model_b",
|
726 |
-
"judge": "arena_user_::1",
|
727 |
-
"anony": false,
|
728 |
-
"tstamp": 1708615516.3341
|
729 |
-
},
|
730 |
-
{
|
731 |
-
"model_a": "InstructPix2Pix",
|
732 |
-
"model_b": "PNP",
|
733 |
-
"winner": "model_b",
|
734 |
-
"judge": "arena_user_::1",
|
735 |
-
"anony": false,
|
736 |
-
"tstamp": 1709205399.0098
|
737 |
-
},
|
738 |
-
{
|
739 |
-
"model_a": "InstructPix2Pix",
|
740 |
-
"model_b": "PNP",
|
741 |
-
"winner": "model_b",
|
742 |
-
"judge": "arena_user_::1",
|
743 |
-
"anony": false,
|
744 |
-
"tstamp": 1709205767.8923
|
745 |
-
},
|
746 |
-
{
|
747 |
-
"model_a": "PNP",
|
748 |
-
"model_b": "InstructPix2Pix",
|
749 |
-
"winner": "model_b",
|
750 |
-
"judge": "arena_user_::1",
|
751 |
-
"anony": true,
|
752 |
-
"tstamp": 1709443700.05
|
753 |
-
},
|
754 |
-
{
|
755 |
-
"model_a": "MagicBrush",
|
756 |
-
"model_b": "Pix2PixZero",
|
757 |
-
"winner": "model_a",
|
758 |
-
"judge": "arena_user_::1",
|
759 |
-
"anony": true,
|
760 |
-
"tstamp": 1709702898.9291
|
761 |
-
},
|
762 |
-
{
|
763 |
-
"model_a": "CycleDiffusion",
|
764 |
-
"model_b": "Prompt2prompt",
|
765 |
-
"winner": "tie (bothbad)",
|
766 |
-
"judge": "arena_user_::1",
|
767 |
-
"anony": true,
|
768 |
-
"tstamp": 1710091925.1861
|
769 |
-
},
|
770 |
-
{
|
771 |
-
"model_a": "MagicBrush",
|
772 |
-
"model_b": "InstructPix2Pix",
|
773 |
-
"winner": "tie (bothbad)",
|
774 |
-
"judge": "arena_user_::1",
|
775 |
-
"anony": true,
|
776 |
-
"tstamp": 1710517781.1525
|
777 |
-
},
|
778 |
-
{
|
779 |
-
"model_a": "MagicBrush",
|
780 |
-
"model_b": "InstructPix2Pix",
|
781 |
-
"winner": "tie (bothbad)",
|
782 |
-
"judge": "arena_user_::1",
|
783 |
-
"anony": false,
|
784 |
-
"tstamp": 1710517859.2942
|
785 |
-
},
|
786 |
-
{
|
787 |
-
"model_a": "Pix2PixZero",
|
788 |
-
"model_b": "CycleDiffusion",
|
789 |
-
"winner": "tie (bothbad)",
|
790 |
-
"judge": "arena_user_::1",
|
791 |
-
"anony": true,
|
792 |
-
"tstamp": 1710535672.9791
|
793 |
-
},
|
794 |
-
{
|
795 |
-
"model_a": "InfEdit",
|
796 |
-
"model_b": "MagicBrush",
|
797 |
-
"winner": "model_a",
|
798 |
-
"judge": "arena_user_10.16.25.191",
|
799 |
-
"anony": false,
|
800 |
-
"tstamp": 1714359818.6646
|
801 |
-
},
|
802 |
-
{
|
803 |
-
"model_a": "InstructPix2Pix",
|
804 |
-
"model_b": "Prompt2prompt",
|
805 |
-
"winner": "tie (bothbad)",
|
806 |
-
"judge": "arena_user_10.16.25.191",
|
807 |
-
"anony": true,
|
808 |
-
"tstamp": 1714363016.9972
|
809 |
-
},
|
810 |
-
{
|
811 |
-
"model_a": "InfEdit",
|
812 |
-
"model_b": "CosXLEdit",
|
813 |
-
"winner": "model_a",
|
814 |
-
"judge": "arena_user_10.16.25.191",
|
815 |
-
"anony": true,
|
816 |
-
"tstamp": 1714715956.3416
|
817 |
-
},
|
818 |
-
{
|
819 |
-
"model_a": "Pix2PixZero",
|
820 |
-
"model_b": "Prompt2prompt",
|
821 |
-
"winner": "tie (bothbad)",
|
822 |
-
"judge": "arena_user_10.16.2.201",
|
823 |
-
"anony": false,
|
824 |
-
"tstamp": 1714759928.3804
|
825 |
-
},
|
826 |
-
{
|
827 |
-
"model_a": "PNP",
|
828 |
-
"model_b": "InstructPix2Pix",
|
829 |
-
"winner": "model_a",
|
830 |
-
"judge": "arena_user_10.16.17.217",
|
831 |
-
"anony": true,
|
832 |
-
"tstamp": 1715246275.0118
|
833 |
-
},
|
834 |
-
{
|
835 |
-
"model_a": "SDEdit",
|
836 |
-
"model_b": "CosXLEdit",
|
837 |
-
"winner": "tie (bothbad)",
|
838 |
-
"judge": "arena_user_10.16.15.199",
|
839 |
-
"anony": true,
|
840 |
-
"tstamp": 1715247590.2235
|
841 |
-
},
|
842 |
-
{
|
843 |
-
"model_a": "CycleDiffusion",
|
844 |
-
"model_b": "CosXLEdit",
|
845 |
-
"winner": "model_b",
|
846 |
-
"judge": "arena_user_10.16.41.118",
|
847 |
-
"anony": false,
|
848 |
-
"tstamp": 1715406266.2562
|
849 |
-
},
|
850 |
-
{
|
851 |
-
"model_a": "CycleDiffusion",
|
852 |
-
"model_b": "CosXLEdit",
|
853 |
-
"winner": "model_a",
|
854 |
-
"judge": "arena_user_10.16.41.118",
|
855 |
-
"anony": false,
|
856 |
-
"tstamp": 1715406354.5284
|
857 |
-
},
|
858 |
-
{
|
859 |
-
"model_a": "CycleDiffusion",
|
860 |
-
"model_b": "CosXLEdit",
|
861 |
-
"winner": "model_b",
|
862 |
-
"judge": "arena_user_10.16.2.201",
|
863 |
-
"anony": false,
|
864 |
-
"tstamp": 1715406371.8227
|
865 |
-
},
|
866 |
-
{
|
867 |
-
"model_a": "CycleDiffusion",
|
868 |
-
"model_b": "CosXLEdit",
|
869 |
-
"winner": "model_b",
|
870 |
-
"judge": "arena_user_10.16.41.118",
|
871 |
-
"anony": false,
|
872 |
-
"tstamp": 1715406418.5066
|
873 |
-
},
|
874 |
-
{
|
875 |
-
"model_a": "CycleDiffusion",
|
876 |
-
"model_b": "CosXLEdit",
|
877 |
-
"winner": "model_b",
|
878 |
-
"judge": "arena_user_10.16.25.191",
|
879 |
-
"anony": false,
|
880 |
-
"tstamp": 1715406449.9401
|
881 |
-
},
|
882 |
-
{
|
883 |
-
"model_a": "CycleDiffusion",
|
884 |
-
"model_b": "CosXLEdit",
|
885 |
-
"winner": "model_b",
|
886 |
-
"judge": "arena_user_10.16.41.118",
|
887 |
-
"anony": false,
|
888 |
-
"tstamp": 1715406466.5778
|
889 |
-
},
|
890 |
-
{
|
891 |
-
"model_a": "InfEdit",
|
892 |
-
"model_b": "CycleDiffusion",
|
893 |
-
"winner": "model_a",
|
894 |
-
"judge": "arena_user_10.16.2.201",
|
895 |
-
"anony": true,
|
896 |
-
"tstamp": 1715620708.6361
|
897 |
-
},
|
898 |
-
{
|
899 |
-
"model_a": "Prompt2prompt",
|
900 |
-
"model_b": "CosXLEdit",
|
901 |
-
"winner": "model_a",
|
902 |
-
"judge": "arena_user_10.16.41.118",
|
903 |
-
"anony": false,
|
904 |
-
"tstamp": 1715621013.5373
|
905 |
-
},
|
906 |
-
{
|
907 |
-
"model_a": "MagicBrush",
|
908 |
-
"model_b": "CycleDiffusion",
|
909 |
-
"winner": "tie (bothbad)",
|
910 |
-
"judge": "arena_user_10.16.2.201",
|
911 |
-
"anony": true,
|
912 |
-
"tstamp": 1715661224.0507
|
913 |
-
},
|
914 |
-
{
|
915 |
-
"model_a": "SDEdit",
|
916 |
-
"model_b": "PNP",
|
917 |
-
"winner": "tie (bothbad)",
|
918 |
-
"judge": "arena_user_10.16.41.118",
|
919 |
-
"anony": true,
|
920 |
-
"tstamp": 1715661259.6143
|
921 |
-
},
|
922 |
-
{
|
923 |
-
"model_a": "Pix2PixZero",
|
924 |
-
"model_b": "Prompt2prompt",
|
925 |
-
"winner": "tie (bothbad)",
|
926 |
-
"judge": "arena_user_10.16.41.118",
|
927 |
-
"anony": true,
|
928 |
-
"tstamp": 1715661288.6018
|
929 |
-
},
|
930 |
-
{
|
931 |
-
"model_a": "InstructPix2Pix",
|
932 |
-
"model_b": "Prompt2prompt",
|
933 |
-
"winner": "model_b",
|
934 |
-
"judge": "arena_user_10.16.25.191",
|
935 |
-
"anony": true,
|
936 |
-
"tstamp": 1715661310.3621
|
937 |
-
},
|
938 |
-
{
|
939 |
-
"model_a": "CosXLEdit",
|
940 |
-
"model_b": "InstructPix2Pix",
|
941 |
-
"winner": "tie (bothbad)",
|
942 |
-
"judge": "arena_user_10.16.25.191",
|
943 |
-
"anony": true,
|
944 |
-
"tstamp": 1715718742.1258
|
945 |
-
},
|
946 |
-
{
|
947 |
-
"model_a": "MagicBrush",
|
948 |
-
"model_b": "PNP",
|
949 |
-
"winner": "model_a",
|
950 |
-
"judge": "arena_user_10.16.2.201",
|
951 |
-
"anony": true,
|
952 |
-
"tstamp": 1715718773.1054
|
953 |
-
},
|
954 |
-
{
|
955 |
-
"model_a": "SDEdit",
|
956 |
-
"model_b": "CosXLEdit",
|
957 |
-
"winner": "tie (bothbad)",
|
958 |
-
"judge": "arena_user_10.16.2.201",
|
959 |
-
"anony": true,
|
960 |
-
"tstamp": 1715718785.2832
|
961 |
-
},
|
962 |
-
{
|
963 |
-
"model_a": "InstructPix2Pix",
|
964 |
-
"model_b": "SDEdit",
|
965 |
-
"winner": "tie (bothbad)",
|
966 |
-
"judge": "arena_user_10.16.2.201",
|
967 |
-
"anony": true,
|
968 |
-
"tstamp": 1715718804.143
|
969 |
-
},
|
970 |
-
{
|
971 |
-
"model_a": "InfEdit",
|
972 |
-
"model_b": "CosXLEdit",
|
973 |
-
"winner": "model_b",
|
974 |
-
"judge": "arena_user_10.16.25.191",
|
975 |
-
"anony": true,
|
976 |
-
"tstamp": 1715718826.0248
|
977 |
-
},
|
978 |
-
{
|
979 |
-
"model_a": "InfEdit",
|
980 |
-
"model_b": "Prompt2prompt",
|
981 |
-
"winner": "model_a",
|
982 |
-
"judge": "arena_user_10.16.2.201",
|
983 |
-
"anony": true,
|
984 |
-
"tstamp": 1715718869.0041
|
985 |
-
},
|
986 |
-
{
|
987 |
-
"model_a": "InfEdit",
|
988 |
-
"model_b": "CosXLEdit",
|
989 |
-
"winner": "model_b",
|
990 |
-
"judge": "arena_user_10.16.2.201",
|
991 |
-
"anony": true,
|
992 |
-
"tstamp": 1715718904.9307
|
993 |
-
},
|
994 |
-
{
|
995 |
-
"model_a": "Prompt2prompt",
|
996 |
-
"model_b": "Pix2PixZero",
|
997 |
-
"winner": "model_a",
|
998 |
-
"judge": "arena_user_10.16.25.191",
|
999 |
-
"anony": true,
|
1000 |
-
"tstamp": 1715718933.1272
|
1001 |
-
},
|
1002 |
-
{
|
1003 |
-
"model_a": "Pix2PixZero",
|
1004 |
-
"model_b": "MagicBrush",
|
1005 |
-
"winner": "tie (bothbad)",
|
1006 |
-
"judge": "arena_user_10.16.2.201",
|
1007 |
-
"anony": true,
|
1008 |
-
"tstamp": 1715718954.8497
|
1009 |
-
},
|
1010 |
-
{
|
1011 |
-
"model_a": "MagicBrush",
|
1012 |
-
"model_b": "PNP",
|
1013 |
-
"winner": "model_b",
|
1014 |
-
"judge": "arena_user_10.16.25.191",
|
1015 |
-
"anony": true,
|
1016 |
-
"tstamp": 1715718966.8633
|
1017 |
-
},
|
1018 |
-
{
|
1019 |
-
"model_a": "CycleDiffusion",
|
1020 |
-
"model_b": "Prompt2prompt",
|
1021 |
-
"winner": "tie (bothbad)",
|
1022 |
-
"judge": "arena_user_10.16.25.191",
|
1023 |
-
"anony": true,
|
1024 |
-
"tstamp": 1715719000.6673
|
1025 |
-
},
|
1026 |
-
{
|
1027 |
-
"model_a": "MagicBrush",
|
1028 |
-
"model_b": "Pix2PixZero",
|
1029 |
-
"winner": "tie (bothbad)",
|
1030 |
-
"judge": "arena_user_10.16.25.191",
|
1031 |
-
"anony": true,
|
1032 |
-
"tstamp": 1715719019.5495
|
1033 |
-
},
|
1034 |
-
{
|
1035 |
-
"model_a": "InfEdit",
|
1036 |
-
"model_b": "Prompt2prompt",
|
1037 |
-
"winner": "model_a",
|
1038 |
-
"judge": "arena_user_10.16.25.191",
|
1039 |
-
"anony": true,
|
1040 |
-
"tstamp": 1715719035.903
|
1041 |
-
},
|
1042 |
-
{
|
1043 |
-
"model_a": "MagicBrush",
|
1044 |
-
"model_b": "Pix2PixZero",
|
1045 |
-
"winner": "model_a",
|
1046 |
-
"judge": "arena_user_10.16.25.191",
|
1047 |
-
"anony": true,
|
1048 |
-
"tstamp": 1715719046.925
|
1049 |
-
},
|
1050 |
-
{
|
1051 |
-
"model_a": "CycleDiffusion",
|
1052 |
-
"model_b": "CosXLEdit",
|
1053 |
-
"winner": "tie (bothbad)",
|
1054 |
-
"judge": "arena_user_10.16.2.201",
|
1055 |
-
"anony": true,
|
1056 |
-
"tstamp": 1715719059.6291
|
1057 |
-
},
|
1058 |
-
{
|
1059 |
-
"model_a": "Prompt2prompt",
|
1060 |
-
"model_b": "SDEdit",
|
1061 |
-
"winner": "tie (bothbad)",
|
1062 |
-
"judge": "arena_user_10.16.15.199",
|
1063 |
-
"anony": true,
|
1064 |
-
"tstamp": 1715719076.6727
|
1065 |
-
},
|
1066 |
-
{
|
1067 |
-
"model_a": "MagicBrush",
|
1068 |
-
"model_b": "PNP",
|
1069 |
-
"winner": "model_a",
|
1070 |
-
"judge": "arena_user_10.16.25.191",
|
1071 |
-
"anony": true,
|
1072 |
-
"tstamp": 1715719086.7836
|
1073 |
-
},
|
1074 |
-
{
|
1075 |
-
"model_a": "CycleDiffusion",
|
1076 |
-
"model_b": "MagicBrush",
|
1077 |
-
"winner": "model_b",
|
1078 |
-
"judge": "arena_user_10.16.25.191",
|
1079 |
-
"anony": true,
|
1080 |
-
"tstamp": 1715719109.8071
|
1081 |
-
},
|
1082 |
-
{
|
1083 |
-
"model_a": "Prompt2prompt",
|
1084 |
-
"model_b": "InstructPix2Pix",
|
1085 |
-
"winner": "model_b",
|
1086 |
-
"judge": "arena_user_10.16.25.191",
|
1087 |
-
"anony": true,
|
1088 |
-
"tstamp": 1715719122.8237
|
1089 |
-
},
|
1090 |
-
{
|
1091 |
-
"model_a": "MagicBrush",
|
1092 |
-
"model_b": "SDEdit",
|
1093 |
-
"winner": "model_a",
|
1094 |
-
"judge": "arena_user_10.16.15.199",
|
1095 |
-
"anony": true,
|
1096 |
-
"tstamp": 1715719134.1345
|
1097 |
-
},
|
1098 |
-
{
|
1099 |
-
"model_a": "SDEdit",
|
1100 |
-
"model_b": "CycleDiffusion",
|
1101 |
-
"winner": "tie (bothbad)",
|
1102 |
-
"judge": "arena_user_10.16.17.217",
|
1103 |
-
"anony": true,
|
1104 |
-
"tstamp": 1715719153.4359
|
1105 |
-
},
|
1106 |
-
{
|
1107 |
-
"model_a": "Pix2PixZero",
|
1108 |
-
"model_b": "MagicBrush",
|
1109 |
-
"winner": "tie (bothbad)",
|
1110 |
-
"judge": "arena_user_10.16.17.217",
|
1111 |
-
"anony": true,
|
1112 |
-
"tstamp": 1715719160.5285
|
1113 |
-
},
|
1114 |
-
{
|
1115 |
-
"model_a": "MagicBrush",
|
1116 |
-
"model_b": "InstructPix2Pix",
|
1117 |
-
"winner": "model_b",
|
1118 |
-
"judge": "arena_user_10.16.15.199",
|
1119 |
-
"anony": true,
|
1120 |
-
"tstamp": 1715719171.4473
|
1121 |
-
},
|
1122 |
-
{
|
1123 |
-
"model_a": "InstructPix2Pix",
|
1124 |
-
"model_b": "SDEdit",
|
1125 |
-
"winner": "tie (bothbad)",
|
1126 |
-
"judge": "arena_user_10.16.2.201",
|
1127 |
-
"anony": true,
|
1128 |
-
"tstamp": 1715719184.6227
|
1129 |
-
},
|
1130 |
-
{
|
1131 |
-
"model_a": "CosXLEdit",
|
1132 |
-
"model_b": "MagicBrush",
|
1133 |
-
"winner": "model_a",
|
1134 |
-
"judge": "arena_user_10.16.2.201",
|
1135 |
-
"anony": true,
|
1136 |
-
"tstamp": 1715719210.0429
|
1137 |
-
},
|
1138 |
-
{
|
1139 |
-
"model_a": "CycleDiffusion",
|
1140 |
-
"model_b": "MagicBrush",
|
1141 |
-
"winner": "model_b",
|
1142 |
-
"judge": "arena_user_10.16.41.118",
|
1143 |
-
"anony": true,
|
1144 |
-
"tstamp": 1715719219.6447
|
1145 |
-
},
|
1146 |
-
{
|
1147 |
-
"model_a": "PNP",
|
1148 |
-
"model_b": "Pix2PixZero",
|
1149 |
-
"winner": "tie (bothbad)",
|
1150 |
-
"judge": "arena_user_10.16.41.118",
|
1151 |
-
"anony": true,
|
1152 |
-
"tstamp": 1715719237.7036
|
1153 |
-
},
|
1154 |
-
{
|
1155 |
-
"model_a": "PNP",
|
1156 |
-
"model_b": "CycleDiffusion",
|
1157 |
-
"winner": "tie (bothbad)",
|
1158 |
-
"judge": "arena_user_10.16.25.191",
|
1159 |
-
"anony": true,
|
1160 |
-
"tstamp": 1715719249.4321
|
1161 |
-
},
|
1162 |
-
{
|
1163 |
-
"model_a": "Prompt2prompt",
|
1164 |
-
"model_b": "Pix2PixZero",
|
1165 |
-
"winner": "model_a",
|
1166 |
-
"judge": "arena_user_10.16.2.201",
|
1167 |
-
"anony": true,
|
1168 |
-
"tstamp": 1715719257.5877
|
1169 |
-
},
|
1170 |
-
{
|
1171 |
-
"model_a": "CosXLEdit",
|
1172 |
-
"model_b": "Pix2PixZero",
|
1173 |
-
"winner": "tie (bothbad)",
|
1174 |
-
"judge": "arena_user_10.16.25.191",
|
1175 |
-
"anony": true,
|
1176 |
-
"tstamp": 1715719273.7637
|
1177 |
-
},
|
1178 |
-
{
|
1179 |
-
"model_a": "PNP",
|
1180 |
-
"model_b": "CosXLEdit",
|
1181 |
-
"winner": "model_b",
|
1182 |
-
"judge": "arena_user_10.16.17.217",
|
1183 |
-
"anony": true,
|
1184 |
-
"tstamp": 1715719288.4629
|
1185 |
-
},
|
1186 |
-
{
|
1187 |
-
"model_a": "Pix2PixZero",
|
1188 |
-
"model_b": "PNP",
|
1189 |
-
"winner": "model_b",
|
1190 |
-
"judge": "arena_user_10.16.41.118",
|
1191 |
-
"anony": true,
|
1192 |
-
"tstamp": 1715719299.1712
|
1193 |
-
},
|
1194 |
-
{
|
1195 |
-
"model_a": "PNP",
|
1196 |
-
"model_b": "MagicBrush",
|
1197 |
-
"winner": "model_b",
|
1198 |
-
"judge": "arena_user_10.16.2.201",
|
1199 |
-
"anony": true,
|
1200 |
-
"tstamp": 1715719306.5928
|
1201 |
-
},
|
1202 |
-
{
|
1203 |
-
"model_a": "InstructPix2Pix",
|
1204 |
-
"model_b": "PNP",
|
1205 |
-
"winner": "tie (bothbad)",
|
1206 |
-
"judge": "arena_user_10.16.15.199",
|
1207 |
-
"anony": true,
|
1208 |
-
"tstamp": 1715719356.0694
|
1209 |
-
},
|
1210 |
-
{
|
1211 |
-
"model_a": "Prompt2prompt",
|
1212 |
-
"model_b": "CosXLEdit",
|
1213 |
-
"winner": "model_a",
|
1214 |
-
"judge": "arena_user_10.16.25.191",
|
1215 |
-
"anony": true,
|
1216 |
-
"tstamp": 1715719368.0491
|
1217 |
-
},
|
1218 |
-
{
|
1219 |
-
"model_a": "Prompt2prompt",
|
1220 |
-
"model_b": "CycleDiffusion",
|
1221 |
-
"winner": "tie (bothbad)",
|
1222 |
-
"judge": "arena_user_10.16.41.118",
|
1223 |
-
"anony": true,
|
1224 |
-
"tstamp": 1715719379.185
|
1225 |
-
},
|
1226 |
-
{
|
1227 |
-
"model_a": "CycleDiffusion",
|
1228 |
-
"model_b": "Prompt2prompt",
|
1229 |
-
"winner": "tie (bothbad)",
|
1230 |
-
"judge": "arena_user_10.16.2.201",
|
1231 |
-
"anony": true,
|
1232 |
-
"tstamp": 1715719389.0771
|
1233 |
-
},
|
1234 |
-
{
|
1235 |
-
"model_a": "Pix2PixZero",
|
1236 |
-
"model_b": "MagicBrush",
|
1237 |
-
"winner": "model_b",
|
1238 |
-
"judge": "arena_user_10.16.17.217",
|
1239 |
-
"anony": true,
|
1240 |
-
"tstamp": 1715719397.7162
|
1241 |
-
},
|
1242 |
-
{
|
1243 |
-
"model_a": "PNP",
|
1244 |
-
"model_b": "InstructPix2Pix",
|
1245 |
-
"winner": "tie (bothbad)",
|
1246 |
-
"judge": "arena_user_10.16.2.201",
|
1247 |
-
"anony": true,
|
1248 |
-
"tstamp": 1715719406.4165
|
1249 |
-
},
|
1250 |
-
{
|
1251 |
-
"model_a": "Pix2PixZero",
|
1252 |
-
"model_b": "PNP",
|
1253 |
-
"winner": "model_b",
|
1254 |
-
"judge": "arena_user_10.16.25.191",
|
1255 |
-
"anony": true,
|
1256 |
-
"tstamp": 1715719429.1002
|
1257 |
-
},
|
1258 |
-
{
|
1259 |
-
"model_a": "CosXLEdit",
|
1260 |
-
"model_b": "MagicBrush",
|
1261 |
-
"winner": "model_a",
|
1262 |
-
"judge": "arena_user_10.16.2.201",
|
1263 |
-
"anony": true,
|
1264 |
-
"tstamp": 1715719435.4694
|
1265 |
-
},
|
1266 |
-
{
|
1267 |
-
"model_a": "PNP",
|
1268 |
-
"model_b": "SDEdit",
|
1269 |
-
"winner": "tie (bothbad)",
|
1270 |
-
"judge": "arena_user_10.16.2.201",
|
1271 |
-
"anony": true,
|
1272 |
-
"tstamp": 1715719454.4526
|
1273 |
-
},
|
1274 |
-
{
|
1275 |
-
"model_a": "InfEdit",
|
1276 |
-
"model_b": "PNP",
|
1277 |
-
"winner": "tie (bothbad)",
|
1278 |
-
"judge": "arena_user_10.16.17.217",
|
1279 |
-
"anony": true,
|
1280 |
-
"tstamp": 1715719470.154
|
1281 |
-
},
|
1282 |
-
{
|
1283 |
-
"model_a": "MagicBrush",
|
1284 |
-
"model_b": "PNP",
|
1285 |
-
"winner": "model_a",
|
1286 |
-
"judge": "arena_user_10.16.41.118",
|
1287 |
-
"anony": true,
|
1288 |
-
"tstamp": 1715719482.3114
|
1289 |
-
},
|
1290 |
-
{
|
1291 |
-
"model_a": "SDEdit",
|
1292 |
-
"model_b": "PNP",
|
1293 |
-
"winner": "tie",
|
1294 |
-
"judge": "arena_user_10.16.2.201",
|
1295 |
-
"anony": true,
|
1296 |
-
"tstamp": 1715719499.9643
|
1297 |
-
},
|
1298 |
-
{
|
1299 |
-
"model_a": "InstructPix2Pix",
|
1300 |
-
"model_b": "MagicBrush",
|
1301 |
-
"winner": "model_b",
|
1302 |
-
"judge": "arena_user_10.16.2.201",
|
1303 |
-
"anony": true,
|
1304 |
-
"tstamp": 1715719513.7317
|
1305 |
-
},
|
1306 |
-
{
|
1307 |
-
"model_a": "InfEdit",
|
1308 |
-
"model_b": "PNP",
|
1309 |
-
"winner": "model_a",
|
1310 |
-
"judge": "arena_user_10.16.15.199",
|
1311 |
-
"anony": true,
|
1312 |
-
"tstamp": 1715719527.69
|
1313 |
-
},
|
1314 |
-
{
|
1315 |
-
"model_a": "Prompt2prompt",
|
1316 |
-
"model_b": "MagicBrush",
|
1317 |
-
"winner": "tie (bothbad)",
|
1318 |
-
"judge": "arena_user_10.16.41.118",
|
1319 |
-
"anony": true,
|
1320 |
-
"tstamp": 1715719542.751
|
1321 |
-
},
|
1322 |
-
{
|
1323 |
-
"model_a": "Pix2PixZero",
|
1324 |
-
"model_b": "InfEdit",
|
1325 |
-
"winner": "tie (bothbad)",
|
1326 |
-
"judge": "arena_user_10.16.15.199",
|
1327 |
-
"anony": true,
|
1328 |
-
"tstamp": 1715719560.9912
|
1329 |
-
},
|
1330 |
-
{
|
1331 |
-
"model_a": "PNP",
|
1332 |
-
"model_b": "Pix2PixZero",
|
1333 |
-
"winner": "tie (bothbad)",
|
1334 |
-
"judge": "arena_user_10.16.2.201",
|
1335 |
-
"anony": true,
|
1336 |
-
"tstamp": 1715719575.3291
|
1337 |
-
},
|
1338 |
-
{
|
1339 |
-
"model_a": "PNP",
|
1340 |
-
"model_b": "CosXLEdit",
|
1341 |
-
"winner": "model_b",
|
1342 |
-
"judge": "arena_user_10.16.17.217",
|
1343 |
-
"anony": true,
|
1344 |
-
"tstamp": 1715719581.9552
|
1345 |
-
},
|
1346 |
-
{
|
1347 |
-
"model_a": "Pix2PixZero",
|
1348 |
-
"model_b": "Prompt2prompt",
|
1349 |
-
"winner": "tie (bothbad)",
|
1350 |
-
"judge": "arena_user_10.16.25.191",
|
1351 |
-
"anony": true,
|
1352 |
-
"tstamp": 1715719591.9907
|
1353 |
-
},
|
1354 |
-
{
|
1355 |
-
"model_a": "CosXLEdit",
|
1356 |
-
"model_b": "SDEdit",
|
1357 |
-
"winner": "model_a",
|
1358 |
-
"judge": "arena_user_10.16.2.201",
|
1359 |
-
"anony": true,
|
1360 |
-
"tstamp": 1715719601.8819
|
1361 |
-
},
|
1362 |
-
{
|
1363 |
-
"model_a": "InfEdit",
|
1364 |
-
"model_b": "MagicBrush",
|
1365 |
-
"winner": "model_b",
|
1366 |
-
"judge": "arena_user_10.16.41.118",
|
1367 |
-
"anony": true,
|
1368 |
-
"tstamp": 1715719612.1837
|
1369 |
-
},
|
1370 |
-
{
|
1371 |
-
"model_a": "SDEdit",
|
1372 |
-
"model_b": "InstructPix2Pix",
|
1373 |
-
"winner": "tie (bothbad)",
|
1374 |
-
"judge": "arena_user_10.16.2.201",
|
1375 |
-
"anony": true,
|
1376 |
-
"tstamp": 1715719620.469
|
1377 |
-
},
|
1378 |
-
{
|
1379 |
-
"model_a": "InstructPix2Pix",
|
1380 |
-
"model_b": "MagicBrush",
|
1381 |
-
"winner": "tie (bothbad)",
|
1382 |
-
"judge": "arena_user_10.16.41.118",
|
1383 |
-
"anony": true,
|
1384 |
-
"tstamp": 1715719627.34
|
1385 |
-
},
|
1386 |
-
{
|
1387 |
-
"model_a": "MagicBrush",
|
1388 |
-
"model_b": "Prompt2prompt",
|
1389 |
-
"winner": "model_a",
|
1390 |
-
"judge": "arena_user_10.16.2.201",
|
1391 |
-
"anony": true,
|
1392 |
-
"tstamp": 1715719632.694
|
1393 |
-
},
|
1394 |
-
{
|
1395 |
-
"model_a": "Prompt2prompt",
|
1396 |
-
"model_b": "SDEdit",
|
1397 |
-
"winner": "tie (bothbad)",
|
1398 |
-
"judge": "arena_user_10.16.41.118",
|
1399 |
-
"anony": true,
|
1400 |
-
"tstamp": 1715719652.2038
|
1401 |
-
},
|
1402 |
-
{
|
1403 |
-
"model_a": "SDEdit",
|
1404 |
-
"model_b": "Prompt2prompt",
|
1405 |
-
"winner": "tie (bothbad)",
|
1406 |
-
"judge": "arena_user_10.16.25.191",
|
1407 |
-
"anony": true,
|
1408 |
-
"tstamp": 1715719661.8855
|
1409 |
-
},
|
1410 |
-
{
|
1411 |
-
"model_a": "CosXLEdit",
|
1412 |
-
"model_b": "Prompt2prompt",
|
1413 |
-
"winner": "tie (bothbad)",
|
1414 |
-
"judge": "arena_user_10.16.2.201",
|
1415 |
-
"anony": true,
|
1416 |
-
"tstamp": 1715719677.2949
|
1417 |
-
},
|
1418 |
-
{
|
1419 |
-
"model_a": "MagicBrush",
|
1420 |
-
"model_b": "Prompt2prompt",
|
1421 |
-
"winner": "model_a",
|
1422 |
-
"judge": "arena_user_10.16.2.201",
|
1423 |
-
"anony": true,
|
1424 |
-
"tstamp": 1715719687.3022
|
1425 |
-
},
|
1426 |
-
{
|
1427 |
-
"model_a": "SDEdit",
|
1428 |
-
"model_b": "Prompt2prompt",
|
1429 |
-
"winner": "model_b",
|
1430 |
-
"judge": "arena_user_10.16.2.201",
|
1431 |
-
"anony": true,
|
1432 |
-
"tstamp": 1715719699.47
|
1433 |
-
},
|
1434 |
-
{
|
1435 |
-
"model_a": "Pix2PixZero",
|
1436 |
-
"model_b": "InfEdit",
|
1437 |
-
"winner": "model_b",
|
1438 |
-
"judge": "arena_user_10.16.2.201",
|
1439 |
-
"anony": true,
|
1440 |
-
"tstamp": 1715719706.2375
|
1441 |
-
},
|
1442 |
-
{
|
1443 |
-
"model_a": "CosXLEdit",
|
1444 |
-
"model_b": "Prompt2prompt",
|
1445 |
-
"winner": "model_a",
|
1446 |
-
"judge": "arena_user_10.16.17.217",
|
1447 |
-
"anony": true,
|
1448 |
-
"tstamp": 1715719717.3564
|
1449 |
-
},
|
1450 |
-
{
|
1451 |
-
"model_a": "InstructPix2Pix",
|
1452 |
-
"model_b": "CosXLEdit",
|
1453 |
-
"winner": "tie (bothbad)",
|
1454 |
-
"judge": "arena_user_10.16.25.191",
|
1455 |
-
"anony": true,
|
1456 |
-
"tstamp": 1715719722.5542
|
1457 |
-
},
|
1458 |
-
{
|
1459 |
-
"model_a": "InfEdit",
|
1460 |
-
"model_b": "InstructPix2Pix",
|
1461 |
-
"winner": "tie (bothbad)",
|
1462 |
-
"judge": "arena_user_10.16.41.118",
|
1463 |
-
"anony": true,
|
1464 |
-
"tstamp": 1715719728.5417
|
1465 |
-
},
|
1466 |
-
{
|
1467 |
-
"model_a": "MagicBrush",
|
1468 |
-
"model_b": "SDEdit",
|
1469 |
-
"winner": "model_a",
|
1470 |
-
"judge": "arena_user_10.16.2.201",
|
1471 |
-
"anony": true,
|
1472 |
-
"tstamp": 1715719737.2385
|
1473 |
-
},
|
1474 |
-
{
|
1475 |
-
"model_a": "MagicBrush",
|
1476 |
-
"model_b": "Pix2PixZero",
|
1477 |
-
"winner": "tie (bothbad)",
|
1478 |
-
"judge": "arena_user_10.16.15.199",
|
1479 |
-
"anony": true,
|
1480 |
-
"tstamp": 1715815138.5243
|
1481 |
-
},
|
1482 |
-
{
|
1483 |
-
"model_a": "CosXLEdit",
|
1484 |
-
"model_b": "Prompt2prompt",
|
1485 |
-
"winner": "model_b",
|
1486 |
-
"judge": "arena_user_10.16.17.217",
|
1487 |
-
"anony": true,
|
1488 |
-
"tstamp": 1715815152.0033
|
1489 |
-
},
|
1490 |
-
{
|
1491 |
-
"model_a": "Pix2PixZero",
|
1492 |
-
"model_b": "Prompt2prompt",
|
1493 |
-
"winner": "tie (bothbad)",
|
1494 |
-
"judge": "arena_user_10.16.41.118",
|
1495 |
-
"anony": true,
|
1496 |
-
"tstamp": 1715815169.0475
|
1497 |
-
},
|
1498 |
-
{
|
1499 |
-
"model_a": "InstructPix2Pix",
|
1500 |
-
"model_b": "SDEdit",
|
1501 |
-
"winner": "model_b",
|
1502 |
-
"judge": "arena_user_10.16.41.118",
|
1503 |
-
"anony": true,
|
1504 |
-
"tstamp": 1715815187.1917
|
1505 |
-
},
|
1506 |
-
{
|
1507 |
-
"model_a": "InstructPix2Pix",
|
1508 |
-
"model_b": "Pix2PixZero",
|
1509 |
-
"winner": "tie (bothbad)",
|
1510 |
-
"judge": "arena_user_10.16.2.201",
|
1511 |
-
"anony": true,
|
1512 |
-
"tstamp": 1715815197.5233
|
1513 |
-
},
|
1514 |
-
{
|
1515 |
-
"model_a": "Pix2PixZero",
|
1516 |
-
"model_b": "SDEdit",
|
1517 |
-
"winner": "tie (bothbad)",
|
1518 |
-
"judge": "arena_user_10.16.2.201",
|
1519 |
-
"anony": true,
|
1520 |
-
"tstamp": 1715815209.8285
|
1521 |
-
},
|
1522 |
-
{
|
1523 |
-
"model_a": "CycleDiffusion",
|
1524 |
-
"model_b": "MagicBrush",
|
1525 |
-
"winner": "model_b",
|
1526 |
-
"judge": "arena_user_10.16.2.201",
|
1527 |
-
"anony": true,
|
1528 |
-
"tstamp": 1715815228.6736
|
1529 |
-
},
|
1530 |
-
{
|
1531 |
-
"model_a": "InfEdit",
|
1532 |
-
"model_b": "Pix2PixZero",
|
1533 |
-
"winner": "tie (bothbad)",
|
1534 |
-
"judge": "arena_user_10.16.2.201",
|
1535 |
-
"anony": true,
|
1536 |
-
"tstamp": 1715815236.3935
|
1537 |
-
},
|
1538 |
-
{
|
1539 |
-
"model_a": "SDEdit",
|
1540 |
-
"model_b": "PNP",
|
1541 |
-
"winner": "tie (bothbad)",
|
1542 |
-
"judge": "arena_user_10.16.25.191",
|
1543 |
-
"anony": true,
|
1544 |
-
"tstamp": 1715815265.9705
|
1545 |
-
},
|
1546 |
-
{
|
1547 |
-
"model_a": "MagicBrush",
|
1548 |
-
"model_b": "SDEdit",
|
1549 |
-
"winner": "tie (bothbad)",
|
1550 |
-
"judge": "arena_user_10.16.15.199",
|
1551 |
-
"anony": true,
|
1552 |
-
"tstamp": 1715815278.5019
|
1553 |
-
},
|
1554 |
-
{
|
1555 |
-
"model_a": "CycleDiffusion",
|
1556 |
-
"model_b": "CosXLEdit",
|
1557 |
-
"winner": "tie (bothbad)",
|
1558 |
-
"judge": "arena_user_10.16.15.199",
|
1559 |
-
"anony": true,
|
1560 |
-
"tstamp": 1715815294.5978
|
1561 |
-
},
|
1562 |
-
{
|
1563 |
-
"model_a": "MagicBrush",
|
1564 |
-
"model_b": "InfEdit",
|
1565 |
-
"winner": "model_a",
|
1566 |
-
"judge": "arena_user_10.16.17.217",
|
1567 |
-
"anony": true,
|
1568 |
-
"tstamp": 1715815325.4468
|
1569 |
-
},
|
1570 |
-
{
|
1571 |
-
"model_a": "MagicBrush",
|
1572 |
-
"model_b": "Pix2PixZero",
|
1573 |
-
"winner": "model_a",
|
1574 |
-
"judge": "arena_user_10.16.41.118",
|
1575 |
-
"anony": true,
|
1576 |
-
"tstamp": 1715913098.6617
|
1577 |
-
}
|
1578 |
-
]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
arena_elo/results/20240516/elo_results_image_editing.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:837f11fd6cda1fe2d6a5cc1c239a207725ad0157b16282303cb684427ddc7e9d
|
3 |
-
size 62484
|
|
|
|
|
|
|
|
arena_elo/results/20240516/image_editing_leaderboard.csv
DELETED
@@ -1,10 +0,0 @@
|
|
1 |
-
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
-
CosXLEdit,CosXLEdit,1097.63559213644,1085.7285800995926,cosxl-nc-community,Stability AI,https://huggingface.co/spaces/multimodalart/cosxl
|
3 |
-
MagicBrush,MagicBrush,1075.1489922450316,1086.8819832924794,CC-BY-4.0,"The Ohio State University, University of Waterloo",https://osu-nlp-group.github.io/MagicBrush
|
4 |
-
InfEdit,InfEdit,1065.4719519196174,1090.684638162955,Apache-2.0,"University of Michigan, University of California, Berkeley",https://huggingface.co/spaces/sled-umich/InfEdit
|
5 |
-
Prompt2prompt,Prompt2prompt,1063.1432047252297,1060.8146250689238,Apache-2.0,"Google, Tel Aviv University",https://prompt-to-prompt.github.io
|
6 |
-
InstructPix2Pix,InstructPix2Pix,1043.9312648233226,1028.7932718869638,"Copyright 2023 Timothy Brooks, Aleksander Holynski, Alexei A. Efros","University of California, Berkeley",https://www.timothybrooks.com/instruct-pix2pix
|
7 |
-
PNP,PNP,1022.4342554377677,1043.322342347598,-,Weizmann Institute of Science,https://github.com/MichalGeyer/plug-and-play
|
8 |
-
Pix2PixZero,Pix2PixZero,891.2979039265506,886.7359371585381,MIT License,"Carnegie Mellon University, Adobe Research",https://pix2pixzero.github.io
|
9 |
-
SDEdit,SDEdit,890.443823405714,880.5508125882768,MIT License,Stanford University,https://sde-image-editing.github.io
|
10 |
-
CycleDiffusion,CycleDiffusion,850.4930113803264,836.4878093946726,X11,Carnegie Mellon University,https://github.com/ChenWu98/cycle-diffusion
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
arena_elo/results/20240517/clean_battle_t2i_generation.json
DELETED
The diff for this file is too large to render.
See raw diff
|
|
arena_elo/results/20240517/elo_results_t2i_generation.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:93808a9ce2f497109d0fc708e4055b6463a692502ef541ff28352f52b612916d
|
3 |
-
size 68172
|
|
|
|
|
|
|
|
arena_elo/results/20240517/t2i_generation_leaderboard.csv
DELETED
@@ -1,12 +0,0 @@
|
|
1 |
-
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
-
PlayGround V2.5,PlayGround V2.5,1136.9514432133128,1081.5838551712898,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
|
3 |
-
PlayGround V2,PlayGround V2,1099.4286233187172,1042.590911846903,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
|
4 |
-
SDXLLightning,SDXLLightning,1062.4565867132737,1004.4096880141087,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
|
5 |
-
StableCascade,StableCascade,1061.93020315328,1006.1117357811837,stable-cascade-nc-community (other),Stability AI,https://huggingface.co/stabilityai/stable-cascade
|
6 |
-
PixArtAlpha,PixArtAlpha,1051.847602698194,981.1247821885942,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
|
7 |
-
PixArtSigma,PixArtSigma,1049.8339911951734,989.7640320919886,openrail++,PixArt-alpha,https://fal.ai/models/fal-ai/pixart-sigma
|
8 |
-
SDXL,SDXL,999.6167439144875,941.9623909945509,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
|
9 |
-
SDXLTurbo,SDXLTurbo,933.468824554199,875.8124778188443,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
|
10 |
-
LCM(v1.5/XL),LCM(v1.5/XL),929.425577747465,865.7356218313212,openrail++,Latent Consistency,https://fal.ai/models/fal-ai/fast-lcm-diffusion/api
|
11 |
-
OpenJourney,OpenJourney,857.2709081764949,793.4952273226107,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
|
12 |
-
LCM,LCM,817.7694953154022,773.4948395309905,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
arena_elo/results/20240525/clean_battle_image_editing.json
DELETED
The diff for this file is too large to render.
See raw diff
|
|
arena_elo/results/20240525/clean_battle_t2i_generation.json
DELETED
The diff for this file is too large to render.
See raw diff
|
|
arena_elo/results/20240525/elo_results_image_editing.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:a90694074e1b68a62bd75cdf0c81eb545dfcc115da34e9efdb215d668bd13196
|
3 |
-
size 62502
|
|
|
|
|
|
|
|
arena_elo/results/20240525/elo_results_t2i_generation.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:7172486b8454e25f9b3a9df84e55d2dcce923a3b63e091fd8d165b63bbde7bc4
|
3 |
-
size 68170
|
|
|
|
|
|
|
|