DongfuJiang commited on
Commit
8750953
1 Parent(s): f468e90
arena_elo/elo_rating/clean_battle_data.py CHANGED
@@ -79,6 +79,7 @@ def to_openai_format(messages):
79
 
80
 
81
  def replace_model_name(old_name, tstamp):
 
82
  replace_dict = {
83
  "bard": "palm-2",
84
  "claude-v1": "claude-1",
@@ -87,14 +88,19 @@ def replace_model_name(old_name, tstamp):
87
  "claude-2": "claude-2.0",
88
  "PlayGroundV2": "PlayGround V2",
89
  "PlayGroundV2.5": "PlayGround V2.5",
 
 
90
  }
91
  if old_name in ["gpt-4", "gpt-3.5-turbo"]:
92
  if tstamp > 1687849200:
93
- return old_name + "-0613"
94
  else:
95
- return old_name + "-0314"
96
  if old_name in replace_dict:
97
- return replace_dict[old_name]
 
 
 
98
  return old_name
99
 
100
 
@@ -305,6 +311,10 @@ def clean_battle_data(
305
 
306
  else:
307
  raise ValueError(f"Invalid task_name: {task_name}")
 
 
 
 
308
  models = [replace_model_name(m, row["tstamp"]) for m in models]
309
 
310
  # Exclude certain models
 
79
 
80
 
81
  def replace_model_name(old_name, tstamp):
82
+
83
  replace_dict = {
84
  "bard": "palm-2",
85
  "claude-v1": "claude-1",
 
88
  "claude-2": "claude-2.0",
89
  "PlayGroundV2": "PlayGround V2",
90
  "PlayGroundV2.5": "PlayGround V2.5",
91
+ "FluxTimestep": "FLUX1schnell",
92
+ "FluxGuidance": "FLUX1dev"
93
  }
94
  if old_name in ["gpt-4", "gpt-3.5-turbo"]:
95
  if tstamp > 1687849200:
96
+ old_name += "-0613"
97
  else:
98
+ old_name += "-0314"
99
  if old_name in replace_dict:
100
+ old_name = replace_dict[old_name]
101
+ if "Flux" in old_name:
102
+ print(f"Invalid model names: {old_name}")
103
+ exit(1)
104
  return old_name
105
 
106
 
 
311
 
312
  else:
313
  raise ValueError(f"Invalid task_name: {task_name}")
314
+
315
+ # if "Flux" in models[0] or "Flux" in models[1]:
316
+ # print(f"Invalid model names: {models}")
317
+ # exit(1)
318
  models = [replace_model_name(m, row["tstamp"]) for m in models]
319
 
320
  # Exclude certain models
arena_elo/elo_rating/elo_analysis.py CHANGED
@@ -452,3 +452,6 @@ if __name__ == "__main__":
452
  }
453
  with open(f"elo_results_{cutoff_date}.pkl", "wb") as fout:
454
  pickle.dump(results, fout)
 
 
 
 
452
  }
453
  with open(f"elo_results_{cutoff_date}.pkl", "wb") as fout:
454
  pickle.dump(results, fout)
455
+
456
+ with open("cut_off_date.txt", "w") as fout:
457
+ fout.write(cutoff_date)
arena_elo/results/20240809/elo_results_image_editing.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1da1e19486e987e18cf9bec79c36f1b71291a4f92490cf7d3af4edbc98628510
3
- size 62482
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b54d460d93f22ee6e2519ccc82e4ebd64ec81987505760c428b593ff91a13368
3
+ size 62455
arena_elo/results/20240809/image_editing_leaderboard.csv CHANGED
@@ -2,7 +2,7 @@ key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,
2
  MagicBrush,MagicBrush,1112.4518849527376,1116.3228088792275,CC-BY-4.0,"The Ohio State University, University of Waterloo",https://osu-nlp-group.github.io/MagicBrush
3
  InfEdit,InfEdit,1077.2249767545911,1077.0861206067664,CC BY-NC-ND 4.0,"University of Michigan, University of California, Berkeley",https://huggingface.co/spaces/sled-umich/InfEdit
4
  CosXLEdit,CosXLEdit,1064.682441262532,1065.599445502775,cosxl-nc-community,Stability AI,https://huggingface.co/spaces/multimodalart/cosxl
5
- InstructPix2Pix,InstructPix2Pix,1035.4054226880567,1033.208668133612,"Copyright 2023 Timothy Brooks, Aleksander Holynski, Alexei A. Efros","University of California, Berkeley",https://www.timothybrooks.com/instruct-pix2pix
6
  PNP,PNP,1001.4916130267786,1006.0747389504991,-,Weizmann Institute of Science,https://github.com/MichalGeyer/plug-and-play
7
  Prompt2prompt,Prompt2prompt,990.9755779591587,992.0796321838297,Apache-2.0,"Google, Tel Aviv University",https://prompt-to-prompt.github.io
8
  CycleDiffusion,CycleDiffusion,938.5637450408492,931.6722574678079,X11,Carnegie Mellon University,https://github.com/ChenWu98/cycle-diffusion
 
2
  MagicBrush,MagicBrush,1112.4518849527376,1116.3228088792275,CC-BY-4.0,"The Ohio State University, University of Waterloo",https://osu-nlp-group.github.io/MagicBrush
3
  InfEdit,InfEdit,1077.2249767545911,1077.0861206067664,CC BY-NC-ND 4.0,"University of Michigan, University of California, Berkeley",https://huggingface.co/spaces/sled-umich/InfEdit
4
  CosXLEdit,CosXLEdit,1064.682441262532,1065.599445502775,cosxl-nc-community,Stability AI,https://huggingface.co/spaces/multimodalart/cosxl
5
+ InstructPix2Pix,InstructPix2Pix,1035.4054226880567,1033.2086681336118,"Copyright 2023 Timothy Brooks, Aleksander Holynski, Alexei A. Efros","University of California, Berkeley",https://www.timothybrooks.com/instruct-pix2pix
6
  PNP,PNP,1001.4916130267786,1006.0747389504991,-,Weizmann Institute of Science,https://github.com/MichalGeyer/plug-and-play
7
  Prompt2prompt,Prompt2prompt,990.9755779591587,992.0796321838297,Apache-2.0,"Google, Tel Aviv University",https://prompt-to-prompt.github.io
8
  CycleDiffusion,CycleDiffusion,938.5637450408492,931.6722574678079,X11,Carnegie Mellon University,https://github.com/ChenWu98/cycle-diffusion
arena_elo/results/20240818/clean_battle_t2i_generation.json ADDED
The diff for this file is too large to render. See raw diff
 
arena_elo/results/20240818/clean_battle_video_generation.json ADDED
The diff for this file is too large to render. See raw diff
 
arena_elo/{elo_results_20240809.pkl → results/20240818/elo_results_t2i_generation.pkl} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b54d460d93f22ee6e2519ccc82e4ebd64ec81987505760c428b593ff91a13368
3
- size 62455
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa69fb8e450bd988c80b346d4f102c5be8bd74605030f0d5a295a71b66230ccd
3
+ size 76790
arena_elo/results/20240818/elo_results_video_generation.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c76c0dad67cabfdbda5beb2056bfaf9f669f7a5a3857716212f6f831516d5f9
3
+ size 59905
arena_elo/results/20240818/t2i_generation_leaderboard.csv ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
2
+ PlayGround V2.5,PlayGround V2.5,1141.5188909673816,1141.7574769353046,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
3
+ FLUX1schnell,FLUX1schnell,1107.0181424085022,1112.4579783184781,N/A,N/A,N/A
4
+ PlayGround V2,PlayGround V2,1083.848194525069,1081.1558760457797,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
5
+ HunyuanDiT,HunyuanDiT,1061.8376119998818,1045.8437711625322,tencent-hunyuan-community,Tencent,https://huggingface.co/Tencent-Hunyuan/HunyuanDiT
6
+ StableCascade,StableCascade,1048.1457195754278,1050.1691240248065,stable-cascade-nc-community (other),Stability AI,https://huggingface.co/stabilityai/stable-cascade
7
+ SDXLLightning,SDXLLightning,1034.30472320188,1037.2932871766393,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
8
+ PixArtAlpha,PixArtAlpha,1033.912116989071,1022.557442237083,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
9
+ PixArtSigma,PixArtSigma,1029.1408183981687,1027.4953277391191,openrail++,PixArt-alpha,https://fal.ai/models/fal-ai/pixart-sigma
10
+ SD3,SD3,1006.8458978216129,1000.2491511468914,stabilityai-nc-research-community,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-3-medium
11
+ SDXL,SDXL,975.3595050901268,974.4701361426086,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
12
+ SDXLTurbo,SDXLTurbo,922.5038319935961,918.6139210049913,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
13
+ LCM(v1.5/XL),LCM(v1.5/XL),916.2179215619182,908.6161501509581,openrail++,Latent Consistency,https://fal.ai/models/fal-ai/fast-lcm-diffusion/api
14
+ OpenJourney,OpenJourney,838.9432903688682,832.1138397704597,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
15
+ LCM,LCM,800.403335098498,812.6668778296877,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
arena_elo/results/20240818/video_generation_leaderboard.csv ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
2
+ StableVideoDiffusion,StableVideoDiffusion,1133.1838006160342,1135.648326348363,stable-video-diffusion-nc-community,Stability AI,https://fal.ai/models/fal-ai/fast-svd/text-to-video/api
3
+ T2VTurbo,T2VTurbo,1097.0055576746822,1095.4539969650828,cc-by-nc-4.0,"University of California, Santa Barbara",https://huggingface.co/jiachenli-ucsb/T2V-Turbo-VC2
4
+ VideoCrafter2,VideoCrafter2,1074.299413538351,1074.604913704468,Apache 2.0,Tencent AI Lab,https://ailab-cvc.github.io/videocrafter2/
5
+ AnimateDiff,AnimateDiff,1068.2089967499214,1066.8805974519646,creativeml-openrail-m,"The Chinese University of Hong Kong, Shanghai AI Lab, Stanford University",https://fal.ai/models/fast-animatediff-t2v
6
+ LaVie,LaVie,995.82479731396,994.8703618669116,Apache 2.0,Shanghai AI Lab,https://github.com/Vchitect/LaVie
7
+ OpenSora,OpenSora,913.3181800582577,913.0542295067128,Apache 2.0,HPC-AI Tech,https://github.com/hpcaitech/Open-Sora
8
+ ModelScope,ModelScope,861.1074201988872,862.3583669429345,cc-by-nc-4.0,Alibaba Group,https://arxiv.org/abs/2308.06571
9
+ AnimateDiffTurbo,AnimateDiffTurbo,857.0518338499064,857.1292072135634,creativeml-openrail-m,"The Chinese University of Hong Kong, Shanghai AI Lab, Stanford University",https://fal.ai/models/fast-animatediff-t2v-turbo
arena_elo/results/latest/clean_battle_t2i_generation.json CHANGED
@@ -49848,8 +49848,8 @@
49848
  "tstamp": 1723054634.5468
49849
  },
49850
  {
49851
- "model_a": "FluxGuidance",
49852
- "model_b": "FluxTimestep",
49853
  "winner": "model_b",
49854
  "judge": "arena_user_10.16.12.147",
49855
  "anony": true,
@@ -49880,8 +49880,8 @@
49880
  "tstamp": 1723063074.7642
49881
  },
49882
  {
49883
- "model_a": "FluxTimestep",
49884
- "model_b": "FluxGuidance",
49885
  "winner": "model_b",
49886
  "judge": "arena_user_10.16.14.231",
49887
  "anony": true,
@@ -49897,14 +49897,14 @@
49897
  },
49898
  {
49899
  "model_a": "AuraFlow",
49900
- "model_b": "FluxGuidance",
49901
  "winner": "model_b",
49902
  "judge": "arena_user_10.16.31.28",
49903
  "anony": false,
49904
  "tstamp": 1723067240.2924
49905
  },
49906
  {
49907
- "model_a": "FluxTimestep",
49908
  "model_b": "SDXLLightning",
49909
  "winner": "model_a",
49910
  "judge": "arena_user_10.16.43.145",
@@ -49920,16 +49920,16 @@
49920
  "tstamp": 1723078808.7741
49921
  },
49922
  {
49923
- "model_a": "FluxTimestep",
49924
- "model_b": "FluxGuidance",
49925
  "winner": "tie (bothbad)",
49926
  "judge": "arena_user_10.16.31.28",
49927
  "anony": false,
49928
  "tstamp": 1723080943.3647
49929
  },
49930
  {
49931
- "model_a": "FluxTimestep",
49932
- "model_b": "FluxGuidance",
49933
  "winner": "tie (bothbad)",
49934
  "judge": "arena_user_10.16.12.147",
49935
  "anony": false,
@@ -50016,7 +50016,7 @@
50016
  "tstamp": 1723160130.8681
50017
  },
50018
  {
50019
- "model_a": "FluxTimestep",
50020
  "model_b": "SDXLLightning",
50021
  "winner": "model_a",
50022
  "judge": "arena_user_10.16.17.24",
@@ -50057,7 +50057,7 @@
50057
  },
50058
  {
50059
  "model_a": "PixArtAlpha",
50060
- "model_b": "FluxGuidance",
50061
  "winner": "tie",
50062
  "judge": "arena_user_10.16.43.145",
50063
  "anony": true,
@@ -50080,7 +50080,7 @@
50080
  "tstamp": 1723160326.9647
50081
  },
50082
  {
50083
- "model_a": "FluxTimestep",
50084
  "model_b": "PlayGround V2.5",
50085
  "winner": "model_a",
50086
  "judge": "arena_user_10.16.22.62",
@@ -50088,8 +50088,8 @@
50088
  "tstamp": 1723165134.1363
50089
  },
50090
  {
50091
- "model_a": "FluxGuidance",
50092
- "model_b": "FluxTimestep",
50093
  "winner": "model_a",
50094
  "judge": "arena_user_10.16.22.62",
50095
  "anony": true,
@@ -50105,7 +50105,7 @@
50105
  },
50106
  {
50107
  "model_a": "OpenJourney",
50108
- "model_b": "FluxGuidance",
50109
  "winner": "model_b",
50110
  "judge": "arena_user_10.16.43.145",
50111
  "anony": true,
@@ -50128,7 +50128,7 @@
50128
  "tstamp": 1723186558.1923
50129
  },
50130
  {
50131
- "model_a": "FluxGuidance",
50132
  "model_b": "StableCascade",
50133
  "winner": "tie",
50134
  "judge": "arena_user_10.16.43.145",
@@ -50144,7 +50144,7 @@
50144
  "tstamp": 1723186599.4345
50145
  },
50146
  {
50147
- "model_a": "FluxTimestep",
50148
  "model_b": "SD3",
50149
  "winner": "model_a",
50150
  "judge": "arena_user_10.16.22.62",
@@ -50169,14 +50169,14 @@
50169
  },
50170
  {
50171
  "model_a": "AuraFlow",
50172
- "model_b": "FluxTimestep",
50173
  "winner": "model_b",
50174
  "judge": "arena_user_10.16.43.145",
50175
  "anony": true,
50176
  "tstamp": 1723203750.3175
50177
  },
50178
  {
50179
- "model_a": "FluxTimestep",
50180
  "model_b": "Kolors",
50181
  "winner": "tie (bothbad)",
50182
  "judge": "arena_user_10.16.22.62",
@@ -50208,7 +50208,7 @@
50208
  "tstamp": 1723206395.3717
50209
  },
50210
  {
50211
- "model_a": "FluxTimestep",
50212
  "model_b": "StableCascade",
50213
  "winner": "model_a",
50214
  "judge": "arena_user_10.16.12.147",
@@ -50225,14 +50225,14 @@
50225
  },
50226
  {
50227
  "model_a": "PixArtSigma",
50228
- "model_b": "FluxGuidance",
50229
  "winner": "model_b",
50230
  "judge": "arena_user_10.16.43.250",
50231
  "anony": true,
50232
  "tstamp": 1723206430.7406
50233
  },
50234
  {
50235
- "model_a": "FluxTimestep",
50236
  "model_b": "SDXLTurbo",
50237
  "winner": "model_a",
50238
  "judge": "arena_user_10.16.43.145",
@@ -50248,16 +50248,16 @@
50248
  "tstamp": 1723224658.8908
50249
  },
50250
  {
50251
- "model_a": "FluxGuidance",
50252
- "model_b": "FluxTimestep",
50253
  "winner": "model_a",
50254
  "judge": "arena_user_10.16.36.191",
50255
  "anony": false,
50256
  "tstamp": 1723232348.385
50257
  },
50258
  {
50259
- "model_a": "FluxTimestep",
50260
- "model_b": "FluxGuidance",
50261
  "winner": "model_b",
50262
  "judge": "arena_user_10.16.36.191",
50263
  "anony": false,
@@ -50289,7 +50289,7 @@
50289
  },
50290
  {
50291
  "model_a": "OpenJourney",
50292
- "model_b": "FluxTimestep",
50293
  "winner": "tie",
50294
  "judge": "arena_user_10.16.22.62",
50295
  "anony": true,
@@ -50392,7 +50392,7 @@
50392
  "tstamp": 1723338245.5496
50393
  },
50394
  {
50395
- "model_a": "FluxTimestep",
50396
  "model_b": "SDXLTurbo",
50397
  "winner": "model_a",
50398
  "judge": "arena_user_10.16.43.145",
@@ -50416,7 +50416,7 @@
50416
  "tstamp": 1723338272.1677
50417
  },
50418
  {
50419
- "model_a": "FluxGuidance",
50420
  "model_b": "SD3",
50421
  "winner": "model_a",
50422
  "judge": "arena_user_10.16.17.24",
@@ -50513,7 +50513,7 @@
50513
  },
50514
  {
50515
  "model_a": "SDXL",
50516
- "model_b": "FluxTimestep",
50517
  "winner": "model_b",
50518
  "judge": "arena_user_10.16.12.147",
50519
  "anony": false,
@@ -50576,7 +50576,7 @@
50576
  "tstamp": 1723416140.7059
50577
  },
50578
  {
50579
- "model_a": "FluxTimestep",
50580
  "model_b": "HunyuanDiT",
50581
  "winner": "model_a",
50582
  "judge": "arena_user_10.16.22.62",
@@ -50601,7 +50601,7 @@
50601
  },
50602
  {
50603
  "model_a": "HunyuanDiT",
50604
- "model_b": "FluxGuidance",
50605
  "winner": "model_b",
50606
  "judge": "arena_user_10.16.36.191",
50607
  "anony": true,
@@ -50617,14 +50617,14 @@
50617
  },
50618
  {
50619
  "model_a": "AuraFlow",
50620
- "model_b": "FluxGuidance",
50621
  "winner": "model_b",
50622
  "judge": "arena_user_10.16.12.147",
50623
  "anony": true,
50624
  "tstamp": 1723466162.8794
50625
  },
50626
  {
50627
- "model_a": "FluxGuidance",
50628
  "model_b": "OpenJourney",
50629
  "winner": "model_a",
50630
  "judge": "arena_user_10.16.45.228",
@@ -50640,8 +50640,8 @@
50640
  "tstamp": 1723481690.3525
50641
  },
50642
  {
50643
- "model_a": "FluxGuidance",
50644
- "model_b": "FluxTimestep",
50645
  "winner": "model_a",
50646
  "judge": "arena_user_10.16.45.228",
50647
  "anony": true,
@@ -50656,7 +50656,7 @@
50656
  "tstamp": 1723510064.126
50657
  },
50658
  {
50659
- "model_a": "FluxGuidance",
50660
  "model_b": "SDXLTurbo",
50661
  "winner": "model_b",
50662
  "judge": "arena_user_10.16.17.24",
@@ -50665,7 +50665,7 @@
50665
  },
50666
  {
50667
  "model_a": "PixArtAlpha",
50668
- "model_b": "FluxTimestep",
50669
  "winner": "tie (bothbad)",
50670
  "judge": "arena_user_10.16.22.62",
50671
  "anony": true,
@@ -50697,7 +50697,7 @@
50697
  },
50698
  {
50699
  "model_a": "HunyuanDiT",
50700
- "model_b": "FluxGuidance",
50701
  "winner": "model_b",
50702
  "judge": "arena_user_10.16.22.62",
50703
  "anony": true,
@@ -50768,7 +50768,7 @@
50768
  "tstamp": 1723521805.5654
50769
  },
50770
  {
50771
- "model_a": "FluxTimestep",
50772
  "model_b": "StableCascade",
50773
  "winner": "model_a",
50774
  "judge": "arena_user_10.16.12.147",
@@ -50777,7 +50777,7 @@
50777
  },
50778
  {
50779
  "model_a": "SDXL",
50780
- "model_b": "FluxGuidance",
50781
  "winner": "model_b",
50782
  "judge": "arena_user_10.16.36.191",
50783
  "anony": true,
@@ -50785,7 +50785,7 @@
50785
  },
50786
  {
50787
  "model_a": "AuraFlow",
50788
- "model_b": "FluxGuidance",
50789
  "winner": "model_b",
50790
  "judge": "arena_user_10.16.45.228",
50791
  "anony": true,
@@ -50848,7 +50848,7 @@
50848
  "tstamp": 1723526723.0377
50849
  },
50850
  {
50851
- "model_a": "FluxTimestep",
50852
  "model_b": "PlayGround V2.5",
50853
  "winner": "model_a",
50854
  "judge": "arena_user_10.16.17.24",
@@ -50872,7 +50872,7 @@
50872
  "tstamp": 1723568683.2572
50873
  },
50874
  {
50875
- "model_a": "FluxGuidance",
50876
  "model_b": "PlayGround V2.5",
50877
  "winner": "model_b",
50878
  "judge": "arena_user_10.16.18.162",
@@ -50897,7 +50897,7 @@
50897
  },
50898
  {
50899
  "model_a": "Kolors",
50900
- "model_b": "FluxGuidance",
50901
  "winner": "tie",
50902
  "judge": "arena_user_10.16.2.60",
50903
  "anony": true,
@@ -50928,7 +50928,7 @@
50928
  "tstamp": 1723644206.2483
50929
  },
50930
  {
50931
- "model_a": "FluxTimestep",
50932
  "model_b": "SDXL",
50933
  "winner": "model_a",
50934
  "judge": "arena_user_10.16.3.140",
@@ -51009,7 +51009,7 @@
51009
  },
51010
  {
51011
  "model_a": "SD3",
51012
- "model_b": "FluxTimestep",
51013
  "winner": "tie",
51014
  "judge": "arena_user_10.16.18.162",
51015
  "anony": true,
@@ -51041,14 +51041,14 @@
51041
  },
51042
  {
51043
  "model_a": "SDXLLightning",
51044
- "model_b": "FluxTimestep",
51045
  "winner": "model_a",
51046
  "judge": "arena_user_10.16.18.75",
51047
  "anony": true,
51048
  "tstamp": 1723694936.0013
51049
  },
51050
  {
51051
- "model_a": "FluxTimestep",
51052
  "model_b": "SDXLLightning",
51053
  "winner": "model_b",
51054
  "judge": "arena_user_10.16.18.75",
@@ -51080,7 +51080,7 @@
51080
  "tstamp": 1723764843.3515
51081
  },
51082
  {
51083
- "model_a": "FluxTimestep",
51084
  "model_b": "SDXLTurbo",
51085
  "winner": "model_b",
51086
  "judge": "arena_user_10.16.18.75",
@@ -51088,7 +51088,7 @@
51088
  "tstamp": 1723764855.5548
51089
  },
51090
  {
51091
- "model_a": "FluxTimestep",
51092
  "model_b": "PixArtSigma",
51093
  "winner": "model_b",
51094
  "judge": "arena_user_10.16.1.165",
@@ -51104,7 +51104,7 @@
51104
  "tstamp": 1723764889.9278
51105
  },
51106
  {
51107
- "model_a": "FluxTimestep",
51108
  "model_b": "SD3",
51109
  "winner": "tie (bothbad)",
51110
  "judge": "arena_user_10.16.18.75",
@@ -51129,7 +51129,7 @@
51129
  },
51130
  {
51131
  "model_a": "Kolors",
51132
- "model_b": "FluxTimestep",
51133
  "winner": "tie",
51134
  "judge": "arena_user_10.16.18.75",
51135
  "anony": true,
@@ -51161,7 +51161,7 @@
51161
  },
51162
  {
51163
  "model_a": "PixArtAlpha",
51164
- "model_b": "FluxTimestep",
51165
  "winner": "model_a",
51166
  "judge": "arena_user_10.16.18.162",
51167
  "anony": true,
@@ -51192,7 +51192,7 @@
51192
  "tstamp": 1723787634.5486
51193
  },
51194
  {
51195
- "model_a": "FluxTimestep",
51196
  "model_b": "SDXL",
51197
  "winner": "model_a",
51198
  "judge": "arena_user_10.16.1.165",
@@ -51209,7 +51209,7 @@
51209
  },
51210
  {
51211
  "model_a": "SDXL",
51212
- "model_b": "FluxTimestep",
51213
  "winner": "model_b",
51214
  "judge": "arena_user_10.16.34.60",
51215
  "anony": true,
@@ -51224,7 +51224,7 @@
51224
  "tstamp": 1723814629.9803
51225
  },
51226
  {
51227
- "model_a": "FluxTimestep",
51228
  "model_b": "SDXLLightning",
51229
  "winner": "model_a",
51230
  "judge": "arena_user_10.16.34.60",
@@ -51240,7 +51240,7 @@
51240
  "tstamp": 1723824350.2469
51241
  },
51242
  {
51243
- "model_a": "FluxGuidance",
51244
  "model_b": "AuraFlow",
51245
  "winner": "model_a",
51246
  "judge": "arena_user_10.16.18.75",
@@ -51248,7 +51248,7 @@
51248
  "tstamp": 1723824360.0778
51249
  },
51250
  {
51251
- "model_a": "FluxGuidance",
51252
  "model_b": "PixArtSigma",
51253
  "winner": "model_a",
51254
  "judge": "arena_user_10.16.34.60",
@@ -51288,7 +51288,7 @@
51288
  "tstamp": 1723838955.3114
51289
  },
51290
  {
51291
- "model_a": "FluxTimestep",
51292
  "model_b": "OpenJourney",
51293
  "winner": "model_a",
51294
  "judge": "arena_user_10.16.18.75",
@@ -51368,7 +51368,7 @@
51368
  "tstamp": 1723839891.4319
51369
  },
51370
  {
51371
- "model_a": "FluxTimestep",
51372
  "model_b": "SDXLLightning",
51373
  "winner": "model_b",
51374
  "judge": "arena_user_10.16.34.60",
@@ -51376,7 +51376,7 @@
51376
  "tstamp": 1723839938.2449
51377
  },
51378
  {
51379
- "model_a": "FluxTimestep",
51380
  "model_b": "SDXL",
51381
  "winner": "model_a",
51382
  "judge": "arena_user_10.16.18.162",
@@ -51401,15 +51401,15 @@
51401
  },
51402
  {
51403
  "model_a": "AuraFlow",
51404
- "model_b": "FluxTimestep",
51405
  "winner": "model_a",
51406
  "judge": "arena_user_10.16.34.60",
51407
  "anony": true,
51408
  "tstamp": 1723840344.8034
51409
  },
51410
  {
51411
- "model_a": "FluxTimestep",
51412
- "model_b": "FluxGuidance",
51413
  "winner": "tie",
51414
  "judge": "arena_user_10.16.18.75",
51415
  "anony": true,
@@ -51417,7 +51417,7 @@
51417
  },
51418
  {
51419
  "model_a": "AuraFlow",
51420
- "model_b": "FluxGuidance",
51421
  "winner": "model_a",
51422
  "judge": "arena_user_10.16.34.60",
51423
  "anony": true,
@@ -51441,7 +51441,7 @@
51441
  },
51442
  {
51443
  "model_a": "Kolors",
51444
- "model_b": "FluxTimestep",
51445
  "winner": "tie (bothbad)",
51446
  "judge": "arena_user_10.16.18.75",
51447
  "anony": true,
@@ -51480,7 +51480,7 @@
51480
  "tstamp": 1723855363.9435
51481
  },
51482
  {
51483
- "model_a": "FluxGuidance",
51484
  "model_b": "SDXLTurbo",
51485
  "winner": "tie",
51486
  "judge": "arena_user_10.16.34.60",
@@ -51536,8 +51536,8 @@
51536
  "tstamp": 1723855411.5431
51537
  },
51538
  {
51539
- "model_a": "FluxGuidance",
51540
- "model_b": "FluxTimestep",
51541
  "winner": "model_a",
51542
  "judge": "arena_user_10.16.18.162",
51543
  "anony": true,
@@ -51577,7 +51577,7 @@
51577
  },
51578
  {
51579
  "model_a": "AuraFlow",
51580
- "model_b": "FluxTimestep",
51581
  "winner": "model_b",
51582
  "judge": "arena_user_10.16.34.60",
51583
  "anony": true,
@@ -51585,7 +51585,7 @@
51585
  },
51586
  {
51587
  "model_a": "Kolors",
51588
- "model_b": "FluxGuidance",
51589
  "winner": "tie",
51590
  "judge": "arena_user_10.16.34.60",
51591
  "anony": true,
@@ -51641,7 +51641,7 @@
51641
  },
51642
  {
51643
  "model_a": "SDXLTurbo",
51644
- "model_b": "FluxTimestep",
51645
  "winner": "model_a",
51646
  "judge": "arena_user_10.16.34.60",
51647
  "anony": true,
@@ -51656,7 +51656,7 @@
51656
  "tstamp": 1723855483.6681
51657
  },
51658
  {
51659
- "model_a": "FluxTimestep",
51660
  "model_b": "OpenJourney",
51661
  "winner": "model_a",
51662
  "judge": "arena_user_10.16.18.162",
@@ -51665,7 +51665,7 @@
51665
  },
51666
  {
51667
  "model_a": "SDXL",
51668
- "model_b": "FluxGuidance",
51669
  "winner": "model_b",
51670
  "judge": "arena_user_10.16.18.162",
51671
  "anony": true,
@@ -51712,7 +51712,7 @@
51712
  "tstamp": 1723855518.1443
51713
  },
51714
  {
51715
- "model_a": "FluxTimestep",
51716
  "model_b": "AuraFlow",
51717
  "winner": "tie",
51718
  "judge": "arena_user_10.16.18.162",
@@ -51728,7 +51728,7 @@
51728
  "tstamp": 1723855533.5625
51729
  },
51730
  {
51731
- "model_a": "FluxGuidance",
51732
  "model_b": "SD3",
51733
  "winner": "model_a",
51734
  "judge": "arena_user_10.16.34.60",
@@ -51745,7 +51745,7 @@
51745
  },
51746
  {
51747
  "model_a": "Kolors",
51748
- "model_b": "FluxGuidance",
51749
  "winner": "model_b",
51750
  "judge": "arena_user_10.16.18.162",
51751
  "anony": true,
@@ -51769,7 +51769,7 @@
51769
  },
51770
  {
51771
  "model_a": "SDXLLightning",
51772
- "model_b": "FluxTimestep",
51773
  "winner": "tie",
51774
  "judge": "arena_user_10.16.18.162",
51775
  "anony": true,
@@ -51792,7 +51792,7 @@
51792
  "tstamp": 1723855564.8518
51793
  },
51794
  {
51795
- "model_a": "FluxTimestep",
51796
  "model_b": "PixArtSigma",
51797
  "winner": "model_a",
51798
  "judge": "arena_user_10.16.18.75",
@@ -51833,7 +51833,7 @@
51833
  },
51834
  {
51835
  "model_a": "PlayGround V2.5",
51836
- "model_b": "FluxTimestep",
51837
  "winner": "model_a",
51838
  "judge": "arena_user_10.16.18.162",
51839
  "anony": true,
@@ -51841,7 +51841,7 @@
51841
  },
51842
  {
51843
  "model_a": "PixArtAlpha",
51844
- "model_b": "FluxTimestep",
51845
  "winner": "model_b",
51846
  "judge": "arena_user_10.16.18.75",
51847
  "anony": true,
@@ -51849,7 +51849,7 @@
51849
  },
51850
  {
51851
  "model_a": "PlayGround V2.5",
51852
- "model_b": "FluxGuidance",
51853
  "winner": "model_a",
51854
  "judge": "arena_user_10.16.34.60",
51855
  "anony": true,
@@ -51865,7 +51865,7 @@
51865
  },
51866
  {
51867
  "model_a": "PlayGround V2.5",
51868
- "model_b": "FluxGuidance",
51869
  "winner": "tie",
51870
  "judge": "arena_user_10.16.18.75",
51871
  "anony": true,
@@ -51881,14 +51881,14 @@
51881
  },
51882
  {
51883
  "model_a": "HunyuanDiT",
51884
- "model_b": "FluxGuidance",
51885
  "winner": "model_a",
51886
  "judge": "arena_user_10.16.18.75",
51887
  "anony": true,
51888
  "tstamp": 1723855622.7164
51889
  },
51890
  {
51891
- "model_a": "FluxTimestep",
51892
  "model_b": "SD3",
51893
  "winner": "tie (bothbad)",
51894
  "judge": "arena_user_10.16.18.75",
@@ -51913,7 +51913,7 @@
51913
  },
51914
  {
51915
  "model_a": "Kolors",
51916
- "model_b": "FluxTimestep",
51917
  "winner": "tie (bothbad)",
51918
  "judge": "arena_user_10.16.18.75",
51919
  "anony": true,
@@ -52057,7 +52057,7 @@
52057
  },
52058
  {
52059
  "model_a": "PlayGround V2.5",
52060
- "model_b": "FluxGuidance",
52061
  "winner": "model_a",
52062
  "judge": "arena_user_10.16.18.162",
52063
  "anony": true,
@@ -52072,7 +52072,7 @@
52072
  "tstamp": 1723876446.6019
52073
  },
52074
  {
52075
- "model_a": "FluxTimestep",
52076
  "model_b": "PlayGround V2.5",
52077
  "winner": "model_b",
52078
  "judge": "arena_user_10.16.18.162",
@@ -52168,11 +52168,243 @@
52168
  "tstamp": 1723908029.3549
52169
  },
52170
  {
52171
- "model_a": "FluxGuidance",
52172
- "model_b": "FluxTimestep",
52173
  "winner": "tie",
52174
  "judge": "arena_user_10.16.18.75",
52175
  "anony": true,
52176
  "tstamp": 1723908074.195
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
52177
  }
52178
  ]
 
49848
  "tstamp": 1723054634.5468
49849
  },
49850
  {
49851
+ "model_a": "FLUX1dev",
49852
+ "model_b": "FLUX1schnell",
49853
  "winner": "model_b",
49854
  "judge": "arena_user_10.16.12.147",
49855
  "anony": true,
 
49880
  "tstamp": 1723063074.7642
49881
  },
49882
  {
49883
+ "model_a": "FLUX1schnell",
49884
+ "model_b": "FLUX1dev",
49885
  "winner": "model_b",
49886
  "judge": "arena_user_10.16.14.231",
49887
  "anony": true,
 
49897
  },
49898
  {
49899
  "model_a": "AuraFlow",
49900
+ "model_b": "FLUX1dev",
49901
  "winner": "model_b",
49902
  "judge": "arena_user_10.16.31.28",
49903
  "anony": false,
49904
  "tstamp": 1723067240.2924
49905
  },
49906
  {
49907
+ "model_a": "FLUX1schnell",
49908
  "model_b": "SDXLLightning",
49909
  "winner": "model_a",
49910
  "judge": "arena_user_10.16.43.145",
 
49920
  "tstamp": 1723078808.7741
49921
  },
49922
  {
49923
+ "model_a": "FLUX1schnell",
49924
+ "model_b": "FLUX1dev",
49925
  "winner": "tie (bothbad)",
49926
  "judge": "arena_user_10.16.31.28",
49927
  "anony": false,
49928
  "tstamp": 1723080943.3647
49929
  },
49930
  {
49931
+ "model_a": "FLUX1schnell",
49932
+ "model_b": "FLUX1dev",
49933
  "winner": "tie (bothbad)",
49934
  "judge": "arena_user_10.16.12.147",
49935
  "anony": false,
 
50016
  "tstamp": 1723160130.8681
50017
  },
50018
  {
50019
+ "model_a": "FLUX1schnell",
50020
  "model_b": "SDXLLightning",
50021
  "winner": "model_a",
50022
  "judge": "arena_user_10.16.17.24",
 
50057
  },
50058
  {
50059
  "model_a": "PixArtAlpha",
50060
+ "model_b": "FLUX1dev",
50061
  "winner": "tie",
50062
  "judge": "arena_user_10.16.43.145",
50063
  "anony": true,
 
50080
  "tstamp": 1723160326.9647
50081
  },
50082
  {
50083
+ "model_a": "FLUX1schnell",
50084
  "model_b": "PlayGround V2.5",
50085
  "winner": "model_a",
50086
  "judge": "arena_user_10.16.22.62",
 
50088
  "tstamp": 1723165134.1363
50089
  },
50090
  {
50091
+ "model_a": "FLUX1dev",
50092
+ "model_b": "FLUX1schnell",
50093
  "winner": "model_a",
50094
  "judge": "arena_user_10.16.22.62",
50095
  "anony": true,
 
50105
  },
50106
  {
50107
  "model_a": "OpenJourney",
50108
+ "model_b": "FLUX1dev",
50109
  "winner": "model_b",
50110
  "judge": "arena_user_10.16.43.145",
50111
  "anony": true,
 
50128
  "tstamp": 1723186558.1923
50129
  },
50130
  {
50131
+ "model_a": "FLUX1dev",
50132
  "model_b": "StableCascade",
50133
  "winner": "tie",
50134
  "judge": "arena_user_10.16.43.145",
 
50144
  "tstamp": 1723186599.4345
50145
  },
50146
  {
50147
+ "model_a": "FLUX1schnell",
50148
  "model_b": "SD3",
50149
  "winner": "model_a",
50150
  "judge": "arena_user_10.16.22.62",
 
50169
  },
50170
  {
50171
  "model_a": "AuraFlow",
50172
+ "model_b": "FLUX1schnell",
50173
  "winner": "model_b",
50174
  "judge": "arena_user_10.16.43.145",
50175
  "anony": true,
50176
  "tstamp": 1723203750.3175
50177
  },
50178
  {
50179
+ "model_a": "FLUX1schnell",
50180
  "model_b": "Kolors",
50181
  "winner": "tie (bothbad)",
50182
  "judge": "arena_user_10.16.22.62",
 
50208
  "tstamp": 1723206395.3717
50209
  },
50210
  {
50211
+ "model_a": "FLUX1schnell",
50212
  "model_b": "StableCascade",
50213
  "winner": "model_a",
50214
  "judge": "arena_user_10.16.12.147",
 
50225
  },
50226
  {
50227
  "model_a": "PixArtSigma",
50228
+ "model_b": "FLUX1dev",
50229
  "winner": "model_b",
50230
  "judge": "arena_user_10.16.43.250",
50231
  "anony": true,
50232
  "tstamp": 1723206430.7406
50233
  },
50234
  {
50235
+ "model_a": "FLUX1schnell",
50236
  "model_b": "SDXLTurbo",
50237
  "winner": "model_a",
50238
  "judge": "arena_user_10.16.43.145",
 
50248
  "tstamp": 1723224658.8908
50249
  },
50250
  {
50251
+ "model_a": "FLUX1dev",
50252
+ "model_b": "FLUX1schnell",
50253
  "winner": "model_a",
50254
  "judge": "arena_user_10.16.36.191",
50255
  "anony": false,
50256
  "tstamp": 1723232348.385
50257
  },
50258
  {
50259
+ "model_a": "FLUX1schnell",
50260
+ "model_b": "FLUX1dev",
50261
  "winner": "model_b",
50262
  "judge": "arena_user_10.16.36.191",
50263
  "anony": false,
 
50289
  },
50290
  {
50291
  "model_a": "OpenJourney",
50292
+ "model_b": "FLUX1schnell",
50293
  "winner": "tie",
50294
  "judge": "arena_user_10.16.22.62",
50295
  "anony": true,
 
50392
  "tstamp": 1723338245.5496
50393
  },
50394
  {
50395
+ "model_a": "FLUX1schnell",
50396
  "model_b": "SDXLTurbo",
50397
  "winner": "model_a",
50398
  "judge": "arena_user_10.16.43.145",
 
50416
  "tstamp": 1723338272.1677
50417
  },
50418
  {
50419
+ "model_a": "FLUX1dev",
50420
  "model_b": "SD3",
50421
  "winner": "model_a",
50422
  "judge": "arena_user_10.16.17.24",
 
50513
  },
50514
  {
50515
  "model_a": "SDXL",
50516
+ "model_b": "FLUX1schnell",
50517
  "winner": "model_b",
50518
  "judge": "arena_user_10.16.12.147",
50519
  "anony": false,
 
50576
  "tstamp": 1723416140.7059
50577
  },
50578
  {
50579
+ "model_a": "FLUX1schnell",
50580
  "model_b": "HunyuanDiT",
50581
  "winner": "model_a",
50582
  "judge": "arena_user_10.16.22.62",
 
50601
  },
50602
  {
50603
  "model_a": "HunyuanDiT",
50604
+ "model_b": "FLUX1dev",
50605
  "winner": "model_b",
50606
  "judge": "arena_user_10.16.36.191",
50607
  "anony": true,
 
50617
  },
50618
  {
50619
  "model_a": "AuraFlow",
50620
+ "model_b": "FLUX1dev",
50621
  "winner": "model_b",
50622
  "judge": "arena_user_10.16.12.147",
50623
  "anony": true,
50624
  "tstamp": 1723466162.8794
50625
  },
50626
  {
50627
+ "model_a": "FLUX1dev",
50628
  "model_b": "OpenJourney",
50629
  "winner": "model_a",
50630
  "judge": "arena_user_10.16.45.228",
 
50640
  "tstamp": 1723481690.3525
50641
  },
50642
  {
50643
+ "model_a": "FLUX1dev",
50644
+ "model_b": "FLUX1schnell",
50645
  "winner": "model_a",
50646
  "judge": "arena_user_10.16.45.228",
50647
  "anony": true,
 
50656
  "tstamp": 1723510064.126
50657
  },
50658
  {
50659
+ "model_a": "FLUX1dev",
50660
  "model_b": "SDXLTurbo",
50661
  "winner": "model_b",
50662
  "judge": "arena_user_10.16.17.24",
 
50665
  },
50666
  {
50667
  "model_a": "PixArtAlpha",
50668
+ "model_b": "FLUX1schnell",
50669
  "winner": "tie (bothbad)",
50670
  "judge": "arena_user_10.16.22.62",
50671
  "anony": true,
 
50697
  },
50698
  {
50699
  "model_a": "HunyuanDiT",
50700
+ "model_b": "FLUX1dev",
50701
  "winner": "model_b",
50702
  "judge": "arena_user_10.16.22.62",
50703
  "anony": true,
 
50768
  "tstamp": 1723521805.5654
50769
  },
50770
  {
50771
+ "model_a": "FLUX1schnell",
50772
  "model_b": "StableCascade",
50773
  "winner": "model_a",
50774
  "judge": "arena_user_10.16.12.147",
 
50777
  },
50778
  {
50779
  "model_a": "SDXL",
50780
+ "model_b": "FLUX1dev",
50781
  "winner": "model_b",
50782
  "judge": "arena_user_10.16.36.191",
50783
  "anony": true,
 
50785
  },
50786
  {
50787
  "model_a": "AuraFlow",
50788
+ "model_b": "FLUX1dev",
50789
  "winner": "model_b",
50790
  "judge": "arena_user_10.16.45.228",
50791
  "anony": true,
 
50848
  "tstamp": 1723526723.0377
50849
  },
50850
  {
50851
+ "model_a": "FLUX1schnell",
50852
  "model_b": "PlayGround V2.5",
50853
  "winner": "model_a",
50854
  "judge": "arena_user_10.16.17.24",
 
50872
  "tstamp": 1723568683.2572
50873
  },
50874
  {
50875
+ "model_a": "FLUX1dev",
50876
  "model_b": "PlayGround V2.5",
50877
  "winner": "model_b",
50878
  "judge": "arena_user_10.16.18.162",
 
50897
  },
50898
  {
50899
  "model_a": "Kolors",
50900
+ "model_b": "FLUX1dev",
50901
  "winner": "tie",
50902
  "judge": "arena_user_10.16.2.60",
50903
  "anony": true,
 
50928
  "tstamp": 1723644206.2483
50929
  },
50930
  {
50931
+ "model_a": "FLUX1schnell",
50932
  "model_b": "SDXL",
50933
  "winner": "model_a",
50934
  "judge": "arena_user_10.16.3.140",
 
51009
  },
51010
  {
51011
  "model_a": "SD3",
51012
+ "model_b": "FLUX1schnell",
51013
  "winner": "tie",
51014
  "judge": "arena_user_10.16.18.162",
51015
  "anony": true,
 
51041
  },
51042
  {
51043
  "model_a": "SDXLLightning",
51044
+ "model_b": "FLUX1schnell",
51045
  "winner": "model_a",
51046
  "judge": "arena_user_10.16.18.75",
51047
  "anony": true,
51048
  "tstamp": 1723694936.0013
51049
  },
51050
  {
51051
+ "model_a": "FLUX1schnell",
51052
  "model_b": "SDXLLightning",
51053
  "winner": "model_b",
51054
  "judge": "arena_user_10.16.18.75",
 
51080
  "tstamp": 1723764843.3515
51081
  },
51082
  {
51083
+ "model_a": "FLUX1schnell",
51084
  "model_b": "SDXLTurbo",
51085
  "winner": "model_b",
51086
  "judge": "arena_user_10.16.18.75",
 
51088
  "tstamp": 1723764855.5548
51089
  },
51090
  {
51091
+ "model_a": "FLUX1schnell",
51092
  "model_b": "PixArtSigma",
51093
  "winner": "model_b",
51094
  "judge": "arena_user_10.16.1.165",
 
51104
  "tstamp": 1723764889.9278
51105
  },
51106
  {
51107
+ "model_a": "FLUX1schnell",
51108
  "model_b": "SD3",
51109
  "winner": "tie (bothbad)",
51110
  "judge": "arena_user_10.16.18.75",
 
51129
  },
51130
  {
51131
  "model_a": "Kolors",
51132
+ "model_b": "FLUX1schnell",
51133
  "winner": "tie",
51134
  "judge": "arena_user_10.16.18.75",
51135
  "anony": true,
 
51161
  },
51162
  {
51163
  "model_a": "PixArtAlpha",
51164
+ "model_b": "FLUX1schnell",
51165
  "winner": "model_a",
51166
  "judge": "arena_user_10.16.18.162",
51167
  "anony": true,
 
51192
  "tstamp": 1723787634.5486
51193
  },
51194
  {
51195
+ "model_a": "FLUX1schnell",
51196
  "model_b": "SDXL",
51197
  "winner": "model_a",
51198
  "judge": "arena_user_10.16.1.165",
 
51209
  },
51210
  {
51211
  "model_a": "SDXL",
51212
+ "model_b": "FLUX1schnell",
51213
  "winner": "model_b",
51214
  "judge": "arena_user_10.16.34.60",
51215
  "anony": true,
 
51224
  "tstamp": 1723814629.9803
51225
  },
51226
  {
51227
+ "model_a": "FLUX1schnell",
51228
  "model_b": "SDXLLightning",
51229
  "winner": "model_a",
51230
  "judge": "arena_user_10.16.34.60",
 
51240
  "tstamp": 1723824350.2469
51241
  },
51242
  {
51243
+ "model_a": "FLUX1dev",
51244
  "model_b": "AuraFlow",
51245
  "winner": "model_a",
51246
  "judge": "arena_user_10.16.18.75",
 
51248
  "tstamp": 1723824360.0778
51249
  },
51250
  {
51251
+ "model_a": "FLUX1dev",
51252
  "model_b": "PixArtSigma",
51253
  "winner": "model_a",
51254
  "judge": "arena_user_10.16.34.60",
 
51288
  "tstamp": 1723838955.3114
51289
  },
51290
  {
51291
+ "model_a": "FLUX1schnell",
51292
  "model_b": "OpenJourney",
51293
  "winner": "model_a",
51294
  "judge": "arena_user_10.16.18.75",
 
51368
  "tstamp": 1723839891.4319
51369
  },
51370
  {
51371
+ "model_a": "FLUX1schnell",
51372
  "model_b": "SDXLLightning",
51373
  "winner": "model_b",
51374
  "judge": "arena_user_10.16.34.60",
 
51376
  "tstamp": 1723839938.2449
51377
  },
51378
  {
51379
+ "model_a": "FLUX1schnell",
51380
  "model_b": "SDXL",
51381
  "winner": "model_a",
51382
  "judge": "arena_user_10.16.18.162",
 
51401
  },
51402
  {
51403
  "model_a": "AuraFlow",
51404
+ "model_b": "FLUX1schnell",
51405
  "winner": "model_a",
51406
  "judge": "arena_user_10.16.34.60",
51407
  "anony": true,
51408
  "tstamp": 1723840344.8034
51409
  },
51410
  {
51411
+ "model_a": "FLUX1schnell",
51412
+ "model_b": "FLUX1dev",
51413
  "winner": "tie",
51414
  "judge": "arena_user_10.16.18.75",
51415
  "anony": true,
 
51417
  },
51418
  {
51419
  "model_a": "AuraFlow",
51420
+ "model_b": "FLUX1dev",
51421
  "winner": "model_a",
51422
  "judge": "arena_user_10.16.34.60",
51423
  "anony": true,
 
51441
  },
51442
  {
51443
  "model_a": "Kolors",
51444
+ "model_b": "FLUX1schnell",
51445
  "winner": "tie (bothbad)",
51446
  "judge": "arena_user_10.16.18.75",
51447
  "anony": true,
 
51480
  "tstamp": 1723855363.9435
51481
  },
51482
  {
51483
+ "model_a": "FLUX1dev",
51484
  "model_b": "SDXLTurbo",
51485
  "winner": "tie",
51486
  "judge": "arena_user_10.16.34.60",
 
51536
  "tstamp": 1723855411.5431
51537
  },
51538
  {
51539
+ "model_a": "FLUX1dev",
51540
+ "model_b": "FLUX1schnell",
51541
  "winner": "model_a",
51542
  "judge": "arena_user_10.16.18.162",
51543
  "anony": true,
 
51577
  },
51578
  {
51579
  "model_a": "AuraFlow",
51580
+ "model_b": "FLUX1schnell",
51581
  "winner": "model_b",
51582
  "judge": "arena_user_10.16.34.60",
51583
  "anony": true,
 
51585
  },
51586
  {
51587
  "model_a": "Kolors",
51588
+ "model_b": "FLUX1dev",
51589
  "winner": "tie",
51590
  "judge": "arena_user_10.16.34.60",
51591
  "anony": true,
 
51641
  },
51642
  {
51643
  "model_a": "SDXLTurbo",
51644
+ "model_b": "FLUX1schnell",
51645
  "winner": "model_a",
51646
  "judge": "arena_user_10.16.34.60",
51647
  "anony": true,
 
51656
  "tstamp": 1723855483.6681
51657
  },
51658
  {
51659
+ "model_a": "FLUX1schnell",
51660
  "model_b": "OpenJourney",
51661
  "winner": "model_a",
51662
  "judge": "arena_user_10.16.18.162",
 
51665
  },
51666
  {
51667
  "model_a": "SDXL",
51668
+ "model_b": "FLUX1dev",
51669
  "winner": "model_b",
51670
  "judge": "arena_user_10.16.18.162",
51671
  "anony": true,
 
51712
  "tstamp": 1723855518.1443
51713
  },
51714
  {
51715
+ "model_a": "FLUX1schnell",
51716
  "model_b": "AuraFlow",
51717
  "winner": "tie",
51718
  "judge": "arena_user_10.16.18.162",
 
51728
  "tstamp": 1723855533.5625
51729
  },
51730
  {
51731
+ "model_a": "FLUX1dev",
51732
  "model_b": "SD3",
51733
  "winner": "model_a",
51734
  "judge": "arena_user_10.16.34.60",
 
51745
  },
51746
  {
51747
  "model_a": "Kolors",
51748
+ "model_b": "FLUX1dev",
51749
  "winner": "model_b",
51750
  "judge": "arena_user_10.16.18.162",
51751
  "anony": true,
 
51769
  },
51770
  {
51771
  "model_a": "SDXLLightning",
51772
+ "model_b": "FLUX1schnell",
51773
  "winner": "tie",
51774
  "judge": "arena_user_10.16.18.162",
51775
  "anony": true,
 
51792
  "tstamp": 1723855564.8518
51793
  },
51794
  {
51795
+ "model_a": "FLUX1schnell",
51796
  "model_b": "PixArtSigma",
51797
  "winner": "model_a",
51798
  "judge": "arena_user_10.16.18.75",
 
51833
  },
51834
  {
51835
  "model_a": "PlayGround V2.5",
51836
+ "model_b": "FLUX1schnell",
51837
  "winner": "model_a",
51838
  "judge": "arena_user_10.16.18.162",
51839
  "anony": true,
 
51841
  },
51842
  {
51843
  "model_a": "PixArtAlpha",
51844
+ "model_b": "FLUX1schnell",
51845
  "winner": "model_b",
51846
  "judge": "arena_user_10.16.18.75",
51847
  "anony": true,
 
51849
  },
51850
  {
51851
  "model_a": "PlayGround V2.5",
51852
+ "model_b": "FLUX1dev",
51853
  "winner": "model_a",
51854
  "judge": "arena_user_10.16.34.60",
51855
  "anony": true,
 
51865
  },
51866
  {
51867
  "model_a": "PlayGround V2.5",
51868
+ "model_b": "FLUX1dev",
51869
  "winner": "tie",
51870
  "judge": "arena_user_10.16.18.75",
51871
  "anony": true,
 
51881
  },
51882
  {
51883
  "model_a": "HunyuanDiT",
51884
+ "model_b": "FLUX1dev",
51885
  "winner": "model_a",
51886
  "judge": "arena_user_10.16.18.75",
51887
  "anony": true,
51888
  "tstamp": 1723855622.7164
51889
  },
51890
  {
51891
+ "model_a": "FLUX1schnell",
51892
  "model_b": "SD3",
51893
  "winner": "tie (bothbad)",
51894
  "judge": "arena_user_10.16.18.75",
 
51913
  },
51914
  {
51915
  "model_a": "Kolors",
51916
+ "model_b": "FLUX1schnell",
51917
  "winner": "tie (bothbad)",
51918
  "judge": "arena_user_10.16.18.75",
51919
  "anony": true,
 
52057
  },
52058
  {
52059
  "model_a": "PlayGround V2.5",
52060
+ "model_b": "FLUX1dev",
52061
  "winner": "model_a",
52062
  "judge": "arena_user_10.16.18.162",
52063
  "anony": true,
 
52072
  "tstamp": 1723876446.6019
52073
  },
52074
  {
52075
+ "model_a": "FLUX1schnell",
52076
  "model_b": "PlayGround V2.5",
52077
  "winner": "model_b",
52078
  "judge": "arena_user_10.16.18.162",
 
52168
  "tstamp": 1723908029.3549
52169
  },
52170
  {
52171
+ "model_a": "FLUX1dev",
52172
+ "model_b": "FLUX1schnell",
52173
  "winner": "tie",
52174
  "judge": "arena_user_10.16.18.75",
52175
  "anony": true,
52176
  "tstamp": 1723908074.195
52177
+ },
52178
+ {
52179
+ "model_a": "OpenJourney",
52180
+ "model_b": "FLUX1dev",
52181
+ "winner": "model_a",
52182
+ "judge": "arena_user_10.16.18.162",
52183
+ "anony": true,
52184
+ "tstamp": 1723910785.0692
52185
+ },
52186
+ {
52187
+ "model_a": "SDXLTurbo",
52188
+ "model_b": "AuraFlow",
52189
+ "winner": "model_a",
52190
+ "judge": "arena_user_10.16.18.162",
52191
+ "anony": true,
52192
+ "tstamp": 1723922566.9706
52193
+ },
52194
+ {
52195
+ "model_a": "StableCascade",
52196
+ "model_b": "SDXLTurbo",
52197
+ "winner": "tie (bothbad)",
52198
+ "judge": "arena_user_10.16.1.165",
52199
+ "anony": true,
52200
+ "tstamp": 1723922575.0171
52201
+ },
52202
+ {
52203
+ "model_a": "PixArtSigma",
52204
+ "model_b": "Kolors",
52205
+ "winner": "tie (bothbad)",
52206
+ "judge": "arena_user_10.16.18.162",
52207
+ "anony": true,
52208
+ "tstamp": 1723922584.553
52209
+ },
52210
+ {
52211
+ "model_a": "SDXLTurbo",
52212
+ "model_b": "StableCascade",
52213
+ "winner": "model_b",
52214
+ "judge": "arena_user_10.16.18.162",
52215
+ "anony": true,
52216
+ "tstamp": 1723922593.6921
52217
+ },
52218
+ {
52219
+ "model_a": "FLUX1schnell",
52220
+ "model_b": "PixArtAlpha",
52221
+ "winner": "model_b",
52222
+ "judge": "arena_user_10.16.18.162",
52223
+ "anony": true,
52224
+ "tstamp": 1723922618.7522
52225
+ },
52226
+ {
52227
+ "model_a": "StableCascade",
52228
+ "model_b": "PixArtSigma",
52229
+ "winner": "model_a",
52230
+ "judge": "arena_user_10.16.18.162",
52231
+ "anony": true,
52232
+ "tstamp": 1723922626.6249
52233
+ },
52234
+ {
52235
+ "model_a": "SD3",
52236
+ "model_b": "SDXLTurbo",
52237
+ "winner": "model_b",
52238
+ "judge": "arena_user_10.16.18.162",
52239
+ "anony": true,
52240
+ "tstamp": 1723922643.7963
52241
+ },
52242
+ {
52243
+ "model_a": "Kolors",
52244
+ "model_b": "SDXLLightning",
52245
+ "winner": "model_b",
52246
+ "judge": "arena_user_10.16.18.75",
52247
+ "anony": true,
52248
+ "tstamp": 1723922667.2898
52249
+ },
52250
+ {
52251
+ "model_a": "FLUX1dev",
52252
+ "model_b": "SDXLTurbo",
52253
+ "winner": "model_a",
52254
+ "judge": "arena_user_10.16.18.162",
52255
+ "anony": true,
52256
+ "tstamp": 1723922745.1648
52257
+ },
52258
+ {
52259
+ "model_a": "Kolors",
52260
+ "model_b": "FLUX1schnell",
52261
+ "winner": "model_a",
52262
+ "judge": "arena_user_10.16.18.75",
52263
+ "anony": true,
52264
+ "tstamp": 1723922759.0787
52265
+ },
52266
+ {
52267
+ "model_a": "PlayGround V2.5",
52268
+ "model_b": "Kolors",
52269
+ "winner": "tie (bothbad)",
52270
+ "judge": "arena_user_10.16.18.162",
52271
+ "anony": true,
52272
+ "tstamp": 1723922767.444
52273
+ },
52274
+ {
52275
+ "model_a": "OpenJourney",
52276
+ "model_b": "PixArtSigma",
52277
+ "winner": "model_b",
52278
+ "judge": "arena_user_10.16.18.162",
52279
+ "anony": true,
52280
+ "tstamp": 1723922776.0625
52281
+ },
52282
+ {
52283
+ "model_a": "StableCascade",
52284
+ "model_b": "SDXLTurbo",
52285
+ "winner": "model_a",
52286
+ "judge": "arena_user_10.16.18.162",
52287
+ "anony": true,
52288
+ "tstamp": 1723922788.5956
52289
+ },
52290
+ {
52291
+ "model_a": "SDXLTurbo",
52292
+ "model_b": "SDXLLightning",
52293
+ "winner": "tie (bothbad)",
52294
+ "judge": "arena_user_10.16.18.162",
52295
+ "anony": true,
52296
+ "tstamp": 1723922800.3378
52297
+ },
52298
+ {
52299
+ "model_a": "SDXLTurbo",
52300
+ "model_b": "PixArtAlpha",
52301
+ "winner": "model_b",
52302
+ "judge": "arena_user_10.16.1.165",
52303
+ "anony": true,
52304
+ "tstamp": 1723922808.3497
52305
+ },
52306
+ {
52307
+ "model_a": "SD3",
52308
+ "model_b": "PixArtSigma",
52309
+ "winner": "model_a",
52310
+ "judge": "arena_user_10.16.18.162",
52311
+ "anony": true,
52312
+ "tstamp": 1723922819.7194
52313
+ },
52314
+ {
52315
+ "model_a": "SD3",
52316
+ "model_b": "StableCascade",
52317
+ "winner": "tie (bothbad)",
52318
+ "judge": "arena_user_10.16.18.75",
52319
+ "anony": true,
52320
+ "tstamp": 1723922828.2665
52321
+ },
52322
+ {
52323
+ "model_a": "PixArtAlpha",
52324
+ "model_b": "AuraFlow",
52325
+ "winner": "model_b",
52326
+ "judge": "arena_user_10.16.1.165",
52327
+ "anony": true,
52328
+ "tstamp": 1723963692.1376
52329
+ },
52330
+ {
52331
+ "model_a": "SDXLLightning",
52332
+ "model_b": "OpenJourney",
52333
+ "winner": "tie (bothbad)",
52334
+ "judge": "arena_user_10.16.18.162",
52335
+ "anony": true,
52336
+ "tstamp": 1723963701.4014
52337
+ },
52338
+ {
52339
+ "model_a": "SDXLLightning",
52340
+ "model_b": "FLUX1dev",
52341
+ "winner": "model_b",
52342
+ "judge": "arena_user_10.16.1.165",
52343
+ "anony": true,
52344
+ "tstamp": 1723963715.181
52345
+ },
52346
+ {
52347
+ "model_a": "SDXL",
52348
+ "model_b": "SD3",
52349
+ "winner": "model_b",
52350
+ "judge": "arena_user_10.16.18.162",
52351
+ "anony": true,
52352
+ "tstamp": 1723963739.8545
52353
+ },
52354
+ {
52355
+ "model_a": "AuraFlow",
52356
+ "model_b": "SDXL",
52357
+ "winner": "model_b",
52358
+ "judge": "arena_user_10.16.1.165",
52359
+ "anony": true,
52360
+ "tstamp": 1723963746.2871
52361
+ },
52362
+ {
52363
+ "model_a": "HunyuanDiT",
52364
+ "model_b": "SDXL",
52365
+ "winner": "model_a",
52366
+ "judge": "arena_user_10.16.1.165",
52367
+ "anony": true,
52368
+ "tstamp": 1723970594.9832
52369
+ },
52370
+ {
52371
+ "model_a": "StableCascade",
52372
+ "model_b": "PlayGround V2.5",
52373
+ "winner": "model_a",
52374
+ "judge": "arena_user_10.16.18.75",
52375
+ "anony": true,
52376
+ "tstamp": 1723970603.8367
52377
+ },
52378
+ {
52379
+ "model_a": "PixArtAlpha",
52380
+ "model_b": "SDXL",
52381
+ "winner": "model_a",
52382
+ "judge": "arena_user_10.16.18.75",
52383
+ "anony": true,
52384
+ "tstamp": 1723970610.2448
52385
+ },
52386
+ {
52387
+ "model_a": "PixArtSigma",
52388
+ "model_b": "AuraFlow",
52389
+ "winner": "model_a",
52390
+ "judge": "arena_user_10.16.18.75",
52391
+ "anony": true,
52392
+ "tstamp": 1723970619.6508
52393
+ },
52394
+ {
52395
+ "model_a": "SD3",
52396
+ "model_b": "SDXLLightning",
52397
+ "winner": "model_a",
52398
+ "judge": "arena_user_10.16.18.75",
52399
+ "anony": true,
52400
+ "tstamp": 1723970626.3099
52401
+ },
52402
+ {
52403
+ "model_a": "FLUX1schnell",
52404
+ "model_b": "OpenJourney",
52405
+ "winner": "model_a",
52406
+ "judge": "arena_user_10.16.18.75",
52407
+ "anony": true,
52408
+ "tstamp": 1723970632.9565
52409
  }
52410
  ]
arena_elo/results/latest/clean_battle_video_generation.json CHANGED
@@ -14862,5 +14862,21 @@
14862
  "judge": "arena_user_10.16.18.75",
14863
  "anony": true,
14864
  "tstamp": 1723909957.9225
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
14865
  }
14866
  ]
 
14862
  "judge": "arena_user_10.16.18.75",
14863
  "anony": true,
14864
  "tstamp": 1723909957.9225
14865
+ },
14866
+ {
14867
+ "model_a": "AnimateDiff",
14868
+ "model_b": "AnimateDiffTurbo",
14869
+ "winner": "tie (bothbad)",
14870
+ "judge": "arena_user_10.16.1.165",
14871
+ "anony": true,
14872
+ "tstamp": 1723963592.0484
14873
+ },
14874
+ {
14875
+ "model_a": "AnimateDiff",
14876
+ "model_b": "AnimateDiffTurbo",
14877
+ "winner": "tie",
14878
+ "judge": "arena_user_10.16.18.75",
14879
+ "anony": true,
14880
+ "tstamp": 1724006529.2433
14881
  }
14882
  ]
arena_elo/results/latest/elo_results_image_editing.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1da1e19486e987e18cf9bec79c36f1b71291a4f92490cf7d3af4edbc98628510
3
- size 62482
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b54d460d93f22ee6e2519ccc82e4ebd64ec81987505760c428b593ff91a13368
3
+ size 62455
arena_elo/results/latest/elo_results_t2i_generation.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:503ad9814b462e2bd1e60a3bdfb27549a374706e5f622cf5848a776509b2bc0e
3
- size 76789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa69fb8e450bd988c80b346d4f102c5be8bd74605030f0d5a295a71b66230ccd
3
+ size 76790
arena_elo/results/latest/elo_results_video_generation.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3bfa72b72fe286920122d9d36e161dcab2a2ee06ecf5ceb6ad822fd50063548
3
  size 59905
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c76c0dad67cabfdbda5beb2056bfaf9f669f7a5a3857716212f6f831516d5f9
3
  size 59905
arena_elo/results/latest/image_editing_leaderboard.csv CHANGED
@@ -2,7 +2,7 @@ key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,
2
  MagicBrush,MagicBrush,1112.4518849527376,1116.3228088792275,CC-BY-4.0,"The Ohio State University, University of Waterloo",https://osu-nlp-group.github.io/MagicBrush
3
  InfEdit,InfEdit,1077.2249767545911,1077.0861206067664,CC BY-NC-ND 4.0,"University of Michigan, University of California, Berkeley",https://huggingface.co/spaces/sled-umich/InfEdit
4
  CosXLEdit,CosXLEdit,1064.682441262532,1065.599445502775,cosxl-nc-community,Stability AI,https://huggingface.co/spaces/multimodalart/cosxl
5
- InstructPix2Pix,InstructPix2Pix,1035.4054226880567,1033.208668133612,"Copyright 2023 Timothy Brooks, Aleksander Holynski, Alexei A. Efros","University of California, Berkeley",https://www.timothybrooks.com/instruct-pix2pix
6
  PNP,PNP,1001.4916130267786,1006.0747389504991,-,Weizmann Institute of Science,https://github.com/MichalGeyer/plug-and-play
7
  Prompt2prompt,Prompt2prompt,990.9755779591587,992.0796321838297,Apache-2.0,"Google, Tel Aviv University",https://prompt-to-prompt.github.io
8
  CycleDiffusion,CycleDiffusion,938.5637450408492,931.6722574678079,X11,Carnegie Mellon University,https://github.com/ChenWu98/cycle-diffusion
 
2
  MagicBrush,MagicBrush,1112.4518849527376,1116.3228088792275,CC-BY-4.0,"The Ohio State University, University of Waterloo",https://osu-nlp-group.github.io/MagicBrush
3
  InfEdit,InfEdit,1077.2249767545911,1077.0861206067664,CC BY-NC-ND 4.0,"University of Michigan, University of California, Berkeley",https://huggingface.co/spaces/sled-umich/InfEdit
4
  CosXLEdit,CosXLEdit,1064.682441262532,1065.599445502775,cosxl-nc-community,Stability AI,https://huggingface.co/spaces/multimodalart/cosxl
5
+ InstructPix2Pix,InstructPix2Pix,1035.4054226880567,1033.2086681336118,"Copyright 2023 Timothy Brooks, Aleksander Holynski, Alexei A. Efros","University of California, Berkeley",https://www.timothybrooks.com/instruct-pix2pix
6
  PNP,PNP,1001.4916130267786,1006.0747389504991,-,Weizmann Institute of Science,https://github.com/MichalGeyer/plug-and-play
7
  Prompt2prompt,Prompt2prompt,990.9755779591587,992.0796321838297,Apache-2.0,"Google, Tel Aviv University",https://prompt-to-prompt.github.io
8
  CycleDiffusion,CycleDiffusion,938.5637450408492,931.6722574678079,X11,Carnegie Mellon University,https://github.com/ChenWu98/cycle-diffusion
arena_elo/results/latest/t2i_generation_leaderboard.csv CHANGED
@@ -1,15 +1,15 @@
1
  key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
2
- PlayGround V2.5,PlayGround V2.5,1141.866659999037,1141.8338384616795,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
3
- FluxTimestep,FluxTimestep,1115.928646165151,1121.9304446567799,N/A,N/A,N/A
4
- PlayGround V2,PlayGround V2,1083.663321447569,1080.8791567769488,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
5
- HunyuanDiT,HunyuanDiT,1059.7533365825295,1043.5339717960453,tencent-hunyuan-community,Tencent,https://huggingface.co/Tencent-Hunyuan/HunyuanDiT
6
- StableCascade,StableCascade,1046.7571473591233,1048.8389078449923,stable-cascade-nc-community (other),Stability AI,https://huggingface.co/stabilityai/stable-cascade
7
- SDXLLightning,SDXLLightning,1034.8611228210834,1037.6419954765402,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
8
- PixArtAlpha,PixArtAlpha,1033.0085889123181,1021.5860196967267,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
9
- PixArtSigma,PixArtSigma,1029.7824987127658,1027.9500586698966,openrail++,PixArt-alpha,https://fal.ai/models/fal-ai/pixart-sigma
10
- SD3,SD3,1001.3310047788816,994.5930116229433,stabilityai-nc-research-community,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-3-medium
11
- SDXL,SDXL,975.7678875209955,974.6391412818967,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
12
- SDXLTurbo,SDXLTurbo,922.2975316059412,918.3190757057619,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
13
- LCM(v1.5/XL),LCM(v1.5/XL),915.9954758760788,908.3365622923737,openrail++,Latent Consistency,https://fal.ai/models/fal-ai/fast-lcm-diffusion/api
14
- OpenJourney,OpenJourney,838.7888235391866,831.8551299360711,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
15
- LCM,LCM,800.197954679335,812.3288511265314,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
 
1
  key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
2
+ PlayGround V2.5,PlayGround V2.5,1141.5188909673816,1141.7574769353046,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
3
+ FLUX1schnell,FLUX1schnell,1107.0181424085022,1112.4579783184781,N/A,N/A,N/A
4
+ PlayGround V2,PlayGround V2,1083.848194525069,1081.1558760457797,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
5
+ HunyuanDiT,HunyuanDiT,1061.8376119998818,1045.8437711625322,tencent-hunyuan-community,Tencent,https://huggingface.co/Tencent-Hunyuan/HunyuanDiT
6
+ StableCascade,StableCascade,1048.1457195754278,1050.1691240248065,stable-cascade-nc-community (other),Stability AI,https://huggingface.co/stabilityai/stable-cascade
7
+ SDXLLightning,SDXLLightning,1034.30472320188,1037.2932871766393,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
8
+ PixArtAlpha,PixArtAlpha,1033.912116989071,1022.557442237083,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
9
+ PixArtSigma,PixArtSigma,1029.1408183981687,1027.4953277391191,openrail++,PixArt-alpha,https://fal.ai/models/fal-ai/pixart-sigma
10
+ SD3,SD3,1006.8458978216129,1000.2491511468914,stabilityai-nc-research-community,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-3-medium
11
+ SDXL,SDXL,975.3595050901268,974.4701361426086,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
12
+ SDXLTurbo,SDXLTurbo,922.5038319935961,918.6139210049913,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
13
+ LCM(v1.5/XL),LCM(v1.5/XL),916.2179215619182,908.6161501509581,openrail++,Latent Consistency,https://fal.ai/models/fal-ai/fast-lcm-diffusion/api
14
+ OpenJourney,OpenJourney,838.9432903688682,832.1138397704597,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
15
+ LCM,LCM,800.403335098498,812.6668778296877,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
arena_elo/results/latest/video_generation_leaderboard.csv CHANGED
@@ -1,9 +1,9 @@
1
  key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
2
- StableVideoDiffusion,StableVideoDiffusion,1133.2057266842914,1135.6740718576937,stable-video-diffusion-nc-community,Stability AI,https://fal.ai/models/fal-ai/fast-svd/text-to-video/api
3
- T2VTurbo,T2VTurbo,1097.0362394075614,1095.481109681995,cc-by-nc-4.0,"University of California, Santa Barbara",https://huggingface.co/jiachenli-ucsb/T2V-Turbo-VC2
4
- VideoCrafter2,VideoCrafter2,1074.3273548011723,1074.6323977593943,Apache 2.0,Tencent AI Lab,https://ailab-cvc.github.io/videocrafter2/
5
- AnimateDiff,AnimateDiff,1068.93900863825,1067.5731621857178,creativeml-openrail-m,"The Chinese University of Hong Kong, Shanghai AI Lab, Stanford University",https://fal.ai/models/fast-animatediff-t2v
6
- LaVie,LaVie,995.8323112101649,994.8789456408321,Apache 2.0,Shanghai AI Lab,https://github.com/Vchitect/LaVie
7
- OpenSora,OpenSora,913.264882541298,913.001492764224,Apache 2.0,HPC-AI Tech,https://github.com/hpcaitech/Open-Sora
8
- ModelScope,ModelScope,861.0476363835537,862.3030529191846,cc-by-nc-4.0,Alibaba Group,https://arxiv.org/abs/2308.06571
9
- AnimateDiffTurbo,AnimateDiffTurbo,856.3468403337079,856.4557671909597,creativeml-openrail-m,"The Chinese University of Hong Kong, Shanghai AI Lab, Stanford University",https://fal.ai/models/fast-animatediff-t2v-turbo
 
1
  key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
2
+ StableVideoDiffusion,StableVideoDiffusion,1133.1838006160342,1135.648326348363,stable-video-diffusion-nc-community,Stability AI,https://fal.ai/models/fal-ai/fast-svd/text-to-video/api
3
+ T2VTurbo,T2VTurbo,1097.0055576746822,1095.4539969650828,cc-by-nc-4.0,"University of California, Santa Barbara",https://huggingface.co/jiachenli-ucsb/T2V-Turbo-VC2
4
+ VideoCrafter2,VideoCrafter2,1074.299413538351,1074.604913704468,Apache 2.0,Tencent AI Lab,https://ailab-cvc.github.io/videocrafter2/
5
+ AnimateDiff,AnimateDiff,1068.2089967499214,1066.8805974519646,creativeml-openrail-m,"The Chinese University of Hong Kong, Shanghai AI Lab, Stanford University",https://fal.ai/models/fast-animatediff-t2v
6
+ LaVie,LaVie,995.82479731396,994.8703618669116,Apache 2.0,Shanghai AI Lab,https://github.com/Vchitect/LaVie
7
+ OpenSora,OpenSora,913.3181800582577,913.0542295067128,Apache 2.0,HPC-AI Tech,https://github.com/hpcaitech/Open-Sora
8
+ ModelScope,ModelScope,861.1074201988872,862.3583669429345,cc-by-nc-4.0,Alibaba Group,https://arxiv.org/abs/2308.06571
9
+ AnimateDiffTurbo,AnimateDiffTurbo,857.0518338499064,857.1292072135634,creativeml-openrail-m,"The Chinese University of Hong Kong, Shanghai AI Lab, Stanford University",https://fal.ai/models/fast-animatediff-t2v-turbo
arena_elo/update_elo_rating.sh CHANGED
@@ -3,6 +3,7 @@ if [ -z "$LOGDIR" ]; then
3
  echo "LOGDIR is not set. Using default '../GenAI-Arena-hf-logs/vote_log'"
4
  export LOGDIR="../GenAI-Arena-hf-logs/vote_log"
5
  fi
 
6
 
7
  mkdir -p results
8
 
@@ -29,13 +30,19 @@ mv clean_battle_t2i_generation_$generation_battle_cutoff_date.json ./results/$ge
29
  mv clean_battle_video_generation_$video_generation_battle_cutoff_date.json ./results/$video_generation_battle_cutoff_date/clean_battle_video_generation.json
30
 
31
 
 
32
  python3 -m elo_rating.elo_analysis --clean-battle-file ./results/$edition_battle_cutoff_date/clean_battle_image_editing.json
 
33
  mv ./elo_results_$edition_battle_cutoff_date.pkl ./results/$edition_battle_cutoff_date/elo_results_image_editing.pkl
34
 
 
35
  python3 -m elo_rating.elo_analysis --clean-battle-file ./results/$generation_battle_cutoff_date/clean_battle_t2i_generation.json
 
36
  mv ./elo_results_$generation_battle_cutoff_date.pkl ./results/$generation_battle_cutoff_date/elo_results_t2i_generation.pkl
37
 
 
38
  python3 -m elo_rating.elo_analysis --clean-battle-file ./results/$video_generation_battle_cutoff_date/clean_battle_video_generation.json
 
39
  mv ./elo_results_$video_generation_battle_cutoff_date.pkl ./results/$video_generation_battle_cutoff_date/elo_results_video_generation.pkl
40
 
41
  # generat the leaderboard
 
3
  echo "LOGDIR is not set. Using default '../GenAI-Arena-hf-logs/vote_log'"
4
  export LOGDIR="../GenAI-Arena-hf-logs/vote_log"
5
  fi
6
+ set -e
7
 
8
  mkdir -p results
9
 
 
30
  mv clean_battle_video_generation_$video_generation_battle_cutoff_date.json ./results/$video_generation_battle_cutoff_date/clean_battle_video_generation.json
31
 
32
 
33
+ echo "Calculating Elo rating for image editing task"
34
  python3 -m elo_rating.elo_analysis --clean-battle-file ./results/$edition_battle_cutoff_date/clean_battle_image_editing.json
35
+ edition_battle_cutoff_date=`cat cut_off_date.txt` && rm cut_off_date.txt && echo "Image editing battle data (after filtering models with < 50 battles) last updated on $edition_battle_cutoff_date"
36
  mv ./elo_results_$edition_battle_cutoff_date.pkl ./results/$edition_battle_cutoff_date/elo_results_image_editing.pkl
37
 
38
+ echo "Calculating Elo rating for t2i generation task"
39
  python3 -m elo_rating.elo_analysis --clean-battle-file ./results/$generation_battle_cutoff_date/clean_battle_t2i_generation.json
40
+ generation_battle_cutoff_date=`cat cut_off_date.txt` && rm cut_off_date.txt && echo "T2I image generation battle data (after filtering models with < 50 battles) last updated on $generation_battle_cutoff_date"
41
  mv ./elo_results_$generation_battle_cutoff_date.pkl ./results/$generation_battle_cutoff_date/elo_results_t2i_generation.pkl
42
 
43
+ echo "Calculating Elo rating for video generation task"
44
  python3 -m elo_rating.elo_analysis --clean-battle-file ./results/$video_generation_battle_cutoff_date/clean_battle_video_generation.json
45
+ video_generation_battle_cutoff_date=`cat cut_off_date.txt` && rm cut_off_date.txt && echo "Video generation battle data (after filtering models with < 50 battles) last updated on $video_generation_battle_cutoff_date"
46
  mv ./elo_results_$video_generation_battle_cutoff_date.pkl ./results/$video_generation_battle_cutoff_date/elo_results_video_generation.pkl
47
 
48
  # generat the leaderboard
model/model_manager.py CHANGED
@@ -34,9 +34,10 @@ class ModelManager:
34
  model_id = "meta-llama/Llama-Guard-3-8B"
35
  device = "cuda" if torch.cuda.is_available() else "cpu"
36
  dtype = torch.bfloat16
 
37
  if enable_nsfw:
38
- self.guard_tokenizer = AutoTokenizer.from_pretrained(model_id, token=os.environ['HF_GUARD'])
39
- self.guard = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=dtype, device_map=device, token=os.environ['HF_GUARD'])
40
  else:
41
  self.guard_tokenizer = None
42
  self.guard = None
 
34
  model_id = "meta-llama/Llama-Guard-3-8B"
35
  device = "cuda" if torch.cuda.is_available() else "cpu"
36
  dtype = torch.bfloat16
37
+ token = os.getenv("HF_TOKEN") or os.getenv("HF_GUARD")
38
  if enable_nsfw:
39
+ self.guard_tokenizer = AutoTokenizer.from_pretrained(model_id)
40
+ self.guard = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=dtype, device_map=device)
41
  else:
42
  self.guard_tokenizer = None
43
  self.guard = None