DongfuJiang commited on
Commit
8d8dec7
·
1 Parent(s): 5cad49d

Auto Daily Leaderboard udpate Wed Mar 5 12:00:31 PM EST 2025

Browse files
arena_elo/results/20250304/clean_battle_image_editing.json ADDED
The diff for this file is too large to render. See raw diff
 
arena_elo/results/20250304/clean_battle_t2i_generation.json CHANGED
@@ -119526,5 +119526,89 @@
119526
  "judge": "arena_user_10.16.26.206",
119527
  "anony": true,
119528
  "tstamp": 1741095831.392
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
119529
  }
119530
  ]
 
119526
  "judge": "arena_user_10.16.26.206",
119527
  "anony": true,
119528
  "tstamp": 1741095831.392
119529
+ },
119530
+ {
119531
+ "model_a_conv_id": "0185393f1c2d4230a6c77b47915b032a",
119532
+ "model_b_conv_id": "474a192e20a945f488526fdc41a51c78",
119533
+ "inputs": {
119534
+ "prompt": "Lonely evil bananas on a table, hard light chiaroscuro, realistic"
119535
+ },
119536
+ "model_a": "SD3",
119537
+ "model_b": "FLUX.1-schnell",
119538
+ "vote_type": "leftvote",
119539
+ "winner": "model_a",
119540
+ "judge": "arena_user_10.20.34.20",
119541
+ "anony": true,
119542
+ "tstamp": 1741121271.8992
119543
+ },
119544
+ {
119545
+ "model_a_conv_id": "c8c18c427d94419997d8763049f93083",
119546
+ "model_b_conv_id": "232e907652ba43a6bdc50c0c00e25c21",
119547
+ "inputs": {
119548
+ "prompt": "A silver , orange , and grey train 's closed doors ."
119549
+ },
119550
+ "model_a": "OpenJourney",
119551
+ "model_b": "HunyuanDiT",
119552
+ "vote_type": "leftvote",
119553
+ "winner": "model_a",
119554
+ "judge": "arena_user_10.20.6.93",
119555
+ "anony": true,
119556
+ "tstamp": 1741125864.5212
119557
+ },
119558
+ {
119559
+ "model_a_conv_id": "0a06ae6cc7ee43fd91e76b6edbc4ed99",
119560
+ "model_b_conv_id": "8bde484544ca402ba1a43ebb8b47ee94",
119561
+ "inputs": {
119562
+ "prompt": "An oil painting of a couple in formal evening wear going home get caught in a heavy downpour with no umbrellas."
119563
+ },
119564
+ "model_a": "OpenJourney",
119565
+ "model_b": "FLUX.1-schnell",
119566
+ "vote_type": "leftvote",
119567
+ "winner": "model_a",
119568
+ "judge": "arena_user_10.20.6.93",
119569
+ "anony": true,
119570
+ "tstamp": 1741125912.2516
119571
+ },
119572
+ {
119573
+ "model_a_conv_id": "5de18ded57f84df49f68d1dbd40c79ee",
119574
+ "model_b_conv_id": "00efe410f6d04d60ad54584b67937675",
119575
+ "inputs": {
119576
+ "prompt": "photorealistic, detailed picture of a single flower crown"
119577
+ },
119578
+ "model_a": "StableCascade",
119579
+ "model_b": "SD3",
119580
+ "vote_type": "leftvote",
119581
+ "winner": "model_a",
119582
+ "judge": "arena_user_10.20.6.93",
119583
+ "anony": true,
119584
+ "tstamp": 1741125923.6082
119585
+ },
119586
+ {
119587
+ "model_a_conv_id": "2e9ecc159b70456a8ce5b945f8bcff45",
119588
+ "model_b_conv_id": "8fea2bec8b644afaa9d702a65d15fbf9",
119589
+ "inputs": {
119590
+ "prompt": "A sign that says 'Diffusion'."
119591
+ },
119592
+ "model_a": "Kolors",
119593
+ "model_b": "FLUX.1-schnell",
119594
+ "vote_type": "rightvote",
119595
+ "winner": "model_b",
119596
+ "judge": "arena_user_10.16.39.39",
119597
+ "anony": true,
119598
+ "tstamp": 1741150405.5497
119599
+ },
119600
+ {
119601
+ "model_a_conv_id": "52cb0b6a7c8442fe9cd1fb9a25d7a1ea",
119602
+ "model_b_conv_id": "d21cc3e622e24c179a9355fc0efefec6",
119603
+ "inputs": {
119604
+ "prompt": "A futuristic hopeful busy city, purple and green color scheme"
119605
+ },
119606
+ "model_a": "FLUX.1-dev",
119607
+ "model_b": "PlayGround V2.5",
119608
+ "vote_type": "rightvote",
119609
+ "winner": "model_b",
119610
+ "judge": "arena_user_10.16.10.234",
119611
+ "anony": true,
119612
+ "tstamp": 1741159133.6543
119613
  }
119614
  ]
arena_elo/results/20250304/clean_battle_video_generation.json ADDED
The diff for this file is too large to render. See raw diff
 
arena_elo/results/20250304/elo_results_image_editing.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4870af4799cfffb6028d9400393f506195a33506e3e7a623ba3b47eb1a74e80d
3
+ size 66042
arena_elo/results/20250304/elo_results_t2i_generation.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:136315573bd9db9ec2d8323323fe110a66ecc8ccb196cc589b1981cfd3abd922
3
  size 88249
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a10ce90aa6854aa0f5e36960924d7b6f279ba0a0bdd8b277e30aafa53e3c5c6
3
  size 88249
arena_elo/results/20250304/elo_results_video_generation.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16bad273fddfb469d5c43633cd7a0004bac850745af70690399441fce4101a53
3
+ size 81357
arena_elo/results/20250304/image_editing_leaderboard.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
2
+ MagicBrush,MagicBrush,1097.6043637492648,1101.586566284983,CC-BY-4.0,"The Ohio State University, University of Waterloo",https://osu-nlp-group.github.io/MagicBrush/
3
+ UltraEdit,UltraEdit,1067.6689393370273,1067.5307252360478,other,Peking University; BIGAI,https://ultra-editing.github.io/
4
+ InfEdit,InfEdit,1064.0397321107114,1063.825933465487,CC BY-NC-ND 4.0,"University of Michigan, University of California, Berkeley",https://sled-group.github.io/InfEdit/
5
+ CosXLEdit,CosXLEdit,1055.6654687506614,1056.6602196716653,cosxl-nc-community,Stability AI,https://huggingface.co/stabilityai/cosxl
6
+ InstructPix2Pix,InstructPix2Pix,1029.4247873690776,1027.3282587563656,"Copyright 2023 Timothy Brooks, Aleksander Holynski, Alexei A. Efros","University of California, Berkeley",https://www.timothybrooks.com/instruct-pix2pix
7
+ PNP,PNP,992.6639287658154,997.0795878330872,-,Weizmann Institute of Science,https://github.com/MichalGeyer/plug-and-play
8
+ Prompt2prompt,Prompt2prompt,983.865737169967,984.9659516741241,Apache-2.0,"Google, Tel Aviv University",https://prompt-to-prompt.github.io/
9
+ CycleDiffusion,CycleDiffusion,935.3470162601191,929.2166701957979,X11,Carnegie Mellon University,https://github.com/ChenWu98/cycle-diffusion?tab=readme-ov-file
10
+ SDEdit,SDEdit,918.7855764202982,917.2961474609109,MIT License,Stanford University,https://sde-image-editing.github.io
11
+ Pix2PixZero,Pix2PixZero,854.9344500670585,854.5099394215308,MIT License,"Carnegie Mellon University, Adobe Research",https://pix2pixzero.github.io/
arena_elo/results/20250304/t2i_generation_leaderboard.csv CHANGED
@@ -1,18 +1,18 @@
1
  key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
2
- FLUX.1-dev,FLUX.1-dev,1142.0581529119786,1143.4965181495513,flux-1-dev-non-commercial-license (other),Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
3
- PlayGround V2.5,PlayGround V2.5,1114.4733917878725,1115.44974183415,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
4
- FLUX.1-schnell,FLUX.1-schnell,1095.1919208539869,1099.8402949195838,Apache-2.0,Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
5
- PlayGround V2,PlayGround V2,1071.1953260421708,1070.9781943889616,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
6
- Kolors,Kolors,1059.9768091690526,1058.9278023578413,Apache-2.0,Kwai Kolors,https://huggingface.co/Kwai-Kolors/Kolors
7
- StableCascade,StableCascade,1042.2740292337398,1044.698012486259,stable-cascade-nc-community (other),Stability AI,https://fal.ai/models/stable-cascade/api
8
- HunyuanDiT,HunyuanDiT,1019.1725460542228,1014.14790770645,tencent-hunyuan-community,Tencent,https://github.com/Tencent/HunyuanDiT
9
- PixArtAlpha,PixArtAlpha,1018.7688590382843,1011.3673764231929,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
10
- PixArtSigma,PixArtSigma,1017.5024468944063,1017.9587278893003,openrail++,PixArt-alpha,https://github.com/PixArt-alpha/PixArt-sigma
11
- SDXL-Lightning,SDXL-Lightning,1015.5898224267512,1020.0063006856607,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
12
- SD3,SD3,1006.1000828160398,1007.6715687753389,stabilityai-nc-research-community,Stability AI,https://huggingface.co/blog/sd3
13
- AuraFlow,AuraFlow,994.6438416026293,992.5777776758314,Apache-2.0,Fal.AI,https://huggingface.co/fal/AuraFlow
14
- SDXL,SDXL,964.4887318172774,965.830368614938,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
15
- SDXLTurbo,SDXLTurbo,913.5993709023219,912.0290237708969,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
16
- LCM(v1.5/XL),LCM(v1.5/XL),904.1511961853133,898.4691494073832,openrail++,Latent Consistency,https://fal.ai/models/fast-lcm-diffusion-turbo
17
- OpenJourney,OpenJourney,831.3542903772337,826.9276283450821,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
18
- LCM,LCM,789.4591818867234,804.3230828495077,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
 
1
  key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
2
+ FLUX.1-dev,FLUX.1-dev,1140.54064444776,1142.478433248384,flux-1-dev-non-commercial-license (other),Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
3
+ PlayGround V2.5,PlayGround V2.5,1115.0413282850327,1115.8660729402743,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
4
+ FLUX.1-schnell,FLUX.1-schnell,1092.9274950720344,1097.9940464682022,Apache-2.0,Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
5
+ PlayGround V2,PlayGround V2,1071.7726265799272,1071.5040505618556,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
6
+ Kolors,Kolors,1058.6589291047005,1057.6750924733155,Apache-2.0,Kwai Kolors,https://huggingface.co/Kwai-Kolors/Kolors
7
+ StableCascade,StableCascade,1042.913333399551,1045.2807916556396,stable-cascade-nc-community (other),Stability AI,https://fal.ai/models/stable-cascade/api
8
+ PixArtAlpha,PixArtAlpha,1019.1762583059761,1011.770053541195,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
9
+ HunyuanDiT,HunyuanDiT,1018.0203471450936,1013.0401202408287,tencent-hunyuan-community,Tencent,https://github.com/Tencent/HunyuanDiT
10
+ PixArtSigma,PixArtSigma,1017.8332359128535,1018.2583849827981,openrail++,PixArt-alpha,https://github.com/PixArt-alpha/PixArt-sigma
11
+ SDXL-Lightning,SDXL-Lightning,1015.929417091197,1020.2883464821336,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
12
+ SD3,SD3,1006.3839266840495,1007.9240613567083,stabilityai-nc-research-community,Stability AI,https://huggingface.co/blog/sd3
13
+ AuraFlow,AuraFlow,994.3106981605351,992.242324025994,Apache-2.0,Fal.AI,https://huggingface.co/fal/AuraFlow
14
+ SDXL,SDXL,964.9414706928835,966.2631624320217,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
15
+ SDXLTurbo,SDXLTurbo,914.0691290472807,912.4816793045377,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
16
+ LCM(v1.5/XL),LCM(v1.5/XL),904.7423661198958,898.9893685687374,openrail++,Latent Consistency,https://fal.ai/models/fast-lcm-diffusion-turbo
17
+ OpenJourney,OpenJourney,832.6104126653283,828.0593272803596,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
18
+ LCM,LCM,790.1283812858934,804.9328295962027,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
arena_elo/results/20250304/video_generation_leaderboard.csv ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
2
+ CogVideoX-5B,CogVideoX-5B,1135.3687032647802,1137.4502071323247,CogVideoX LICENSE,THUDM,https://github.com/THUDM/CogVideo
3
+ Mochi1,Mochi1,1125.7384643081691,1125.3719082547418,Apache 2.0,Genmo AI,https://github.com/genmoai/mochi
4
+ StableVideoDiffusion,StableVideoDiffusion,1117.729420623102,1117.7784800711422,SVD-nc-community,Stability AI,https://fal.ai/models/fal-ai/fast-svd/text-to-video/api
5
+ Pyramid Flow,Pyramid Flow,1109.6318946208864,1111.5514173990646,MIT LICENSE,Peking University,https://pyramid-flow.github.io/
6
+ T2V-Turbo,T2V-Turbo,1053.7466599517436,1054.1656932519484,cc-by-nc-4.0,"University of California, Santa Barbara",https://github.com/Ji4chenLi/t2v-turbo
7
+ CogVideoX-2B,CogVideoX-2B,1049.0498525063604,1047.4175015816522,CogVideoX LICENSE,THUDM,https://github.com/THUDM/CogVideo
8
+ AnimateDiff,AnimateDiff,1039.3527292117005,1038.8077990227764,creativeml-openrail-m,"The Chinese University of Hong Kong, Shanghai AI Lab, Stanford University",https://fal.ai/models/fast-animatediff-t2v
9
+ VideoCrafter2,VideoCrafter2,1030.3385942855953,1029.772281835828,Apache 2.0,Tencent AI Lab,https://ailab-cvc.github.io/videocrafter2/
10
+ Allegro,Allegro,1000.4880460748201,1002.9456853576637,Apache 2.0,rhymes-ai,https://github.com/rhymes-ai/Allegro
11
+ LaVie,LaVie,964.3781718312032,963.8704115935535,Apache 2.0,Shanghai AI Lab,https://github.com/Vchitect/LaVie
12
+ LTXVideo,LTXVideo,955.7125101266762,956.8216700870381,Apache 2.0,Lightricks,https://github.com/Lightricks/LTX-Video
13
+ OpenSora,OpenSora,880.7730380536314,879.9846635860854,Apache 2.0,HPC-AI Tech,https://github.com/hpcaitech/Open-Sora
14
+ OpenSora v1.2,OpenSora v1.2,872.9373563958695,870.3676769922687,Apache 2.0,HPC-AI Tech,https://github.com/hpcaitech/Open-Sora
15
+ AnimateDiff Turbo,AnimateDiff Turbo,834.1089618094404,832.3433342390309,creativeml-openrail-m,"The Chinese University of Hong Kong, Shanghai AI Lab, Stanford University",https://fal.ai/models/fast-animatediff-t2v-turbo
16
+ ModelScope,ModelScope,830.6455969360253,831.3512695948783,cc-by-nc-4.0,Alibaba Group,https://arxiv.org/abs/2308.06571
arena_elo/results/latest/clean_battle_image_editing.json CHANGED
@@ -20296,5 +20296,37 @@
20296
  "judge": "arena_user_10.16.29.175",
20297
  "anony": true,
20298
  "tstamp": 1740990144.7425
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
20299
  }
20300
  ]
 
20296
  "judge": "arena_user_10.16.29.175",
20297
  "anony": true,
20298
  "tstamp": 1740990144.7425
20299
+ },
20300
+ {
20301
+ "model_a_conv_id": "6cccd366988149ecaa236f96c411511d",
20302
+ "model_b_conv_id": "2b8e05390dda4995b1737c66e17547bf",
20303
+ "inputs": {
20304
+ "source_prompt": "A bull is on a farm walking around a pen.",
20305
+ "target_prompt": "A stylish cow wearing a hat walks around a pen on a farm.",
20306
+ "instruct_prompt": "Have the cow wear a hat."
20307
+ },
20308
+ "model_a": "AURORA",
20309
+ "model_b": "MagicBrush",
20310
+ "vote_type": "bothbad_vote",
20311
+ "winner": "tie (bothbad)",
20312
+ "judge": "arena_user_10.20.6.93",
20313
+ "anony": true,
20314
+ "tstamp": 1741126011.2284
20315
+ },
20316
+ {
20317
+ "model_a_conv_id": "60879e27cc534b818220b3a19be1644f",
20318
+ "model_b_conv_id": "95b9fad459b54580a3d67c8813cc6e53",
20319
+ "inputs": {
20320
+ "source_prompt": "a tennis player with a racket on a court",
20321
+ "target_prompt": "A tennis player with a baseball cap and racket on a court",
20322
+ "instruct_prompt": "give her a baseball cap"
20323
+ },
20324
+ "model_a": "CycleDiffusion",
20325
+ "model_b": "MagicBrush",
20326
+ "vote_type": "bothbad_vote",
20327
+ "winner": "tie (bothbad)",
20328
+ "judge": "arena_user_10.20.6.93",
20329
+ "anony": true,
20330
+ "tstamp": 1741126037.3003
20331
  }
20332
  ]
arena_elo/results/latest/clean_battle_t2i_generation.json CHANGED
@@ -119526,5 +119526,89 @@
119526
  "judge": "arena_user_10.16.26.206",
119527
  "anony": true,
119528
  "tstamp": 1741095831.392
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
119529
  }
119530
  ]
 
119526
  "judge": "arena_user_10.16.26.206",
119527
  "anony": true,
119528
  "tstamp": 1741095831.392
119529
+ },
119530
+ {
119531
+ "model_a_conv_id": "0185393f1c2d4230a6c77b47915b032a",
119532
+ "model_b_conv_id": "474a192e20a945f488526fdc41a51c78",
119533
+ "inputs": {
119534
+ "prompt": "Lonely evil bananas on a table, hard light chiaroscuro, realistic"
119535
+ },
119536
+ "model_a": "SD3",
119537
+ "model_b": "FLUX.1-schnell",
119538
+ "vote_type": "leftvote",
119539
+ "winner": "model_a",
119540
+ "judge": "arena_user_10.20.34.20",
119541
+ "anony": true,
119542
+ "tstamp": 1741121271.8992
119543
+ },
119544
+ {
119545
+ "model_a_conv_id": "c8c18c427d94419997d8763049f93083",
119546
+ "model_b_conv_id": "232e907652ba43a6bdc50c0c00e25c21",
119547
+ "inputs": {
119548
+ "prompt": "A silver , orange , and grey train 's closed doors ."
119549
+ },
119550
+ "model_a": "OpenJourney",
119551
+ "model_b": "HunyuanDiT",
119552
+ "vote_type": "leftvote",
119553
+ "winner": "model_a",
119554
+ "judge": "arena_user_10.20.6.93",
119555
+ "anony": true,
119556
+ "tstamp": 1741125864.5212
119557
+ },
119558
+ {
119559
+ "model_a_conv_id": "0a06ae6cc7ee43fd91e76b6edbc4ed99",
119560
+ "model_b_conv_id": "8bde484544ca402ba1a43ebb8b47ee94",
119561
+ "inputs": {
119562
+ "prompt": "An oil painting of a couple in formal evening wear going home get caught in a heavy downpour with no umbrellas."
119563
+ },
119564
+ "model_a": "OpenJourney",
119565
+ "model_b": "FLUX.1-schnell",
119566
+ "vote_type": "leftvote",
119567
+ "winner": "model_a",
119568
+ "judge": "arena_user_10.20.6.93",
119569
+ "anony": true,
119570
+ "tstamp": 1741125912.2516
119571
+ },
119572
+ {
119573
+ "model_a_conv_id": "5de18ded57f84df49f68d1dbd40c79ee",
119574
+ "model_b_conv_id": "00efe410f6d04d60ad54584b67937675",
119575
+ "inputs": {
119576
+ "prompt": "photorealistic, detailed picture of a single flower crown"
119577
+ },
119578
+ "model_a": "StableCascade",
119579
+ "model_b": "SD3",
119580
+ "vote_type": "leftvote",
119581
+ "winner": "model_a",
119582
+ "judge": "arena_user_10.20.6.93",
119583
+ "anony": true,
119584
+ "tstamp": 1741125923.6082
119585
+ },
119586
+ {
119587
+ "model_a_conv_id": "2e9ecc159b70456a8ce5b945f8bcff45",
119588
+ "model_b_conv_id": "8fea2bec8b644afaa9d702a65d15fbf9",
119589
+ "inputs": {
119590
+ "prompt": "A sign that says 'Diffusion'."
119591
+ },
119592
+ "model_a": "Kolors",
119593
+ "model_b": "FLUX.1-schnell",
119594
+ "vote_type": "rightvote",
119595
+ "winner": "model_b",
119596
+ "judge": "arena_user_10.16.39.39",
119597
+ "anony": true,
119598
+ "tstamp": 1741150405.5497
119599
+ },
119600
+ {
119601
+ "model_a_conv_id": "52cb0b6a7c8442fe9cd1fb9a25d7a1ea",
119602
+ "model_b_conv_id": "d21cc3e622e24c179a9355fc0efefec6",
119603
+ "inputs": {
119604
+ "prompt": "A futuristic hopeful busy city, purple and green color scheme"
119605
+ },
119606
+ "model_a": "FLUX.1-dev",
119607
+ "model_b": "PlayGround V2.5",
119608
+ "vote_type": "rightvote",
119609
+ "winner": "model_b",
119610
+ "judge": "arena_user_10.16.10.234",
119611
+ "anony": true,
119612
+ "tstamp": 1741159133.6543
119613
  }
119614
  ]
arena_elo/results/latest/clean_battle_video_generation.json CHANGED
@@ -40598,5 +40598,75 @@
40598
  "judge": "arena_user_10.16.39.39",
40599
  "anony": true,
40600
  "tstamp": 1741054957.9658
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
40601
  }
40602
  ]
 
40598
  "judge": "arena_user_10.16.39.39",
40599
  "anony": true,
40600
  "tstamp": 1741054957.9658
40601
+ },
40602
+ {
40603
+ "model_a_conv_id": "98b94002e0564021b785c55a1d905b66",
40604
+ "model_b_conv_id": "75bceb6ea6c5419da0755e47646daeca",
40605
+ "inputs": {
40606
+ "prompt": "train station platform"
40607
+ },
40608
+ "model_a": "StableVideoDiffusion",
40609
+ "model_b": "Allegro",
40610
+ "vote_type": "rightvote",
40611
+ "winner": "model_b",
40612
+ "judge": "arena_user_10.16.28.13",
40613
+ "anony": true,
40614
+ "tstamp": 1741116370.5924
40615
+ },
40616
+ {
40617
+ "model_a_conv_id": "152e8ec10b4d478c9eec87b7f7289203",
40618
+ "model_b_conv_id": "daa951289f4f4da2ab9e5e5eb7b215d3",
40619
+ "inputs": {
40620
+ "prompt": "A person is getting a haircut"
40621
+ },
40622
+ "model_a": "CogVideoX-5B",
40623
+ "model_b": "StableVideoDiffusion",
40624
+ "vote_type": "leftvote",
40625
+ "winner": "model_a",
40626
+ "judge": "arena_user_10.20.6.93",
40627
+ "anony": true,
40628
+ "tstamp": 1741126084.0572
40629
+ },
40630
+ {
40631
+ "model_a_conv_id": "a3c2136e05f8489b98cdfdbaf5fed4d6",
40632
+ "model_b_conv_id": "ea3b901ce24242dfb81b2593ea18e013",
40633
+ "inputs": {
40634
+ "prompt": "a yellow bicycle"
40635
+ },
40636
+ "model_a": "VideoCrafter2",
40637
+ "model_b": "StableVideoDiffusion",
40638
+ "vote_type": "rightvote",
40639
+ "winner": "model_b",
40640
+ "judge": "arena_user_10.20.6.93",
40641
+ "anony": true,
40642
+ "tstamp": 1741126105.3267
40643
+ },
40644
+ {
40645
+ "model_a_conv_id": "5f81e2c76e8d4892b141f424fa7c858f",
40646
+ "model_b_conv_id": "9aff9086c0914f4ca58d0908131a6973",
40647
+ "inputs": {
40648
+ "prompt": "a person and a hair drier"
40649
+ },
40650
+ "model_a": "StableVideoDiffusion",
40651
+ "model_b": "CogVideoX-2B",
40652
+ "vote_type": "bothbad_vote",
40653
+ "winner": "tie (bothbad)",
40654
+ "judge": "arena_user_10.20.6.93",
40655
+ "anony": true,
40656
+ "tstamp": 1741126132.6116
40657
+ },
40658
+ {
40659
+ "model_a_conv_id": "855906fd7541484e81f1e2ae1816d63b",
40660
+ "model_b_conv_id": "73f27968c02e414b99aa06e828a87705",
40661
+ "inputs": {
40662
+ "prompt": "Gwen Stacy reading a book, Van Gogh style"
40663
+ },
40664
+ "model_a": "AnimateDiff Turbo",
40665
+ "model_b": "AnimateDiff",
40666
+ "vote_type": "rightvote",
40667
+ "winner": "model_b",
40668
+ "judge": "arena_user_10.20.6.93",
40669
+ "anony": true,
40670
+ "tstamp": 1741126151.2247
40671
  }
40672
  ]
arena_elo/results/latest/elo_results_image_editing.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f32da2091c8f5cd03778d90e04d8ba7ff32e8de5d4f2019e7c6364f734423101
3
  size 66042
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4870af4799cfffb6028d9400393f506195a33506e3e7a623ba3b47eb1a74e80d
3
  size 66042
arena_elo/results/latest/elo_results_t2i_generation.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:136315573bd9db9ec2d8323323fe110a66ecc8ccb196cc589b1981cfd3abd922
3
  size 88249
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a10ce90aa6854aa0f5e36960924d7b6f279ba0a0bdd8b277e30aafa53e3c5c6
3
  size 88249
arena_elo/results/latest/elo_results_video_generation.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7907b707a3ea241eb9164388e17ad7e235d058b3796084b2333702d2ba660b54
3
- size 81355
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16bad273fddfb469d5c43633cd7a0004bac850745af70690399441fce4101a53
3
+ size 81357
arena_elo/results/latest/image_editing_leaderboard.csv CHANGED
@@ -1,11 +1,11 @@
1
  key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
2
- MagicBrush,MagicBrush,1098.11909638452,1102.0924438876038,CC-BY-4.0,"The Ohio State University, University of Waterloo",https://osu-nlp-group.github.io/MagicBrush/
3
- UltraEdit,UltraEdit,1067.6922568512323,1067.5514176443478,other,Peking University; BIGAI,https://ultra-editing.github.io/
4
- InfEdit,InfEdit,1064.0583455960025,1063.8632624383984,CC BY-NC-ND 4.0,"University of Michigan, University of California, Berkeley",https://sled-group.github.io/InfEdit/
5
- CosXLEdit,CosXLEdit,1055.6699311266136,1056.6547463387872,cosxl-nc-community,Stability AI,https://huggingface.co/stabilityai/cosxl
6
- InstructPix2Pix,InstructPix2Pix,1029.426353576916,1027.3387401625496,"Copyright 2023 Timothy Brooks, Aleksander Holynski, Alexei A. Efros","University of California, Berkeley",https://www.timothybrooks.com/instruct-pix2pix
7
- PNP,PNP,992.668005312241,997.0839601892403,-,Weizmann Institute of Science,https://github.com/MichalGeyer/plug-and-play
8
- Prompt2prompt,Prompt2prompt,983.8617890677732,984.9626360844215,Apache-2.0,"Google, Tel Aviv University",https://prompt-to-prompt.github.io/
9
- CycleDiffusion,CycleDiffusion,934.7740837892117,928.6484309741794,X11,Carnegie Mellon University,https://github.com/ChenWu98/cycle-diffusion?tab=readme-ov-file
10
- SDEdit,SDEdit,918.7969153614958,917.3007920540573,MIT License,Stanford University,https://sde-image-editing.github.io
11
- Pix2PixZero,Pix2PixZero,854.933222933994,854.5035702264144,MIT License,"Carnegie Mellon University, Adobe Research",https://pix2pixzero.github.io/
 
1
  key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
2
+ MagicBrush,MagicBrush,1097.6043637492648,1101.586566284983,CC-BY-4.0,"The Ohio State University, University of Waterloo",https://osu-nlp-group.github.io/MagicBrush/
3
+ UltraEdit,UltraEdit,1067.6689393370273,1067.5307252360478,other,Peking University; BIGAI,https://ultra-editing.github.io/
4
+ InfEdit,InfEdit,1064.0397321107114,1063.825933465487,CC BY-NC-ND 4.0,"University of Michigan, University of California, Berkeley",https://sled-group.github.io/InfEdit/
5
+ CosXLEdit,CosXLEdit,1055.6654687506614,1056.6602196716653,cosxl-nc-community,Stability AI,https://huggingface.co/stabilityai/cosxl
6
+ InstructPix2Pix,InstructPix2Pix,1029.4247873690776,1027.3282587563656,"Copyright 2023 Timothy Brooks, Aleksander Holynski, Alexei A. Efros","University of California, Berkeley",https://www.timothybrooks.com/instruct-pix2pix
7
+ PNP,PNP,992.6639287658154,997.0795878330872,-,Weizmann Institute of Science,https://github.com/MichalGeyer/plug-and-play
8
+ Prompt2prompt,Prompt2prompt,983.865737169967,984.9659516741241,Apache-2.0,"Google, Tel Aviv University",https://prompt-to-prompt.github.io/
9
+ CycleDiffusion,CycleDiffusion,935.3470162601191,929.2166701957979,X11,Carnegie Mellon University,https://github.com/ChenWu98/cycle-diffusion?tab=readme-ov-file
10
+ SDEdit,SDEdit,918.7855764202982,917.2961474609109,MIT License,Stanford University,https://sde-image-editing.github.io
11
+ Pix2PixZero,Pix2PixZero,854.9344500670585,854.5099394215308,MIT License,"Carnegie Mellon University, Adobe Research",https://pix2pixzero.github.io/
arena_elo/results/latest/t2i_generation_leaderboard.csv CHANGED
@@ -1,18 +1,18 @@
1
  key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
2
- FLUX.1-dev,FLUX.1-dev,1142.0581529119786,1143.4965181495513,flux-1-dev-non-commercial-license (other),Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
3
- PlayGround V2.5,PlayGround V2.5,1114.4733917878725,1115.44974183415,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
4
- FLUX.1-schnell,FLUX.1-schnell,1095.1919208539869,1099.8402949195838,Apache-2.0,Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
5
- PlayGround V2,PlayGround V2,1071.1953260421708,1070.9781943889616,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
6
- Kolors,Kolors,1059.9768091690526,1058.9278023578413,Apache-2.0,Kwai Kolors,https://huggingface.co/Kwai-Kolors/Kolors
7
- StableCascade,StableCascade,1042.2740292337398,1044.698012486259,stable-cascade-nc-community (other),Stability AI,https://fal.ai/models/stable-cascade/api
8
- HunyuanDiT,HunyuanDiT,1019.1725460542228,1014.14790770645,tencent-hunyuan-community,Tencent,https://github.com/Tencent/HunyuanDiT
9
- PixArtAlpha,PixArtAlpha,1018.7688590382843,1011.3673764231929,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
10
- PixArtSigma,PixArtSigma,1017.5024468944063,1017.9587278893003,openrail++,PixArt-alpha,https://github.com/PixArt-alpha/PixArt-sigma
11
- SDXL-Lightning,SDXL-Lightning,1015.5898224267512,1020.0063006856607,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
12
- SD3,SD3,1006.1000828160398,1007.6715687753389,stabilityai-nc-research-community,Stability AI,https://huggingface.co/blog/sd3
13
- AuraFlow,AuraFlow,994.6438416026293,992.5777776758314,Apache-2.0,Fal.AI,https://huggingface.co/fal/AuraFlow
14
- SDXL,SDXL,964.4887318172774,965.830368614938,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
15
- SDXLTurbo,SDXLTurbo,913.5993709023219,912.0290237708969,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
16
- LCM(v1.5/XL),LCM(v1.5/XL),904.1511961853133,898.4691494073832,openrail++,Latent Consistency,https://fal.ai/models/fast-lcm-diffusion-turbo
17
- OpenJourney,OpenJourney,831.3542903772337,826.9276283450821,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
18
- LCM,LCM,789.4591818867234,804.3230828495077,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
 
1
  key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
2
+ FLUX.1-dev,FLUX.1-dev,1140.54064444776,1142.478433248384,flux-1-dev-non-commercial-license (other),Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
3
+ PlayGround V2.5,PlayGround V2.5,1115.0413282850327,1115.8660729402743,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
4
+ FLUX.1-schnell,FLUX.1-schnell,1092.9274950720344,1097.9940464682022,Apache-2.0,Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
5
+ PlayGround V2,PlayGround V2,1071.7726265799272,1071.5040505618556,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
6
+ Kolors,Kolors,1058.6589291047005,1057.6750924733155,Apache-2.0,Kwai Kolors,https://huggingface.co/Kwai-Kolors/Kolors
7
+ StableCascade,StableCascade,1042.913333399551,1045.2807916556396,stable-cascade-nc-community (other),Stability AI,https://fal.ai/models/stable-cascade/api
8
+ PixArtAlpha,PixArtAlpha,1019.1762583059761,1011.770053541195,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
9
+ HunyuanDiT,HunyuanDiT,1018.0203471450936,1013.0401202408287,tencent-hunyuan-community,Tencent,https://github.com/Tencent/HunyuanDiT
10
+ PixArtSigma,PixArtSigma,1017.8332359128535,1018.2583849827981,openrail++,PixArt-alpha,https://github.com/PixArt-alpha/PixArt-sigma
11
+ SDXL-Lightning,SDXL-Lightning,1015.929417091197,1020.2883464821336,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
12
+ SD3,SD3,1006.3839266840495,1007.9240613567083,stabilityai-nc-research-community,Stability AI,https://huggingface.co/blog/sd3
13
+ AuraFlow,AuraFlow,994.3106981605351,992.242324025994,Apache-2.0,Fal.AI,https://huggingface.co/fal/AuraFlow
14
+ SDXL,SDXL,964.9414706928835,966.2631624320217,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
15
+ SDXLTurbo,SDXLTurbo,914.0691290472807,912.4816793045377,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
16
+ LCM(v1.5/XL),LCM(v1.5/XL),904.7423661198958,898.9893685687374,openrail++,Latent Consistency,https://fal.ai/models/fast-lcm-diffusion-turbo
17
+ OpenJourney,OpenJourney,832.6104126653283,828.0593272803596,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
18
+ LCM,LCM,790.1283812858934,804.9328295962027,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
arena_elo/results/latest/video_generation_leaderboard.csv CHANGED
@@ -1,16 +1,16 @@
1
  key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
2
- CogVideoX-5B,CogVideoX-5B,1132.8058625703793,1134.9792418769139,CogVideoX LICENSE,THUDM,https://github.com/THUDM/CogVideo
3
- Mochi1,Mochi1,1125.450546864127,1125.0881795936793,Apache 2.0,Genmo AI,https://github.com/genmoai/mochi
4
- StableVideoDiffusion,StableVideoDiffusion,1119.6541987548815,1119.6606846142206,SVD-nc-community,Stability AI,https://fal.ai/models/fal-ai/fast-svd/text-to-video/api
5
- Pyramid Flow,Pyramid Flow,1109.3076186633843,1111.2037241143935,MIT LICENSE,Peking University,https://pyramid-flow.github.io/
6
- T2V-Turbo,T2V-Turbo,1054.1637414990266,1054.5851746339542,cc-by-nc-4.0,"University of California, Santa Barbara",https://github.com/Ji4chenLi/t2v-turbo
7
- CogVideoX-2B,CogVideoX-2B,1048.8492617607403,1047.2260718567795,CogVideoX LICENSE,THUDM,https://github.com/THUDM/CogVideo
8
- AnimateDiff,AnimateDiff,1039.8088570323023,1039.282837198361,creativeml-openrail-m,"The Chinese University of Hong Kong, Shanghai AI Lab, Stanford University",https://fal.ai/models/fast-animatediff-t2v
9
- VideoCrafter2,VideoCrafter2,1031.4364366567702,1030.8535421487534,Apache 2.0,Tencent AI Lab,https://ailab-cvc.github.io/videocrafter2/
10
- Allegro,Allegro,996.4877909612346,998.9896994797994,Apache 2.0,rhymes-ai,https://github.com/rhymes-ai/Allegro
11
- LaVie,LaVie,965.2987009413192,964.778020952365,Apache 2.0,Shanghai AI Lab,https://github.com/Vchitect/LaVie
12
- LTXVideo,LTXVideo,955.5655897899491,956.6621939138146,Apache 2.0,Lightricks,https://github.com/Lightricks/LTX-Video
13
- OpenSora,OpenSora,881.6768153618258,880.8791993411879,Apache 2.0,HPC-AI Tech,https://github.com/hpcaitech/Open-Sora
14
- OpenSora v1.2,OpenSora v1.2,872.8694554892492,870.2903351385157,Apache 2.0,HPC-AI Tech,https://github.com/hpcaitech/Open-Sora
15
- AnimateDiff Turbo,AnimateDiff Turbo,835.0510392691535,833.2532008948735,creativeml-openrail-m,"The Chinese University of Hong Kong, Shanghai AI Lab, Stanford University",https://fal.ai/models/fast-animatediff-t2v-turbo
16
- ModelScope,ModelScope,831.5740843856572,832.2678942423846,cc-by-nc-4.0,Alibaba Group,https://arxiv.org/abs/2308.06571
 
1
  key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
2
+ CogVideoX-5B,CogVideoX-5B,1135.3687032647802,1137.4502071323247,CogVideoX LICENSE,THUDM,https://github.com/THUDM/CogVideo
3
+ Mochi1,Mochi1,1125.7384643081691,1125.3719082547418,Apache 2.0,Genmo AI,https://github.com/genmoai/mochi
4
+ StableVideoDiffusion,StableVideoDiffusion,1117.729420623102,1117.7784800711422,SVD-nc-community,Stability AI,https://fal.ai/models/fal-ai/fast-svd/text-to-video/api
5
+ Pyramid Flow,Pyramid Flow,1109.6318946208864,1111.5514173990646,MIT LICENSE,Peking University,https://pyramid-flow.github.io/
6
+ T2V-Turbo,T2V-Turbo,1053.7466599517436,1054.1656932519484,cc-by-nc-4.0,"University of California, Santa Barbara",https://github.com/Ji4chenLi/t2v-turbo
7
+ CogVideoX-2B,CogVideoX-2B,1049.0498525063604,1047.4175015816522,CogVideoX LICENSE,THUDM,https://github.com/THUDM/CogVideo
8
+ AnimateDiff,AnimateDiff,1039.3527292117005,1038.8077990227764,creativeml-openrail-m,"The Chinese University of Hong Kong, Shanghai AI Lab, Stanford University",https://fal.ai/models/fast-animatediff-t2v
9
+ VideoCrafter2,VideoCrafter2,1030.3385942855953,1029.772281835828,Apache 2.0,Tencent AI Lab,https://ailab-cvc.github.io/videocrafter2/
10
+ Allegro,Allegro,1000.4880460748201,1002.9456853576637,Apache 2.0,rhymes-ai,https://github.com/rhymes-ai/Allegro
11
+ LaVie,LaVie,964.3781718312032,963.8704115935535,Apache 2.0,Shanghai AI Lab,https://github.com/Vchitect/LaVie
12
+ LTXVideo,LTXVideo,955.7125101266762,956.8216700870381,Apache 2.0,Lightricks,https://github.com/Lightricks/LTX-Video
13
+ OpenSora,OpenSora,880.7730380536314,879.9846635860854,Apache 2.0,HPC-AI Tech,https://github.com/hpcaitech/Open-Sora
14
+ OpenSora v1.2,OpenSora v1.2,872.9373563958695,870.3676769922687,Apache 2.0,HPC-AI Tech,https://github.com/hpcaitech/Open-Sora
15
+ AnimateDiff Turbo,AnimateDiff Turbo,834.1089618094404,832.3433342390309,creativeml-openrail-m,"The Chinese University of Hong Kong, Shanghai AI Lab, Stanford University",https://fal.ai/models/fast-animatediff-t2v-turbo
16
+ ModelScope,ModelScope,830.6455969360253,831.3512695948783,cc-by-nc-4.0,Alibaba Group,https://arxiv.org/abs/2308.06571