Spaces:
Running
on
Zero
Running
on
Zero
DongfuJiang
committed on
Commit
•
cca0b2a
1
Parent(s):
12e2ec8
Auto Daily Leaderboard update Fri Aug 30 12:00:24 PM EDT 2024
Browse files- arena_elo/results/20240830/clean_battle_t2i_generation.json +0 -0
- arena_elo/results/20240830/elo_results_t2i_generation.pkl +3 -0
- arena_elo/results/20240830/t2i_generation_leaderboard.csv +18 -0
- arena_elo/results/latest/clean_battle_t2i_generation.json +98 -0
- arena_elo/results/latest/elo_results_t2i_generation.pkl +2 -2
- arena_elo/results/latest/t2i_generation_leaderboard.csv +17 -17
arena_elo/results/20240830/clean_battle_t2i_generation.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
arena_elo/results/20240830/elo_results_t2i_generation.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b07bd1eb73ba2441e1a2826c961f95e0340ed7ed04ad558150f03309cd5687a
|
3 |
+
size 88248
|
arena_elo/results/20240830/t2i_generation_leaderboard.csv
ADDED
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
+
FLUX.1-dev,FLUX.1-dev,1128.1076601793302,1145.4292259194874,flux-1-dev-non-commercial-license (other),Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
|
3 |
+
PlayGround V2.5,PlayGround V2.5,1126.2242175792326,1127.0304762360083,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
|
4 |
+
FLUX.1-schnell,FLUX.1-schnell,1086.3891359749045,1082.431753147752,Apache-2.0,Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
|
5 |
+
PlayGround V2,PlayGround V2,1072.3338566106129,1070.3959486055644,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
|
6 |
+
Kolors,Kolors,1055.6435171321828,1054.0770126985808,Apache-2.0,Kwai Kolors,https://huggingface.co/Kwai-Kolors/Kolors
|
7 |
+
HunyuanDiT,HunyuanDiT,1038.8528018338375,1026.9064910406098,tencent-hunyuan-community,Tencent,https://github.com/Tencent/HunyuanDiT
|
8 |
+
StableCascade,StableCascade,1037.482462728124,1039.871994721617,stable-cascade-nc-community (other),Stability AI,https://fal.ai/models/stable-cascade/api
|
9 |
+
SDXL-Lightning,SDXL-Lightning,1023.5139956954258,1026.8635094413457,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
|
10 |
+
PixArtAlpha,PixArtAlpha,1021.8191124795862,1011.2525795471853,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
|
11 |
+
PixArtSigma,PixArtSigma,1018.5453640621988,1017.5527842992569,openrail++,PixArt-alpha,https://github.com/PixArt-alpha/PixArt-sigma
|
12 |
+
AuraFlow,AuraFlow,1003.1773899329969,999.230314834677,Apache-2.0,Fal.AI,https://huggingface.co/fal/AuraFlow
|
13 |
+
SD3,SD3,990.1711320470132,985.5201090260039,stabilityai-nc-research-community,Stability AI,https://huggingface.co/blog/sd3
|
14 |
+
SDXL,SDXL,964.1291628891177,963.834050856154,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
|
15 |
+
SDXLTurbo,SDXLTurbo,912.3456630523833,908.9499820955415,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
|
16 |
+
LCM(v1.5/XL),LCM(v1.5/XL),904.8799595749739,897.333770100635,openrail++,Latent Consistency,https://fal.ai/models/fast-lcm-diffusion-turbo
|
17 |
+
OpenJourney,OpenJourney,827.3303069916949,821.2404802457792,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
|
18 |
+
LCM,LCM,789.0542612363914,802.0876918790069,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
|
arena_elo/results/latest/clean_battle_t2i_generation.json
CHANGED
@@ -95852,5 +95852,103 @@
|
|
95852 |
"judge": "arena_user_10.16.34.60",
|
95853 |
"anony": true,
|
95854 |
"tstamp": 1724957244.8733
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
95855 |
}
|
95856 |
]
|
|
|
95852 |
"judge": "arena_user_10.16.34.60",
|
95853 |
"anony": true,
|
95854 |
"tstamp": 1724957244.8733
|
95855 |
+
},
|
95856 |
+
{
|
95857 |
+
"model_a_conv_id": "fa377430c44e4740b8e19a6a52331bf8",
|
95858 |
+
"model_b_conv_id": "7425e0586f214a5a9aba4d4a21b96ad6",
|
95859 |
+
"inputs": {
|
95860 |
+
"prompt": "una filiale di banca popolare di sondrio sul pianeta marte con i clienti che fanno la coda per entrare"
|
95861 |
+
},
|
95862 |
+
"model_a": "SDXL",
|
95863 |
+
"model_b": "OpenJourney",
|
95864 |
+
"vote_type": "bothbad_vote",
|
95865 |
+
"winner": "tie (bothbad)",
|
95866 |
+
"judge": "arena_user_10.16.18.162",
|
95867 |
+
"anony": true,
|
95868 |
+
"tstamp": 1724962761.8085
|
95869 |
+
},
|
95870 |
+
{
|
95871 |
+
"model_a_conv_id": "c918ef993350454f82b4833e789d4cf4",
|
95872 |
+
"model_b_conv_id": "08c316715a5e466494b93996c57a8e65",
|
95873 |
+
"inputs": {
|
95874 |
+
"prompt": "pope in mountain bike with guitar"
|
95875 |
+
},
|
95876 |
+
"model_a": "AuraFlow",
|
95877 |
+
"model_b": "PixArtSigma",
|
95878 |
+
"vote_type": "bothbad_vote",
|
95879 |
+
"winner": "tie (bothbad)",
|
95880 |
+
"judge": "arena_user_10.16.10.147",
|
95881 |
+
"anony": true,
|
95882 |
+
"tstamp": 1724963166.0098
|
95883 |
+
},
|
95884 |
+
{
|
95885 |
+
"model_a_conv_id": "c8e2c90f233049c7807f177240dad575",
|
95886 |
+
"model_b_conv_id": "34f0d757308f4b7dbf99030849030ae1",
|
95887 |
+
"inputs": {
|
95888 |
+
"prompt": "Figure: Fine-Tuning Process\nPre-trained Model:\nIllustration: Show a large neural network with multiple layers. Label this as \"Pre-trained Model\" with an arrow indicating it has been trained on a \"Large General Dataset\" (e.g., ImageNet for images, large text corpus for NLP).\nLayers: Highlight the layers that are pre-trained, using a color or shading to indicate they contain learned features.\nTask-Specific Dataset:\nIllustration: Next to the pre-trained model, show a smaller dataset labeled \"Task-Specific Dataset\" (e.g., labeled images for a specific classification task).\nModel Adaptation:\nIllustration: Show the pre-trained model with an additional layer on top, labeled \"Task-Specific Layer\" or \"Output Layer.\" This layer is specific to the new task.\nAnnotations: Use arrows to indicate that the new layer is added, and some layers of the pre-trained model might be frozen initially.\nFine-Tuning:\nIllustration: Show the entire model (pre-trained layers plus the new task-specific layer) with arrows indicating the flow of data during training.\nAnnotations: Indicate that backpropagation is used to update weights, with some layers gradually unfrozen.\nOutput:\nIllustration: Show the final model with an arrow pointing to \"Task-Specific Predictions\" or \"Task-Specific Output.\"\nFlowchart: Fine-Tuning Steps\nStart:\nBox: \"Start with Pre-trained Model\"\nArrow: Pointing to the next step.\nLoad Task-Specific Dataset:\nBox: \"Load Task-Specific Dataset\"\nArrow: Pointing to the next step.\nModify Model Architecture:\nBox: \"Add Task-Specific Layer\"\nArrow: Pointing to the next step.\nFreeze Layers:\nBox: \"Freeze Some Pre-trained Layers\"\nArrow: Pointing to the next step.\nTrain Model:\nBox: \"Fine-Tune Model on Task-Specific Data\"\nArrow: Pointing to the next step.\nEvaluate Model:\nBox: \"Evaluate on Validation Set\"\nArrow: Pointing to the next step.\nAdjust Hyperparameters:\nBox: \"Adjust Hyperparameters if Necessary\"\nArrow: Pointing back 
to \"Train Model\" for iteration or forward to the next step.\nDeploy Model:\nBox: \"Deploy Fine-Tuned Model\"\nArrow: Pointing to \"End.\"\nEnd:\nBox: \"End\"\nExplanation\nPre-trained Model: Represents the starting point with general knowledge.\nTask-Specific Dataset: Shows the new data that will guide the fine-tuning.\nModel Adaptation: Illustrates the addition of new layers and potential freezing of existing ones.\nFine-Tuning: Highlights the training process where the model learns task-specific features.\nOutput: Demonstrates the model's ability to make predictions for the specific task.\nThis visualization helps convey the concept of fine-tuning by showing how a pre-trained model is adapted and trained to perform a specific task using a smaller, task-specific dataset."
|
95889 |
+
},
|
95890 |
+
"model_a": "FLUX.1-schnell",
|
95891 |
+
"model_b": "HunyuanDiT",
|
95892 |
+
"vote_type": "leftvote",
|
95893 |
+
"winner": "model_a",
|
95894 |
+
"judge": "arena_user_10.16.18.162",
|
95895 |
+
"anony": true,
|
95896 |
+
"tstamp": 1724969910.1761
|
95897 |
+
},
|
95898 |
+
{
|
95899 |
+
"model_a_conv_id": "601acf65eec34c349ebf1e11f5ef38e7",
|
95900 |
+
"model_b_conv_id": "e211933bb74745b988d325f77f96e3c3",
|
95901 |
+
"inputs": {
|
95902 |
+
"prompt": "portait of mystical witch, hyper detailed, flowing background, intricate and detailed, trippy, 8 k "
|
95903 |
+
},
|
95904 |
+
"model_a": "PlayGround V2.5",
|
95905 |
+
"model_b": "HunyuanDiT",
|
95906 |
+
"vote_type": "leftvote",
|
95907 |
+
"winner": "model_a",
|
95908 |
+
"judge": "arena_user_10.16.34.60",
|
95909 |
+
"anony": true,
|
95910 |
+
"tstamp": 1725013008.3565
|
95911 |
+
},
|
95912 |
+
{
|
95913 |
+
"model_a_conv_id": "9a98c6652dea4da9a6c34e2af29dca9e",
|
95914 |
+
"model_b_conv_id": "04ed72a7dcab447fa2dda9bfeac8d028",
|
95915 |
+
"inputs": {
|
95916 |
+
"prompt": "Young woman wearing red dress and black sweater gives approval while holding cell phone ."
|
95917 |
+
},
|
95918 |
+
"model_a": "SDXL",
|
95919 |
+
"model_b": "Kolors",
|
95920 |
+
"vote_type": "rightvote",
|
95921 |
+
"winner": "model_b",
|
95922 |
+
"judge": "arena_user_10.16.10.147",
|
95923 |
+
"anony": true,
|
95924 |
+
"tstamp": 1725013023.6849
|
95925 |
+
},
|
95926 |
+
{
|
95927 |
+
"model_a_conv_id": "78b783666c2944db91d1d65249e3afcc",
|
95928 |
+
"model_b_conv_id": "5dd887c139cc4d7f93e954687e681fac",
|
95929 |
+
"inputs": {
|
95930 |
+
"prompt": "a cute dog is playing a ball"
|
95931 |
+
},
|
95932 |
+
"model_a": "PlayGround V2.5",
|
95933 |
+
"model_b": "AuraFlow",
|
95934 |
+
"vote_type": "leftvote",
|
95935 |
+
"winner": "model_a",
|
95936 |
+
"judge": "arena_user_10.16.1.165",
|
95937 |
+
"anony": true,
|
95938 |
+
"tstamp": 1725013066.5854
|
95939 |
+
},
|
95940 |
+
{
|
95941 |
+
"model_a_conv_id": "ab920d339c9040d588bd699e8737ece0",
|
95942 |
+
"model_b_conv_id": "b70c63a515da46d2bd8c5c7ce4bf2579",
|
95943 |
+
"inputs": {
|
95944 |
+
"prompt": "A cat riding a bamboo raft"
|
95945 |
+
},
|
95946 |
+
"model_a": "FLUX.1-dev",
|
95947 |
+
"model_b": "SD3",
|
95948 |
+
"vote_type": "leftvote",
|
95949 |
+
"winner": "model_a",
|
95950 |
+
"judge": "arena_user_10.16.34.60",
|
95951 |
+
"anony": true,
|
95952 |
+
"tstamp": 1725019838.6535
|
95953 |
}
|
95954 |
]
|
arena_elo/results/latest/elo_results_t2i_generation.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b07bd1eb73ba2441e1a2826c961f95e0340ed7ed04ad558150f03309cd5687a
|
3 |
+
size 88248
|
arena_elo/results/latest/t2i_generation_leaderboard.csv
CHANGED
@@ -1,18 +1,18 @@
|
|
1 |
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
-
|
3 |
-
|
4 |
-
FLUX.1-schnell,FLUX.1-schnell,
|
5 |
-
PlayGround V2,PlayGround V2,1072.
|
6 |
-
Kolors,Kolors,
|
7 |
-
HunyuanDiT,HunyuanDiT,
|
8 |
-
StableCascade,StableCascade,1037.
|
9 |
-
SDXL-Lightning,SDXL-Lightning,1023.
|
10 |
-
PixArtAlpha,PixArtAlpha,
|
11 |
-
PixArtSigma,PixArtSigma,
|
12 |
-
AuraFlow,AuraFlow,
|
13 |
-
SD3,SD3,
|
14 |
-
SDXL,SDXL,964.
|
15 |
-
SDXLTurbo,SDXLTurbo,912.
|
16 |
-
LCM(v1.5/XL),LCM(v1.5/XL),
|
17 |
-
OpenJourney,OpenJourney,827.
|
18 |
-
LCM,LCM,789.
|
|
|
1 |
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
+
FLUX.1-dev,FLUX.1-dev,1128.1076601793302,1145.4292259194874,flux-1-dev-non-commercial-license (other),Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
|
3 |
+
PlayGround V2.5,PlayGround V2.5,1126.2242175792326,1127.0304762360083,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
|
4 |
+
FLUX.1-schnell,FLUX.1-schnell,1086.3891359749045,1082.431753147752,Apache-2.0,Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
|
5 |
+
PlayGround V2,PlayGround V2,1072.3338566106129,1070.3959486055644,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
|
6 |
+
Kolors,Kolors,1055.6435171321828,1054.0770126985808,Apache-2.0,Kwai Kolors,https://huggingface.co/Kwai-Kolors/Kolors
|
7 |
+
HunyuanDiT,HunyuanDiT,1038.8528018338375,1026.9064910406098,tencent-hunyuan-community,Tencent,https://github.com/Tencent/HunyuanDiT
|
8 |
+
StableCascade,StableCascade,1037.482462728124,1039.871994721617,stable-cascade-nc-community (other),Stability AI,https://fal.ai/models/stable-cascade/api
|
9 |
+
SDXL-Lightning,SDXL-Lightning,1023.5139956954258,1026.8635094413457,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
|
10 |
+
PixArtAlpha,PixArtAlpha,1021.8191124795862,1011.2525795471853,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
|
11 |
+
PixArtSigma,PixArtSigma,1018.5453640621988,1017.5527842992569,openrail++,PixArt-alpha,https://github.com/PixArt-alpha/PixArt-sigma
|
12 |
+
AuraFlow,AuraFlow,1003.1773899329969,999.230314834677,Apache-2.0,Fal.AI,https://huggingface.co/fal/AuraFlow
|
13 |
+
SD3,SD3,990.1711320470132,985.5201090260039,stabilityai-nc-research-community,Stability AI,https://huggingface.co/blog/sd3
|
14 |
+
SDXL,SDXL,964.1291628891177,963.834050856154,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
|
15 |
+
SDXLTurbo,SDXLTurbo,912.3456630523833,908.9499820955415,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
|
16 |
+
LCM(v1.5/XL),LCM(v1.5/XL),904.8799595749739,897.333770100635,openrail++,Latent Consistency,https://fal.ai/models/fast-lcm-diffusion-turbo
|
17 |
+
OpenJourney,OpenJourney,827.3303069916949,821.2404802457792,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
|
18 |
+
LCM,LCM,789.0542612363914,802.0876918790069,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
|