Spaces:
Running
on
Zero
Running
on
Zero
DongfuJiang
committed on
Commit
•
7e1bd0d
1
Parent(s):
a56205d
update
Browse files- app.py +2 -13
- arena_elo/elo_rating/elo_analysis.py +1 -1
- arena_elo/generation_model_info.json +20 -0
- arena_elo/results/20240818/elo_results_t2i_generation.pkl +2 -2
- arena_elo/results/20240818/t2i_generation_leaderboard.csv +17 -14
- arena_elo/results/latest/elo_results_t2i_generation.pkl +2 -2
- arena_elo/results/latest/t2i_generation_leaderboard.csv +17 -14
- model/model_manager.py +13 -2
- serve/leaderboard.py +21 -3
app.py
CHANGED
@@ -7,14 +7,6 @@ from serve.leaderboard import build_leaderboard_tab
|
|
7 |
from model.model_manager import ModelManager
|
8 |
from pathlib import Path
|
9 |
from serve.constants import SERVER_PORT, ROOT_PATH, ELO_RESULTS_DIR
|
10 |
-
from model.pre_download import pre_download_all_models, pre_download_video_models
|
11 |
-
|
12 |
-
def debug_packages():
|
13 |
-
import pkg_resources
|
14 |
-
|
15 |
-
installed_packages = pkg_resources.working_set
|
16 |
-
for package in installed_packages:
|
17 |
-
print(f"{package.key}=={package.version}")
|
18 |
|
19 |
def build_combine_demo(models, elo_results_file, leaderboard_table_file):
|
20 |
|
@@ -104,11 +96,8 @@ if __name__ == "__main__":
|
|
104 |
server_port = int(SERVER_PORT)
|
105 |
root_path = ROOT_PATH
|
106 |
elo_results_dir = ELO_RESULTS_DIR
|
107 |
-
models = ModelManager()
|
108 |
-
|
109 |
-
debug_packages()
|
110 |
-
|
111 |
-
pre_download_all_models()
|
112 |
|
113 |
elo_results_file, leaderboard_table_file = load_elo_results(elo_results_dir)
|
114 |
demo = build_combine_demo(models, elo_results_file, leaderboard_table_file)
|
|
|
7 |
from model.model_manager import ModelManager
|
8 |
from pathlib import Path
|
9 |
from serve.constants import SERVER_PORT, ROOT_PATH, ELO_RESULTS_DIR
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
10 |
|
11 |
def build_combine_demo(models, elo_results_file, leaderboard_table_file):
|
12 |
|
|
|
96 |
server_port = int(SERVER_PORT)
|
97 |
root_path = ROOT_PATH
|
98 |
elo_results_dir = ELO_RESULTS_DIR
|
99 |
+
models = ModelManager(enable_nsfw=True, pre_download=True, debug_packages=True)
|
100 |
+
# models = ModelManager(enable_nsfw=False, pre_download=False, debug_packages=False)
|
|
|
|
|
|
|
101 |
|
102 |
elo_results_file, leaderboard_table_file = load_elo_results(elo_results_dir)
|
103 |
demo = build_combine_demo(models, elo_results_file, leaderboard_table_file)
|
arena_elo/elo_rating/elo_analysis.py
CHANGED
@@ -381,7 +381,7 @@ if __name__ == "__main__":
|
|
381 |
"--rating-system", type=str, choices=["bt", "elo"], default="bt"
|
382 |
)
|
383 |
parser.add_argument("--exclude-tie", action="store_true", default=False)
|
384 |
-
parser.add_argument("--min_num_battles_per_model", type=int, default=
|
385 |
args = parser.parse_args()
|
386 |
|
387 |
np.random.seed(42)
|
|
|
381 |
"--rating-system", type=str, choices=["bt", "elo"], default="bt"
|
382 |
)
|
383 |
parser.add_argument("--exclude-tie", action="store_true", default=False)
|
384 |
+
parser.add_argument("--min_num_battles_per_model", type=int, default=25)
|
385 |
args = parser.parse_args()
|
386 |
|
387 |
np.random.seed(42)
|
arena_elo/generation_model_info.json
CHANGED
@@ -63,5 +63,25 @@
|
|
63 |
"Link": "https://fal.ai/models/fal-ai/pixart-sigma",
|
64 |
"License": "openrail++",
|
65 |
"Organization": "PixArt-alpha"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
66 |
}
|
67 |
}
|
|
|
63 |
"Link": "https://fal.ai/models/fal-ai/pixart-sigma",
|
64 |
"License": "openrail++",
|
65 |
"Organization": "PixArt-alpha"
|
66 |
+
},
|
67 |
+
"FLUX1schnell": {
|
68 |
+
"Link": "https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux",
|
69 |
+
"License": "flux-1-dev-non-commercial-license (other)",
|
70 |
+
"Organization": "Black Forest Labs"
|
71 |
+
},
|
72 |
+
"FLUX1dev": {
|
73 |
+
"Link": "https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux",
|
74 |
+
"License": "flux-1-dev-non-commercial-license (other)",
|
75 |
+
"Organization": "Black Forest Labs"
|
76 |
+
},
|
77 |
+
"AuraFlow": {
|
78 |
+
"Link": "https://huggingface.co/fal/AuraFlow",
|
79 |
+
"License": "Apache-2.0",
|
80 |
+
"Organization": "Fal.AI"
|
81 |
+
},
|
82 |
+
"Kolors": {
|
83 |
+
"Link": "https://huggingface.co/Kwai-Kolors/Kolors",
|
84 |
+
"License": "Apache-2.0",
|
85 |
+
"Organization": "Kwai Kolors"
|
86 |
}
|
87 |
}
|
arena_elo/results/20240818/elo_results_t2i_generation.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4935474b3d38916a2a46738fa4a4e57a34c59abe3c61111a9e79a46187a24b38
|
3 |
+
size 86085
|
arena_elo/results/20240818/t2i_generation_leaderboard.csv
CHANGED
@@ -1,15 +1,18 @@
|
|
1 |
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
-
|
3 |
-
|
4 |
-
PlayGround V2,PlayGround V2,
|
5 |
-
|
6 |
-
|
7 |
-
|
8 |
-
|
9 |
-
|
10 |
-
|
11 |
-
|
12 |
-
|
13 |
-
|
14 |
-
|
15 |
-
|
|
|
|
|
|
|
|
1 |
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
+
FLUX1dev,FLUX1dev,1139.2171997788664,1154.9401991259183,flux-1-dev-non-commercial-license (other),Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
|
3 |
+
PlayGround V2.5,PlayGround V2.5,1132.1836548838864,1132.5651835501171,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
|
4 |
+
PlayGround V2,PlayGround V2,1075.3571099849078,1072.7594472644441,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
|
5 |
+
FLUX1schnell,FLUX1schnell,1066.505710109784,1064.6512761628912,flux-1-dev-non-commercial-license (other),Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
|
6 |
+
HunyuanDiT,HunyuanDiT,1051.1795507568463,1036.2184409268364,tencent-hunyuan-community,Tencent,https://huggingface.co/Tencent-Hunyuan/HunyuanDiT
|
7 |
+
StableCascade,StableCascade,1038.864872104377,1041.0470474695244,stable-cascade-nc-community (other),Stability AI,https://huggingface.co/stabilityai/stable-cascade
|
8 |
+
AuraFlow,AuraFlow,1034.6965881363633,1028.364203196634,Apache-2.0,Fal.AI,https://huggingface.co/fal/AuraFlow
|
9 |
+
PixArtAlpha,PixArtAlpha,1025.6380572404505,1014.320702980116,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
|
10 |
+
SDXLLightning,SDXLLightning,1025.1762643276309,1028.287019099912,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
|
11 |
+
PixArtSigma,PixArtSigma,1020.4950012337554,1019.0949741744585,openrail++,PixArt-alpha,https://fal.ai/models/fal-ai/pixart-sigma
|
12 |
+
SD3,SD3,993.6426659727981,987.8044800091614,stabilityai-nc-research-community,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-3-medium
|
13 |
+
Kolors,Kolors,984.8923136492953,980.8110707842453,Apache-2.0,Kwai Kolors,https://huggingface.co/Kwai-Kolors/Kolors
|
14 |
+
SDXL,SDXL,966.8046145579953,966.0264408253988,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
|
15 |
+
SDXLTurbo,SDXLTurbo,915.0182076955812,911.0171286468213,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
|
16 |
+
LCM(v1.5/XL),LCM(v1.5/XL),907.8353926442691,900.2703944909691,openrail++,Latent Consistency,https://fal.ai/models/fal-ai/fast-lcm-diffusion/api
|
17 |
+
OpenJourney,OpenJourney,830.3596812818465,823.5680806695481,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
|
18 |
+
LCM,LCM,792.1331156413471,804.405883013325,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
|
arena_elo/results/latest/elo_results_t2i_generation.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4935474b3d38916a2a46738fa4a4e57a34c59abe3c61111a9e79a46187a24b38
|
3 |
+
size 86085
|
arena_elo/results/latest/t2i_generation_leaderboard.csv
CHANGED
@@ -1,15 +1,18 @@
|
|
1 |
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
-
|
3 |
-
|
4 |
-
PlayGround V2,PlayGround V2,
|
5 |
-
|
6 |
-
|
7 |
-
|
8 |
-
|
9 |
-
|
10 |
-
|
11 |
-
|
12 |
-
|
13 |
-
|
14 |
-
|
15 |
-
|
|
|
|
|
|
|
|
1 |
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
+
FLUX1dev,FLUX1dev,1139.2171997788664,1154.9401991259183,flux-1-dev-non-commercial-license (other),Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
|
3 |
+
PlayGround V2.5,PlayGround V2.5,1132.1836548838864,1132.5651835501171,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
|
4 |
+
PlayGround V2,PlayGround V2,1075.3571099849078,1072.7594472644441,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
|
5 |
+
FLUX1schnell,FLUX1schnell,1066.505710109784,1064.6512761628912,flux-1-dev-non-commercial-license (other),Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
|
6 |
+
HunyuanDiT,HunyuanDiT,1051.1795507568463,1036.2184409268364,tencent-hunyuan-community,Tencent,https://huggingface.co/Tencent-Hunyuan/HunyuanDiT
|
7 |
+
StableCascade,StableCascade,1038.864872104377,1041.0470474695244,stable-cascade-nc-community (other),Stability AI,https://huggingface.co/stabilityai/stable-cascade
|
8 |
+
AuraFlow,AuraFlow,1034.6965881363633,1028.364203196634,Apache-2.0,Fal.AI,https://huggingface.co/fal/AuraFlow
|
9 |
+
PixArtAlpha,PixArtAlpha,1025.6380572404505,1014.320702980116,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
|
10 |
+
SDXLLightning,SDXLLightning,1025.1762643276309,1028.287019099912,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
|
11 |
+
PixArtSigma,PixArtSigma,1020.4950012337554,1019.0949741744585,openrail++,PixArt-alpha,https://fal.ai/models/fal-ai/pixart-sigma
|
12 |
+
SD3,SD3,993.6426659727981,987.8044800091614,stabilityai-nc-research-community,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-3-medium
|
13 |
+
Kolors,Kolors,984.8923136492953,980.8110707842453,Apache-2.0,Kwai Kolors,https://huggingface.co/Kwai-Kolors/Kolors
|
14 |
+
SDXL,SDXL,966.8046145579953,966.0264408253988,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
|
15 |
+
SDXLTurbo,SDXLTurbo,915.0182076955812,911.0171286468213,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
|
16 |
+
LCM(v1.5/XL),LCM(v1.5/XL),907.8353926442691,900.2703944909691,openrail++,Latent Consistency,https://fal.ai/models/fal-ai/fast-lcm-diffusion/api
|
17 |
+
OpenJourney,OpenJourney,830.3596812818465,823.5680806695481,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
|
18 |
+
LCM,LCM,792.1331156413471,804.405883013325,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
|
model/model_manager.py
CHANGED
@@ -7,12 +7,19 @@ import spaces
|
|
7 |
from PIL import Image
|
8 |
from .models import IMAGE_GENERATION_MODELS, IMAGE_EDITION_MODELS, VIDEO_GENERATION_MODELS, MUSEUM_UNSUPPORTED_MODELS, DESIRED_APPEAR_MODEL, load_pipeline
|
9 |
from .fetch_museum_results import draw_from_imagen_museum, draw2_from_imagen_museum, draw_from_videogen_museum, draw2_from_videogen_museum
|
10 |
-
|
11 |
from transformers import AutoTokenizer, AutoModelForCausalLM
|
12 |
import torch
|
13 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
14 |
class ModelManager:
|
15 |
-
def __init__(self, enable_nsfw=
|
16 |
self.model_ig_list = IMAGE_GENERATION_MODELS
|
17 |
self.model_ie_list = IMAGE_EDITION_MODELS
|
18 |
self.model_vg_list = VIDEO_GENERATION_MODELS
|
@@ -21,6 +28,10 @@ class ModelManager:
|
|
21 |
self.enable_nsfw = enable_nsfw
|
22 |
self.load_guard(enable_nsfw)
|
23 |
self.loaded_models = {}
|
|
|
|
|
|
|
|
|
24 |
|
25 |
def load_model_pipe(self, model_name):
|
26 |
if not model_name in self.loaded_models:
|
|
|
7 |
from PIL import Image
|
8 |
from .models import IMAGE_GENERATION_MODELS, IMAGE_EDITION_MODELS, VIDEO_GENERATION_MODELS, MUSEUM_UNSUPPORTED_MODELS, DESIRED_APPEAR_MODEL, load_pipeline
|
9 |
from .fetch_museum_results import draw_from_imagen_museum, draw2_from_imagen_museum, draw_from_videogen_museum, draw2_from_videogen_museum
|
10 |
+
from .pre_download import pre_download_all_models, pre_download_video_models
|
11 |
from transformers import AutoTokenizer, AutoModelForCausalLM
|
12 |
import torch
|
13 |
|
14 |
+
def debug_packages():
|
15 |
+
import pkg_resources
|
16 |
+
|
17 |
+
installed_packages = pkg_resources.working_set
|
18 |
+
for package in installed_packages:
|
19 |
+
print(f"{package.key}=={package.version}")
|
20 |
+
|
21 |
class ModelManager:
|
22 |
+
def __init__(self, enable_nsfw=False, pre_download=False, debug_packages=False):
|
23 |
self.model_ig_list = IMAGE_GENERATION_MODELS
|
24 |
self.model_ie_list = IMAGE_EDITION_MODELS
|
25 |
self.model_vg_list = VIDEO_GENERATION_MODELS
|
|
|
28 |
self.enable_nsfw = enable_nsfw
|
29 |
self.load_guard(enable_nsfw)
|
30 |
self.loaded_models = {}
|
31 |
+
if pre_download:
|
32 |
+
pre_download_all_models()
|
33 |
+
if debug_packages:
|
34 |
+
debug_packages()
|
35 |
|
36 |
def load_model_pipe(self, model_name):
|
37 |
if not model_name in self.loaded_models:
|
serve/leaderboard.py
CHANGED
@@ -107,13 +107,24 @@ def get_full_table(anony_arena_df, full_arena_df, model_table_df):
|
|
107 |
if model_key in anony_arena_df.index:
|
108 |
idx = anony_arena_df.index.get_loc(model_key)
|
109 |
row.append(round(anony_arena_df.iloc[idx]["rating"]))
|
|
|
|
|
|
|
110 |
else:
|
111 |
row.append(np.nan)
|
|
|
|
|
112 |
if model_key in full_arena_df.index:
|
113 |
idx = full_arena_df.index.get_loc(model_key)
|
114 |
row.append(round(full_arena_df.iloc[idx]["rating"]))
|
|
|
|
|
|
|
|
|
115 |
else:
|
116 |
row.append(np.nan)
|
|
|
|
|
117 |
# row.append(model_table_df.iloc[i]["MT-bench (score)"])
|
118 |
# row.append(model_table_df.iloc[i]["Num Battles"])
|
119 |
# row.append(model_table_df.iloc[i]["MMLU"])
|
@@ -124,6 +135,9 @@ def get_full_table(anony_arena_df, full_arena_df, model_table_df):
|
|
124 |
|
125 |
values.append(row)
|
126 |
values.sort(key=lambda x: -x[1] if not np.isnan(x[1]) else 1e9)
|
|
|
|
|
|
|
127 |
return values
|
128 |
|
129 |
|
@@ -244,7 +258,7 @@ def build_leaderboard_tab(elo_results_file, leaderboard_table_file, show_plot=Tr
|
|
244 |
value=arena_table_vals,
|
245 |
elem_id="arena_leaderboard_dataframe",
|
246 |
height=700,
|
247 |
-
column_widths=[
|
248 |
wrap=True,
|
249 |
)
|
250 |
with gr.Tab("Full Leaderboard", id=1):
|
@@ -253,16 +267,20 @@ def build_leaderboard_tab(elo_results_file, leaderboard_table_file, show_plot=Tr
|
|
253 |
full_table_vals = get_full_table(anony_arena_df, full_arena_df, model_table_df)
|
254 |
gr.Dataframe(
|
255 |
headers=[
|
|
|
256 |
"🤖 Model",
|
257 |
"⭐ Arena Elo (anony)",
|
|
|
258 |
"⭐ Arena Elo (full)",
|
|
|
|
|
259 |
"Organization",
|
260 |
"License",
|
261 |
],
|
262 |
-
datatype=["markdown", "number", "number", "str", "str"],
|
263 |
value=full_table_vals,
|
264 |
elem_id="full_leaderboard_dataframe",
|
265 |
-
column_widths=[
|
266 |
height=700,
|
267 |
wrap=True,
|
268 |
)
|
|
|
107 |
if model_key in anony_arena_df.index:
|
108 |
idx = anony_arena_df.index.get_loc(model_key)
|
109 |
row.append(round(anony_arena_df.iloc[idx]["rating"]))
|
110 |
+
upper_diff = round(anony_arena_df.iloc[idx]["rating_q975"] - anony_arena_df.iloc[idx]["rating"])
|
111 |
+
lower_diff = round(anony_arena_df.iloc[idx]["rating"] - anony_arena_df.iloc[idx]["rating_q025"])
|
112 |
+
row.append(f"+{upper_diff}/-{lower_diff}")
|
113 |
else:
|
114 |
row.append(np.nan)
|
115 |
+
row.append("N/A")
|
116 |
+
|
117 |
if model_key in full_arena_df.index:
|
118 |
idx = full_arena_df.index.get_loc(model_key)
|
119 |
row.append(round(full_arena_df.iloc[idx]["rating"]))
|
120 |
+
upper_diff = round(full_arena_df.iloc[idx]["rating_q975"] - full_arena_df.iloc[idx]["rating"])
|
121 |
+
lower_diff = round(full_arena_df.iloc[idx]["rating"] - full_arena_df.iloc[idx]["rating_q025"])
|
122 |
+
row.append(f"+{upper_diff}/-{lower_diff}")
|
123 |
+
row.append(round(full_arena_df.iloc[idx]["num_battles"]))
|
124 |
else:
|
125 |
row.append(np.nan)
|
126 |
+
row.append("N/A")
|
127 |
+
row.append(np.nan)
|
128 |
# row.append(model_table_df.iloc[i]["MT-bench (score)"])
|
129 |
# row.append(model_table_df.iloc[i]["Num Battles"])
|
130 |
# row.append(model_table_df.iloc[i]["MMLU"])
|
|
|
135 |
|
136 |
values.append(row)
|
137 |
values.sort(key=lambda x: -x[1] if not np.isnan(x[1]) else 1e9)
|
138 |
+
# insert rank
|
139 |
+
for i, row in enumerate(values):
|
140 |
+
row.insert(0, i + 1)
|
141 |
return values
|
142 |
|
143 |
|
|
|
258 |
value=arena_table_vals,
|
259 |
elem_id="arena_leaderboard_dataframe",
|
260 |
height=700,
|
261 |
+
column_widths=[30, 50, 30, 30, 30, 70, 150],
|
262 |
wrap=True,
|
263 |
)
|
264 |
with gr.Tab("Full Leaderboard", id=1):
|
|
|
267 |
full_table_vals = get_full_table(anony_arena_df, full_arena_df, model_table_df)
|
268 |
gr.Dataframe(
|
269 |
headers=[
|
270 |
+
"Rank",
|
271 |
"🤖 Model",
|
272 |
"⭐ Arena Elo (anony)",
|
273 |
+
"📊 95% CI",
|
274 |
"⭐ Arena Elo (full)",
|
275 |
+
"📊 95% CI",
|
276 |
+
"🗳️ Votes",
|
277 |
"Organization",
|
278 |
"License",
|
279 |
],
|
280 |
+
datatype=["str", "markdown", "number", "str", "number", "str", "number", "str", "str"],
|
281 |
value=full_table_vals,
|
282 |
elem_id="full_leaderboard_dataframe",
|
283 |
+
column_widths=[30, 50, 30, 30, 30, 30, 30, 70, 150],
|
284 |
height=700,
|
285 |
wrap=True,
|
286 |
)
|