Spaces:
Running
on
Zero
Running
on
Zero
DongfuJiang
committed on
Commit
•
f6608c4
1
Parent(s):
73848fe
update
Browse files- arena_elo/elo_rating/clean_battle_data.py +2 -1
- arena_elo/generation_model_info.json +6 -1
- arena_elo/results/20240315/elo_results_image_editing.pkl +2 -2
- arena_elo/results/20240327/clean_battle_t2i_generation.json +0 -0
- arena_elo/results/20240327/elo_results_t2i_generation.pkl +2 -2
- arena_elo/results/20240327/t2i_generation_leaderboard.csv +9 -10
- arena_elo/results/latest/clean_battle_t2i_generation_20240327.json +0 -0
- arena_elo/results/latest/elo_results_image_editing.pkl +2 -2
- arena_elo/results/latest/elo_results_t2i_generation.pkl +2 -2
- arena_elo/results/latest/t2i_generation_leaderboard.csv +9 -10
- arena_elo/update_elo_rating.sh +2 -2
arena_elo/elo_rating/clean_battle_data.py
CHANGED
@@ -82,6 +82,7 @@ def replace_model_name(old_name, tstamp):
|
|
82 |
"claude-instant-v1": "claude-instant-1",
|
83 |
"oasst-sft-1-pythia-12b": "oasst-pythia-12b",
|
84 |
"claude-2": "claude-2.0",
|
|
|
85 |
}
|
86 |
if old_name in ["gpt-4", "gpt-3.5-turbo"]:
|
87 |
if tstamp > 1687849200:
|
@@ -203,7 +204,6 @@ def clean_battle_data(
|
|
203 |
# continue
|
204 |
|
205 |
# Replace bard with palm
|
206 |
-
models = [replace_model_name(m, row["tstamp"]) for m in models]
|
207 |
if task_name == "image_editing":
|
208 |
if not all(x.startswith("imagenhub_") and x.endswith("_edition") for x in models):
|
209 |
# print(f"Invalid model names: {models}")
|
@@ -222,6 +222,7 @@ def clean_battle_data(
|
|
222 |
|
223 |
else:
|
224 |
raise ValueError(f"Invalid task_name: {task_name}")
|
|
|
225 |
|
226 |
# Exclude certain models
|
227 |
if exclude_model_names and any(x in exclude_model_names for x in models):
|
|
|
82 |
"claude-instant-v1": "claude-instant-1",
|
83 |
"oasst-sft-1-pythia-12b": "oasst-pythia-12b",
|
84 |
"claude-2": "claude-2.0",
|
85 |
+
"PlayGroundV2": "Playground v2",
|
86 |
}
|
87 |
if old_name in ["gpt-4", "gpt-3.5-turbo"]:
|
88 |
if tstamp > 1687849200:
|
|
|
204 |
# continue
|
205 |
|
206 |
# Replace bard with palm
|
|
|
207 |
if task_name == "image_editing":
|
208 |
if not all(x.startswith("imagenhub_") and x.endswith("_edition") for x in models):
|
209 |
# print(f"Invalid model names: {models}")
|
|
|
222 |
|
223 |
else:
|
224 |
raise ValueError(f"Invalid task_name: {task_name}")
|
225 |
+
models = [replace_model_name(m, row["tstamp"]) for m in models]
|
226 |
|
227 |
# Exclude certain models
|
228 |
if exclude_model_names and any(x in exclude_model_names for x in models):
|
arena_elo/generation_model_info.json
CHANGED
@@ -9,6 +9,11 @@
|
|
9 |
"License": "Playground v2 Community License",
|
10 |
"Organization": "Playground"
|
11 |
},
|
|
|
|
|
|
|
|
|
|
|
12 |
"OpenJourney": {
|
13 |
"Link": "https://huggingface.co/prompthero/openjourney",
|
14 |
"License": "creativeml-openrail-m",
|
@@ -39,4 +44,4 @@
|
|
39 |
"License": "stable-cascade-nc-community (other)",
|
40 |
"Organization": "Stability AI"
|
41 |
}
|
42 |
-
}
|
|
|
9 |
"License": "Playground v2 Community License",
|
10 |
"Organization": "Playground"
|
11 |
},
|
12 |
+
"Playground v2.5": {
|
13 |
+
"Link": "https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic",
|
14 |
+
"License": "Playground v2 Community License",
|
15 |
+
"Organization": "Playground"
|
16 |
+
},
|
17 |
"OpenJourney": {
|
18 |
"Link": "https://huggingface.co/prompthero/openjourney",
|
19 |
"License": "creativeml-openrail-m",
|
|
|
44 |
"License": "stable-cascade-nc-community (other)",
|
45 |
"Organization": "Stability AI"
|
46 |
}
|
47 |
+
}
|
arena_elo/results/20240315/elo_results_image_editing.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5cef00c45d392a30913b367825270fcee5fd29e5c830866eef3d07146b3502f3
|
3 |
+
size 57091
|
arena_elo/results/20240327/clean_battle_t2i_generation.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
arena_elo/results/20240327/elo_results_t2i_generation.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f525abe69feb822d341929b27ef7660ddd5e6ff0491bed8383a8e3d19f0342bd
|
3 |
+
size 62414
|
arena_elo/results/20240327/t2i_generation_leaderboard.csv
CHANGED
@@ -1,11 +1,10 @@
|
|
1 |
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
-
Playground v2.5,Playground v2.5,
|
3 |
-
StableCascade,StableCascade,
|
4 |
-
|
5 |
-
|
6 |
-
|
7 |
-
|
8 |
-
|
9 |
-
|
10 |
-
|
11 |
-
LCM,LCM,790.5659076257482,805.8155782210948,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
|
|
|
1 |
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
+
Playground v2.5,Playground v2.5,1226.2872445351936,1246.1685934024742,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
|
3 |
+
StableCascade,StableCascade,1105.3322734027522,1087.9198960927265,stable-cascade-nc-community (other),Stability AI,https://huggingface.co/stabilityai/stable-cascade
|
4 |
+
Playground v2,Playground v2,1091.4371447234744,1090.676108819673,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
|
5 |
+
SDXLLightning,SDXLLightning,1043.235902888147,1045.0529259890538,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
|
6 |
+
PixArtAlpha,PixArtAlpha,1020.6412075829058,1006.9966036187151,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
|
7 |
+
SDXL,SDXL,964.7626495363717,969.5241392802999,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
|
8 |
+
SDXLTurbo,SDXLTurbo,912.2113859675355,914.3805456579931,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
|
9 |
+
OpenJourney,OpenJourney,841.2224045541894,832.2282703082603,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
|
10 |
+
LCM,LCM,794.8697868094328,810.2118373597045,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
|
|
arena_elo/results/latest/clean_battle_t2i_generation_20240327.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
arena_elo/results/latest/elo_results_image_editing.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5cef00c45d392a30913b367825270fcee5fd29e5c830866eef3d07146b3502f3
|
3 |
+
size 57091
|
arena_elo/results/latest/elo_results_t2i_generation.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f525abe69feb822d341929b27ef7660ddd5e6ff0491bed8383a8e3d19f0342bd
|
3 |
+
size 62414
|
arena_elo/results/latest/t2i_generation_leaderboard.csv
CHANGED
@@ -1,11 +1,10 @@
|
|
1 |
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
-
Playground v2.5,Playground v2.5,
|
3 |
-
StableCascade,StableCascade,
|
4 |
-
|
5 |
-
|
6 |
-
|
7 |
-
|
8 |
-
|
9 |
-
|
10 |
-
|
11 |
-
LCM,LCM,790.5659076257482,805.8155782210948,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
|
|
|
1 |
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
2 |
+
Playground v2.5,Playground v2.5,1226.2872445351936,1246.1685934024742,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
|
3 |
+
StableCascade,StableCascade,1105.3322734027522,1087.9198960927265,stable-cascade-nc-community (other),Stability AI,https://huggingface.co/stabilityai/stable-cascade
|
4 |
+
Playground v2,Playground v2,1091.4371447234744,1090.676108819673,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
|
5 |
+
SDXLLightning,SDXLLightning,1043.235902888147,1045.0529259890538,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
|
6 |
+
PixArtAlpha,PixArtAlpha,1020.6412075829058,1006.9966036187151,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
|
7 |
+
SDXL,SDXL,964.7626495363717,969.5241392802999,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
|
8 |
+
SDXLTurbo,SDXLTurbo,912.2113859675355,914.3805456579931,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
|
9 |
+
OpenJourney,OpenJourney,841.2224045541894,832.2282703082603,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
|
10 |
+
LCM,LCM,794.8697868094328,810.2118373597045,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
|
|
arena_elo/update_elo_rating.sh
CHANGED
@@ -22,10 +22,10 @@ mv clean_battle_image_editing_$edition_battle_cutoff_date.json ./results/$editio
|
|
22 |
mv clean_battle_t2i_generation_$generation_battle_cutoff_date.json ./results/$generation_battle_cutoff_date/clean_battle_t2i_generation.json
|
23 |
|
24 |
|
25 |
-
python3 -m elo_rating.elo_analysis --clean-battle-file
|
26 |
mv ./elo_results_$edition_battle_cutoff_date.pkl ./results/$edition_battle_cutoff_date/elo_results_image_editing.pkl
|
27 |
|
28 |
-
python3 -m elo_rating.elo_analysis --clean-battle-file
|
29 |
mv ./elo_results_$generation_battle_cutoff_date.pkl ./results/$generation_battle_cutoff_date/elo_results_t2i_generation.pkl
|
30 |
|
31 |
# generate the leaderboard
|
|
|
22 |
mv clean_battle_t2i_generation_$generation_battle_cutoff_date.json ./results/$generation_battle_cutoff_date/clean_battle_t2i_generation.json
|
23 |
|
24 |
|
25 |
+
python3 -m elo_rating.elo_analysis --clean-battle-file ./results/$edition_battle_cutoff_date/clean_battle_image_editing.json
|
26 |
mv ./elo_results_$edition_battle_cutoff_date.pkl ./results/$edition_battle_cutoff_date/elo_results_image_editing.pkl
|
27 |
|
28 |
+
python3 -m elo_rating.elo_analysis --clean-battle-file ./results/$generation_battle_cutoff_date/clean_battle_t2i_generation.json
|
29 |
mv ./elo_results_$generation_battle_cutoff_date.pkl ./results/$generation_battle_cutoff_date/elo_results_t2i_generation.pkl
|
30 |
|
31 |
# generate the leaderboard
|