Spaces:
Running
on
Zero
Running
on
Zero
Commit
·
7e1bd0d
1
Parent(s):
a56205d
update
Browse files
- app.py +2 -13
- arena_elo/elo_rating/elo_analysis.py +1 -1
- arena_elo/generation_model_info.json +20 -0
- arena_elo/results/20240818/elo_results_t2i_generation.pkl +2 -2
- arena_elo/results/20240818/t2i_generation_leaderboard.csv +17 -14
- arena_elo/results/latest/elo_results_t2i_generation.pkl +2 -2
- arena_elo/results/latest/t2i_generation_leaderboard.csv +17 -14
- model/model_manager.py +13 -2
- serve/leaderboard.py +21 -3
app.py
CHANGED
|
@@ -7,14 +7,6 @@ from serve.leaderboard import build_leaderboard_tab
|
|
| 7 |
from model.model_manager import ModelManager
|
| 8 |
from pathlib import Path
|
| 9 |
from serve.constants import SERVER_PORT, ROOT_PATH, ELO_RESULTS_DIR
|
| 10 |
-
from model.pre_download import pre_download_all_models, pre_download_video_models
|
| 11 |
-
|
| 12 |
-
def debug_packages():
|
| 13 |
-
import pkg_resources
|
| 14 |
-
|
| 15 |
-
installed_packages = pkg_resources.working_set
|
| 16 |
-
for package in installed_packages:
|
| 17 |
-
print(f"{package.key}=={package.version}")
|
| 18 |
|
| 19 |
def build_combine_demo(models, elo_results_file, leaderboard_table_file):
|
| 20 |
|
|
@@ -104,11 +96,8 @@ if __name__ == "__main__":
|
|
| 104 |
server_port = int(SERVER_PORT)
|
| 105 |
root_path = ROOT_PATH
|
| 106 |
elo_results_dir = ELO_RESULTS_DIR
|
| 107 |
-
models = ModelManager()
|
| 108 |
-
|
| 109 |
-
debug_packages()
|
| 110 |
-
|
| 111 |
-
pre_download_all_models()
|
| 112 |
|
| 113 |
elo_results_file, leaderboard_table_file = load_elo_results(elo_results_dir)
|
| 114 |
demo = build_combine_demo(models, elo_results_file, leaderboard_table_file)
|
|
|
|
| 7 |
from model.model_manager import ModelManager
|
| 8 |
from pathlib import Path
|
| 9 |
from serve.constants import SERVER_PORT, ROOT_PATH, ELO_RESULTS_DIR
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10 |
|
| 11 |
def build_combine_demo(models, elo_results_file, leaderboard_table_file):
|
| 12 |
|
|
|
|
| 96 |
server_port = int(SERVER_PORT)
|
| 97 |
root_path = ROOT_PATH
|
| 98 |
elo_results_dir = ELO_RESULTS_DIR
|
| 99 |
+
models = ModelManager(enable_nsfw=True, pre_download=True, debug_packages=True)
|
| 100 |
+
# models = ModelManager(enable_nsfw=False, pre_download=False, debug_packages=False)
|
|
|
|
|
|
|
|
|
|
| 101 |
|
| 102 |
elo_results_file, leaderboard_table_file = load_elo_results(elo_results_dir)
|
| 103 |
demo = build_combine_demo(models, elo_results_file, leaderboard_table_file)
|
arena_elo/elo_rating/elo_analysis.py
CHANGED
|
@@ -381,7 +381,7 @@ if __name__ == "__main__":
|
|
| 381 |
"--rating-system", type=str, choices=["bt", "elo"], default="bt"
|
| 382 |
)
|
| 383 |
parser.add_argument("--exclude-tie", action="store_true", default=False)
|
| 384 |
-
parser.add_argument("--min_num_battles_per_model", type=int, default=
|
| 385 |
args = parser.parse_args()
|
| 386 |
|
| 387 |
np.random.seed(42)
|
|
|
|
| 381 |
"--rating-system", type=str, choices=["bt", "elo"], default="bt"
|
| 382 |
)
|
| 383 |
parser.add_argument("--exclude-tie", action="store_true", default=False)
|
| 384 |
+
parser.add_argument("--min_num_battles_per_model", type=int, default=25)
|
| 385 |
args = parser.parse_args()
|
| 386 |
|
| 387 |
np.random.seed(42)
|
arena_elo/generation_model_info.json
CHANGED
|
@@ -63,5 +63,25 @@
|
|
| 63 |
"Link": "https://fal.ai/models/fal-ai/pixart-sigma",
|
| 64 |
"License": "openrail++",
|
| 65 |
"Organization": "PixArt-alpha"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 66 |
}
|
| 67 |
}
|
|
|
|
| 63 |
"Link": "https://fal.ai/models/fal-ai/pixart-sigma",
|
| 64 |
"License": "openrail++",
|
| 65 |
"Organization": "PixArt-alpha"
|
| 66 |
+
},
|
| 67 |
+
"FLUX1schnell": {
|
| 68 |
+
"Link": "https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux",
|
| 69 |
+
"License": "flux-1-dev-non-commercial-license (other)",
|
| 70 |
+
"Organization": "Black Forest Labs"
|
| 71 |
+
},
|
| 72 |
+
"FLUX1dev": {
|
| 73 |
+
"Link": "https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux",
|
| 74 |
+
"License": "flux-1-dev-non-commercial-license (other)",
|
| 75 |
+
"Organization": "Black Forest Labs"
|
| 76 |
+
},
|
| 77 |
+
"AuraFlow": {
|
| 78 |
+
"Link": "https://huggingface.co/fal/AuraFlow",
|
| 79 |
+
"License": "Apache-2.0",
|
| 80 |
+
"Organization": "Fal.AI"
|
| 81 |
+
},
|
| 82 |
+
"Kolors": {
|
| 83 |
+
"Link": "https://huggingface.co/Kwai-Kolors/Kolors",
|
| 84 |
+
"License": "Apache-2.0",
|
| 85 |
+
"Organization": "Kwai Kolors"
|
| 86 |
}
|
| 87 |
}
|
arena_elo/results/20240818/elo_results_t2i_generation.pkl
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4935474b3d38916a2a46738fa4a4e57a34c59abe3c61111a9e79a46187a24b38
|
| 3 |
+
size 86085
|
arena_elo/results/20240818/t2i_generation_leaderboard.csv
CHANGED
|
@@ -1,15 +1,18 @@
|
|
| 1 |
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
| 2 |
-
|
| 3 |
-
|
| 4 |
-
PlayGround V2,PlayGround V2,
|
| 5 |
-
|
| 6 |
-
|
| 7 |
-
|
| 8 |
-
|
| 9 |
-
|
| 10 |
-
|
| 11 |
-
|
| 12 |
-
|
| 13 |
-
|
| 14 |
-
|
| 15 |
-
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
| 2 |
+
FLUX1dev,FLUX1dev,1139.2171997788664,1154.9401991259183,flux-1-dev-non-commercial-license (other),Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
|
| 3 |
+
PlayGround V2.5,PlayGround V2.5,1132.1836548838864,1132.5651835501171,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
|
| 4 |
+
PlayGround V2,PlayGround V2,1075.3571099849078,1072.7594472644441,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
|
| 5 |
+
FLUX1schnell,FLUX1schnell,1066.505710109784,1064.6512761628912,flux-1-dev-non-commercial-license (other),Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
|
| 6 |
+
HunyuanDiT,HunyuanDiT,1051.1795507568463,1036.2184409268364,tencent-hunyuan-community,Tencent,https://huggingface.co/Tencent-Hunyuan/HunyuanDiT
|
| 7 |
+
StableCascade,StableCascade,1038.864872104377,1041.0470474695244,stable-cascade-nc-community (other),Stability AI,https://huggingface.co/stabilityai/stable-cascade
|
| 8 |
+
AuraFlow,AuraFlow,1034.6965881363633,1028.364203196634,Apache-2.0,Fal.AI,https://huggingface.co/fal/AuraFlow
|
| 9 |
+
PixArtAlpha,PixArtAlpha,1025.6380572404505,1014.320702980116,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
|
| 10 |
+
SDXLLightning,SDXLLightning,1025.1762643276309,1028.287019099912,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
|
| 11 |
+
PixArtSigma,PixArtSigma,1020.4950012337554,1019.0949741744585,openrail++,PixArt-alpha,https://fal.ai/models/fal-ai/pixart-sigma
|
| 12 |
+
SD3,SD3,993.6426659727981,987.8044800091614,stabilityai-nc-research-community,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-3-medium
|
| 13 |
+
Kolors,Kolors,984.8923136492953,980.8110707842453,Apache-2.0,Kwai Kolors,https://huggingface.co/Kwai-Kolors/Kolors
|
| 14 |
+
SDXL,SDXL,966.8046145579953,966.0264408253988,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
|
| 15 |
+
SDXLTurbo,SDXLTurbo,915.0182076955812,911.0171286468213,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
|
| 16 |
+
LCM(v1.5/XL),LCM(v1.5/XL),907.8353926442691,900.2703944909691,openrail++,Latent Consistency,https://fal.ai/models/fal-ai/fast-lcm-diffusion/api
|
| 17 |
+
OpenJourney,OpenJourney,830.3596812818465,823.5680806695481,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
|
| 18 |
+
LCM,LCM,792.1331156413471,804.405883013325,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
|
arena_elo/results/latest/elo_results_t2i_generation.pkl
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4935474b3d38916a2a46738fa4a4e57a34c59abe3c61111a9e79a46187a24b38
|
| 3 |
+
size 86085
|
arena_elo/results/latest/t2i_generation_leaderboard.csv
CHANGED
|
@@ -1,15 +1,18 @@
|
|
| 1 |
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
| 2 |
-
|
| 3 |
-
|
| 4 |
-
PlayGround V2,PlayGround V2,
|
| 5 |
-
|
| 6 |
-
|
| 7 |
-
|
| 8 |
-
|
| 9 |
-
|
| 10 |
-
|
| 11 |
-
|
| 12 |
-
|
| 13 |
-
|
| 14 |
-
|
| 15 |
-
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
key,Model,Arena Elo rating (anony),Arena Elo rating (full),License,Organization,Link
|
| 2 |
+
FLUX1dev,FLUX1dev,1139.2171997788664,1154.9401991259183,flux-1-dev-non-commercial-license (other),Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
|
| 3 |
+
PlayGround V2.5,PlayGround V2.5,1132.1836548838864,1132.5651835501171,Playground v2.5 Community License,Playground,https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic
|
| 4 |
+
PlayGround V2,PlayGround V2,1075.3571099849078,1072.7594472644441,Playground v2 Community License,Playground,https://huggingface.co/playgroundai/playground-v2-1024px-aesthetic
|
| 5 |
+
FLUX1schnell,FLUX1schnell,1066.505710109784,1064.6512761628912,flux-1-dev-non-commercial-license (other),Black Forest Labs,https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux
|
| 6 |
+
HunyuanDiT,HunyuanDiT,1051.1795507568463,1036.2184409268364,tencent-hunyuan-community,Tencent,https://huggingface.co/Tencent-Hunyuan/HunyuanDiT
|
| 7 |
+
StableCascade,StableCascade,1038.864872104377,1041.0470474695244,stable-cascade-nc-community (other),Stability AI,https://huggingface.co/stabilityai/stable-cascade
|
| 8 |
+
AuraFlow,AuraFlow,1034.6965881363633,1028.364203196634,Apache-2.0,Fal.AI,https://huggingface.co/fal/AuraFlow
|
| 9 |
+
PixArtAlpha,PixArtAlpha,1025.6380572404505,1014.320702980116,openrail++,PixArt-alpha,https://huggingface.co/PixArt-alpha/PixArt-XL-2-1024-MS
|
| 10 |
+
SDXLLightning,SDXLLightning,1025.1762643276309,1028.287019099912,openrail++,ByteDance,https://huggingface.co/ByteDance/SDXL-Lightning
|
| 11 |
+
PixArtSigma,PixArtSigma,1020.4950012337554,1019.0949741744585,openrail++,PixArt-alpha,https://fal.ai/models/fal-ai/pixart-sigma
|
| 12 |
+
SD3,SD3,993.6426659727981,987.8044800091614,stabilityai-nc-research-community,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-3-medium
|
| 13 |
+
Kolors,Kolors,984.8923136492953,980.8110707842453,Apache-2.0,Kwai Kolors,https://huggingface.co/Kwai-Kolors/Kolors
|
| 14 |
+
SDXL,SDXL,966.8046145579953,966.0264408253988,openrail++,Stability AI,https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0
|
| 15 |
+
SDXLTurbo,SDXLTurbo,915.0182076955812,911.0171286468213,sai-nc-community (other),Stability AI,https://huggingface.co/stabilityai/sdxl-turbo
|
| 16 |
+
LCM(v1.5/XL),LCM(v1.5/XL),907.8353926442691,900.2703944909691,openrail++,Latent Consistency,https://fal.ai/models/fal-ai/fast-lcm-diffusion/api
|
| 17 |
+
OpenJourney,OpenJourney,830.3596812818465,823.5680806695481,creativeml-openrail-m,PromptHero,https://huggingface.co/prompthero/openjourney
|
| 18 |
+
LCM,LCM,792.1331156413471,804.405883013325,MIT License,Tsinghua University,https://huggingface.co/SimianLuo/LCM_Dreamshaper_v7
|
model/model_manager.py
CHANGED
|
@@ -7,12 +7,19 @@ import spaces
|
|
| 7 |
from PIL import Image
|
| 8 |
from .models import IMAGE_GENERATION_MODELS, IMAGE_EDITION_MODELS, VIDEO_GENERATION_MODELS, MUSEUM_UNSUPPORTED_MODELS, DESIRED_APPEAR_MODEL, load_pipeline
|
| 9 |
from .fetch_museum_results import draw_from_imagen_museum, draw2_from_imagen_museum, draw_from_videogen_museum, draw2_from_videogen_museum
|
| 10 |
-
|
| 11 |
from transformers import AutoTokenizer, AutoModelForCausalLM
|
| 12 |
import torch
|
| 13 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 14 |
class ModelManager:
|
| 15 |
-
def __init__(self, enable_nsfw=
|
| 16 |
self.model_ig_list = IMAGE_GENERATION_MODELS
|
| 17 |
self.model_ie_list = IMAGE_EDITION_MODELS
|
| 18 |
self.model_vg_list = VIDEO_GENERATION_MODELS
|
|
@@ -21,6 +28,10 @@ class ModelManager:
|
|
| 21 |
self.enable_nsfw = enable_nsfw
|
| 22 |
self.load_guard(enable_nsfw)
|
| 23 |
self.loaded_models = {}
|
|
|
|
|
|
|
|
|
|
|
|
|
| 24 |
|
| 25 |
def load_model_pipe(self, model_name):
|
| 26 |
if not model_name in self.loaded_models:
|
|
|
|
| 7 |
from PIL import Image
|
| 8 |
from .models import IMAGE_GENERATION_MODELS, IMAGE_EDITION_MODELS, VIDEO_GENERATION_MODELS, MUSEUM_UNSUPPORTED_MODELS, DESIRED_APPEAR_MODEL, load_pipeline
|
| 9 |
from .fetch_museum_results import draw_from_imagen_museum, draw2_from_imagen_museum, draw_from_videogen_museum, draw2_from_videogen_museum
|
| 10 |
+
from .pre_download import pre_download_all_models, pre_download_video_models
|
| 11 |
from transformers import AutoTokenizer, AutoModelForCausalLM
|
| 12 |
import torch
|
| 13 |
|
| 14 |
+
def debug_packages():
|
| 15 |
+
import pkg_resources
|
| 16 |
+
|
| 17 |
+
installed_packages = pkg_resources.working_set
|
| 18 |
+
for package in installed_packages:
|
| 19 |
+
print(f"{package.key}=={package.version}")
|
| 20 |
+
|
| 21 |
class ModelManager:
|
| 22 |
+
def __init__(self, enable_nsfw=False, pre_download=False, debug_packages=False):
|
| 23 |
self.model_ig_list = IMAGE_GENERATION_MODELS
|
| 24 |
self.model_ie_list = IMAGE_EDITION_MODELS
|
| 25 |
self.model_vg_list = VIDEO_GENERATION_MODELS
|
|
|
|
| 28 |
self.enable_nsfw = enable_nsfw
|
| 29 |
self.load_guard(enable_nsfw)
|
| 30 |
self.loaded_models = {}
|
| 31 |
+
if pre_download:
|
| 32 |
+
pre_download_all_models()
|
| 33 |
+
if debug_packages:
|
| 34 |
+
debug_packages()
|
| 35 |
|
| 36 |
def load_model_pipe(self, model_name):
|
| 37 |
if not model_name in self.loaded_models:
|
serve/leaderboard.py
CHANGED
|
@@ -107,13 +107,24 @@ def get_full_table(anony_arena_df, full_arena_df, model_table_df):
|
|
| 107 |
if model_key in anony_arena_df.index:
|
| 108 |
idx = anony_arena_df.index.get_loc(model_key)
|
| 109 |
row.append(round(anony_arena_df.iloc[idx]["rating"]))
|
|
|
|
|
|
|
|
|
|
| 110 |
else:
|
| 111 |
row.append(np.nan)
|
|
|
|
|
|
|
| 112 |
if model_key in full_arena_df.index:
|
| 113 |
idx = full_arena_df.index.get_loc(model_key)
|
| 114 |
row.append(round(full_arena_df.iloc[idx]["rating"]))
|
|
|
|
|
|
|
|
|
|
|
|
|
| 115 |
else:
|
| 116 |
row.append(np.nan)
|
|
|
|
|
|
|
| 117 |
# row.append(model_table_df.iloc[i]["MT-bench (score)"])
|
| 118 |
# row.append(model_table_df.iloc[i]["Num Battles"])
|
| 119 |
# row.append(model_table_df.iloc[i]["MMLU"])
|
|
@@ -124,6 +135,9 @@ def get_full_table(anony_arena_df, full_arena_df, model_table_df):
|
|
| 124 |
|
| 125 |
values.append(row)
|
| 126 |
values.sort(key=lambda x: -x[1] if not np.isnan(x[1]) else 1e9)
|
|
|
|
|
|
|
|
|
|
| 127 |
return values
|
| 128 |
|
| 129 |
|
|
@@ -244,7 +258,7 @@ def build_leaderboard_tab(elo_results_file, leaderboard_table_file, show_plot=Tr
|
|
| 244 |
value=arena_table_vals,
|
| 245 |
elem_id="arena_leaderboard_dataframe",
|
| 246 |
height=700,
|
| 247 |
-
column_widths=[
|
| 248 |
wrap=True,
|
| 249 |
)
|
| 250 |
with gr.Tab("Full Leaderboard", id=1):
|
|
@@ -253,16 +267,20 @@ def build_leaderboard_tab(elo_results_file, leaderboard_table_file, show_plot=Tr
|
|
| 253 |
full_table_vals = get_full_table(anony_arena_df, full_arena_df, model_table_df)
|
| 254 |
gr.Dataframe(
|
| 255 |
headers=[
|
|
|
|
| 256 |
"🤖 Model",
|
| 257 |
"⭐ Arena Elo (anony)",
|
|
|
|
| 258 |
"⭐ Arena Elo (full)",
|
|
|
|
|
|
|
| 259 |
"Organization",
|
| 260 |
"License",
|
| 261 |
],
|
| 262 |
-
datatype=["markdown", "number", "number", "str", "str"],
|
| 263 |
value=full_table_vals,
|
| 264 |
elem_id="full_leaderboard_dataframe",
|
| 265 |
-
column_widths=[
|
| 266 |
height=700,
|
| 267 |
wrap=True,
|
| 268 |
)
|
|
|
|
| 107 |
if model_key in anony_arena_df.index:
|
| 108 |
idx = anony_arena_df.index.get_loc(model_key)
|
| 109 |
row.append(round(anony_arena_df.iloc[idx]["rating"]))
|
| 110 |
+
upper_diff = round(anony_arena_df.iloc[idx]["rating_q975"] - anony_arena_df.iloc[idx]["rating"])
|
| 111 |
+
lower_diff = round(anony_arena_df.iloc[idx]["rating"] - anony_arena_df.iloc[idx]["rating_q025"])
|
| 112 |
+
row.append(f"+{upper_diff}/-{lower_diff}")
|
| 113 |
else:
|
| 114 |
row.append(np.nan)
|
| 115 |
+
row.append("N/A")
|
| 116 |
+
|
| 117 |
if model_key in full_arena_df.index:
|
| 118 |
idx = full_arena_df.index.get_loc(model_key)
|
| 119 |
row.append(round(full_arena_df.iloc[idx]["rating"]))
|
| 120 |
+
upper_diff = round(full_arena_df.iloc[idx]["rating_q975"] - full_arena_df.iloc[idx]["rating"])
|
| 121 |
+
lower_diff = round(full_arena_df.iloc[idx]["rating"] - full_arena_df.iloc[idx]["rating_q025"])
|
| 122 |
+
row.append(f"+{upper_diff}/-{lower_diff}")
|
| 123 |
+
row.append(round(full_arena_df.iloc[idx]["num_battles"]))
|
| 124 |
else:
|
| 125 |
row.append(np.nan)
|
| 126 |
+
row.append("N/A")
|
| 127 |
+
row.append(np.nan)
|
| 128 |
# row.append(model_table_df.iloc[i]["MT-bench (score)"])
|
| 129 |
# row.append(model_table_df.iloc[i]["Num Battles"])
|
| 130 |
# row.append(model_table_df.iloc[i]["MMLU"])
|
|
|
|
| 135 |
|
| 136 |
values.append(row)
|
| 137 |
values.sort(key=lambda x: -x[1] if not np.isnan(x[1]) else 1e9)
|
| 138 |
+
# insert rank
|
| 139 |
+
for i, row in enumerate(values):
|
| 140 |
+
row.insert(0, i + 1)
|
| 141 |
return values
|
| 142 |
|
| 143 |
|
|
|
|
| 258 |
value=arena_table_vals,
|
| 259 |
elem_id="arena_leaderboard_dataframe",
|
| 260 |
height=700,
|
| 261 |
+
column_widths=[30, 50, 30, 30, 30, 70, 150],
|
| 262 |
wrap=True,
|
| 263 |
)
|
| 264 |
with gr.Tab("Full Leaderboard", id=1):
|
|
|
|
| 267 |
full_table_vals = get_full_table(anony_arena_df, full_arena_df, model_table_df)
|
| 268 |
gr.Dataframe(
|
| 269 |
headers=[
|
| 270 |
+
"Rank",
|
| 271 |
"🤖 Model",
|
| 272 |
"⭐ Arena Elo (anony)",
|
| 273 |
+
"📊 95% CI",
|
| 274 |
"⭐ Arena Elo (full)",
|
| 275 |
+
"📊 95% CI",
|
| 276 |
+
"🗳️ Votes",
|
| 277 |
"Organization",
|
| 278 |
"License",
|
| 279 |
],
|
| 280 |
+
datatype=["str", "markdown", "number", "str", "number", "str", "number", "str", "str"],
|
| 281 |
value=full_table_vals,
|
| 282 |
elem_id="full_leaderboard_dataframe",
|
| 283 |
+
column_widths=[30, 50, 30, 30, 30, 30, 30, 70, 150],
|
| 284 |
height=700,
|
| 285 |
wrap=True,
|
| 286 |
)
|