Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
shigeki Ishida
committed on
Commit
·
f4d3c9c
1
Parent(s):
1071b04
Add vLLM version filter
Browse files
- app.py +18 -0
- src/display/utils.py +1 -0
- src/leaderboard/read_evals.py +7 -0
app.py
CHANGED
@@ -34,6 +34,7 @@ from src.display.utils import (
|
|
34 |
NumFewShots,
|
35 |
Precision,
|
36 |
Version,
|
|
|
37 |
fields,
|
38 |
)
|
39 |
from src.envs import API, EVAL_REQUESTS_PATH, EVAL_RESULTS_PATH, QUEUE_REPO, REPO_ID, RESULTS_REPO
|
@@ -108,6 +109,7 @@ def filter_models(
|
|
108 |
add_special_tokens_query: list,
|
109 |
num_few_shots_query: list,
|
110 |
version_query: list,
|
|
|
111 |
# backend_query: list,
|
112 |
) -> pd.DataFrame:
|
113 |
print(f"Initial df shape: {df.shape}")
|
@@ -146,6 +148,10 @@ def filter_models(
|
|
146 |
filtered_df = filtered_df[filtered_df["llm-jp-eval version"].isin(version_query)]
|
147 |
print(f"After version filter: {filtered_df.shape}")
|
148 |
|
|
|
|
|
|
|
|
|
149 |
# Backend フィルタリング
|
150 |
# filtered_df = filtered_df[filtered_df["Backend Library"].isin(backend_query)]
|
151 |
# print(f"After backend filter: {filtered_df.shape}")
|
@@ -199,6 +205,7 @@ def update_table(
|
|
199 |
add_special_tokens_query: list,
|
200 |
num_few_shots_query: list,
|
201 |
version_query: list,
|
|
|
202 |
# backend_query: list,
|
203 |
query: str,
|
204 |
*columns,
|
@@ -216,6 +223,7 @@ def update_table(
|
|
216 |
add_special_tokens_query,
|
217 |
num_few_shots_query,
|
218 |
version_query,
|
|
|
219 |
# backend_query,
|
220 |
)
|
221 |
print(f"filtered_df shape after filter_models: {filtered_df.shape}")
|
@@ -248,6 +256,7 @@ leaderboard_df = filter_models(
|
|
248 |
[i.value.name for i in AddSpecialTokens],
|
249 |
[i.value.name for i in NumFewShots],
|
250 |
[i.value.name for i in Version],
|
|
|
251 |
# [i.value.name for i in Backend],
|
252 |
)
|
253 |
# DataFrameの初期化部分のみを修正
|
@@ -492,6 +501,13 @@ with gr.Blocks() as demo_leaderboard:
|
|
492 |
value=[i.value.name for i in Version],
|
493 |
elem_id="filter-columns-version",
|
494 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
495 |
# filter_columns_backend = gr.CheckboxGroup(
|
496 |
# label="Backend Library",
|
497 |
# choices=[i.value.name for i in Backend],
|
@@ -539,6 +555,7 @@ with gr.Blocks() as demo_leaderboard:
|
|
539 |
filter_columns_add_special_tokens.change,
|
540 |
filter_columns_num_few_shots.change,
|
541 |
filter_columns_version.change,
|
|
|
542 |
# filter_columns_backend.change,
|
543 |
search_bar.submit,
|
544 |
]
|
@@ -551,6 +568,7 @@ with gr.Blocks() as demo_leaderboard:
|
|
551 |
filter_columns_add_special_tokens,
|
552 |
filter_columns_num_few_shots,
|
553 |
filter_columns_version,
|
|
|
554 |
# filter_columns_backend,
|
555 |
search_bar,
|
556 |
]
|
|
|
34 |
NumFewShots,
|
35 |
Precision,
|
36 |
Version,
|
37 |
+
VllmVersion,
|
38 |
fields,
|
39 |
)
|
40 |
from src.envs import API, EVAL_REQUESTS_PATH, EVAL_RESULTS_PATH, QUEUE_REPO, REPO_ID, RESULTS_REPO
|
|
|
109 |
add_special_tokens_query: list,
|
110 |
num_few_shots_query: list,
|
111 |
version_query: list,
|
112 |
+
vllm_query: list,
|
113 |
# backend_query: list,
|
114 |
) -> pd.DataFrame:
|
115 |
print(f"Initial df shape: {df.shape}")
|
|
|
148 |
filtered_df = filtered_df[filtered_df["llm-jp-eval version"].isin(version_query)]
|
149 |
print(f"After version filter: {filtered_df.shape}")
|
150 |
|
151 |
+
# Vllm Version フィルタリング
|
152 |
+
filtered_df = filtered_df[filtered_df["vllm version"].isin(vllm_query)]
|
153 |
+
print(f"After vllm version filter: {filtered_df.shape}")
|
154 |
+
|
155 |
# Backend フィルタリング
|
156 |
# filtered_df = filtered_df[filtered_df["Backend Library"].isin(backend_query)]
|
157 |
# print(f"After backend filter: {filtered_df.shape}")
|
|
|
205 |
add_special_tokens_query: list,
|
206 |
num_few_shots_query: list,
|
207 |
version_query: list,
|
208 |
+
vllm_query: list,
|
209 |
# backend_query: list,
|
210 |
query: str,
|
211 |
*columns,
|
|
|
223 |
add_special_tokens_query,
|
224 |
num_few_shots_query,
|
225 |
version_query,
|
226 |
+
vllm_query,
|
227 |
# backend_query,
|
228 |
)
|
229 |
print(f"filtered_df shape after filter_models: {filtered_df.shape}")
|
|
|
256 |
[i.value.name for i in AddSpecialTokens],
|
257 |
[i.value.name for i in NumFewShots],
|
258 |
[i.value.name for i in Version],
|
259 |
+
[i.value.name for i in VllmVersion],
|
260 |
# [i.value.name for i in Backend],
|
261 |
)
|
262 |
# DataFrameの初期化部分のみを修正
|
|
|
501 |
value=[i.value.name for i in Version],
|
502 |
elem_id="filter-columns-version",
|
503 |
)
|
504 |
+
filter_columns_vllm = gr.CheckboxGroup(
|
505 |
+
label="vllm version",
|
506 |
+
choices=[i.value.name for i in VllmVersion],
|
507 |
+
value=[i.value.name for i in VllmVersion],
|
508 |
+
elem_id="filter-columns-vllm",
|
509 |
+
)
|
510 |
+
|
511 |
# filter_columns_backend = gr.CheckboxGroup(
|
512 |
# label="Backend Library",
|
513 |
# choices=[i.value.name for i in Backend],
|
|
|
555 |
filter_columns_add_special_tokens.change,
|
556 |
filter_columns_num_few_shots.change,
|
557 |
filter_columns_version.change,
|
558 |
+
filter_columns_vllm.change,
|
559 |
# filter_columns_backend.change,
|
560 |
search_bar.submit,
|
561 |
]
|
|
|
568 |
filter_columns_add_special_tokens,
|
569 |
filter_columns_num_few_shots,
|
570 |
filter_columns_version,
|
571 |
+
filter_columns_vllm,
|
572 |
# filter_columns_backend,
|
573 |
search_bar,
|
574 |
]
|
src/display/utils.py
CHANGED
@@ -60,6 +60,7 @@ auto_eval_column_dict.append(["add_special_tokens", ColumnContent, ColumnContent
|
|
60 |
auto_eval_column_dict.append(
|
61 |
["llm_jp_eval_version", ColumnContent, ColumnContent("llm-jp-eval version", "str", False)]
|
62 |
)
|
|
|
63 |
auto_eval_column_dict.append(["backend", ColumnContent, ColumnContent("Backend Library", "str", False, dummy=True)])
|
64 |
auto_eval_column_dict.append(["dummy", ColumnContent, ColumnContent("model_name_for_query", "str", False, dummy=True)])
|
65 |
auto_eval_column_dict.append(["row_id", ColumnContent, ColumnContent("ID", "number", False, dummy=True)])
|
|
|
60 |
auto_eval_column_dict.append(
|
61 |
["llm_jp_eval_version", ColumnContent, ColumnContent("llm-jp-eval version", "str", False)]
|
62 |
)
|
63 |
+
auto_eval_column_dict.append(["vllm_version", ColumnContent, ColumnContent("vllm version", "str", False)])
|
64 |
auto_eval_column_dict.append(["backend", ColumnContent, ColumnContent("Backend Library", "str", False, dummy=True)])
|
65 |
auto_eval_column_dict.append(["dummy", ColumnContent, ColumnContent("model_name_for_query", "str", False, dummy=True)])
|
66 |
auto_eval_column_dict.append(["row_id", ColumnContent, ColumnContent("ID", "number", False, dummy=True)])
|
src/leaderboard/read_evals.py
CHANGED
@@ -34,6 +34,7 @@ class EvalResult:
|
|
34 |
num_few_shots: str = "0"
|
35 |
add_special_tokens: str = ""
|
36 |
llm_jp_eval_version: str = ""
|
|
|
37 |
backend: str = ""
|
38 |
|
39 |
@classmethod
|
@@ -67,6 +68,10 @@ class EvalResult:
|
|
67 |
)
|
68 |
|
69 |
version = Version.from_str(metainfo.get("version", "?")).value.name
|
|
|
|
|
|
|
|
|
70 |
backend = Backend.from_str(model_config.get("_target_", "?").split(".")[0]).value.name
|
71 |
revision = model_config.get("revision", "")
|
72 |
|
@@ -114,6 +119,7 @@ class EvalResult:
|
|
114 |
num_few_shots=num_few_shots,
|
115 |
add_special_tokens=add_special_tokens,
|
116 |
llm_jp_eval_version=version,
|
|
|
117 |
backend=backend,
|
118 |
)
|
119 |
|
@@ -153,6 +159,7 @@ class EvalResult:
|
|
153 |
AutoEvalColumn.num_few_shots.name: self.num_few_shots,
|
154 |
AutoEvalColumn.add_special_tokens.name: self.add_special_tokens,
|
155 |
AutoEvalColumn.llm_jp_eval_version.name: self.llm_jp_eval_version,
|
|
|
156 |
AutoEvalColumn.backend.name: self.backend,
|
157 |
}
|
158 |
|
|
|
34 |
num_few_shots: str = "0"
|
35 |
add_special_tokens: str = ""
|
36 |
llm_jp_eval_version: str = ""
|
37 |
+
vllm_version: str = ""
|
38 |
backend: str = ""
|
39 |
|
40 |
@classmethod
|
|
|
68 |
)
|
69 |
|
70 |
version = Version.from_str(metainfo.get("version", "?")).value.name
|
71 |
+
|
72 |
+
# Get vllm version from metainfo
|
73 |
+
vllm_version = metainfo.get("vllm-version", "")
|
74 |
+
|
75 |
backend = Backend.from_str(model_config.get("_target_", "?").split(".")[0]).value.name
|
76 |
revision = model_config.get("revision", "")
|
77 |
|
|
|
119 |
num_few_shots=num_few_shots,
|
120 |
add_special_tokens=add_special_tokens,
|
121 |
llm_jp_eval_version=version,
|
122 |
+
vllm_version=vllm_version,
|
123 |
backend=backend,
|
124 |
)
|
125 |
|
|
|
159 |
AutoEvalColumn.num_few_shots.name: self.num_few_shots,
|
160 |
AutoEvalColumn.add_special_tokens.name: self.add_special_tokens,
|
161 |
AutoEvalColumn.llm_jp_eval_version.name: self.llm_jp_eval_version,
|
162 |
+
AutoEvalColumn.vllm_version.name: self.vllm_version,
|
163 |
AutoEvalColumn.backend.name: self.backend,
|
164 |
}
|
165 |
|