shigeki Ishida committed on
Commit
f4d3c9c
·
1 Parent(s): 1071b04

add vllm version filter

Browse files
Files changed (3) hide show
  1. app.py +18 -0
  2. src/display/utils.py +1 -0
  3. src/leaderboard/read_evals.py +7 -0
app.py CHANGED
@@ -34,6 +34,7 @@ from src.display.utils import (
34
  NumFewShots,
35
  Precision,
36
  Version,
 
37
  fields,
38
  )
39
  from src.envs import API, EVAL_REQUESTS_PATH, EVAL_RESULTS_PATH, QUEUE_REPO, REPO_ID, RESULTS_REPO
@@ -108,6 +109,7 @@ def filter_models(
108
  add_special_tokens_query: list,
109
  num_few_shots_query: list,
110
  version_query: list,
 
111
  # backend_query: list,
112
  ) -> pd.DataFrame:
113
  print(f"Initial df shape: {df.shape}")
@@ -146,6 +148,10 @@ def filter_models(
146
  filtered_df = filtered_df[filtered_df["llm-jp-eval version"].isin(version_query)]
147
  print(f"After version filter: {filtered_df.shape}")
148
 
 
 
 
 
149
  # Backend フィルタリング
150
  # filtered_df = filtered_df[filtered_df["Backend Library"].isin(backend_query)]
151
  # print(f"After backend filter: {filtered_df.shape}")
@@ -199,6 +205,7 @@ def update_table(
199
  add_special_tokens_query: list,
200
  num_few_shots_query: list,
201
  version_query: list,
 
202
  # backend_query: list,
203
  query: str,
204
  *columns,
@@ -216,6 +223,7 @@ def update_table(
216
  add_special_tokens_query,
217
  num_few_shots_query,
218
  version_query,
 
219
  # backend_query,
220
  )
221
  print(f"filtered_df shape after filter_models: {filtered_df.shape}")
@@ -248,6 +256,7 @@ leaderboard_df = filter_models(
248
  [i.value.name for i in AddSpecialTokens],
249
  [i.value.name for i in NumFewShots],
250
  [i.value.name for i in Version],
 
251
  # [i.value.name for i in Backend],
252
  )
253
  # DataFrameの初期化部分のみを修正
@@ -492,6 +501,13 @@ with gr.Blocks() as demo_leaderboard:
492
  value=[i.value.name for i in Version],
493
  elem_id="filter-columns-version",
494
  )
 
 
 
 
 
 
 
495
  # filter_columns_backend = gr.CheckboxGroup(
496
  # label="Backend Library",
497
  # choices=[i.value.name for i in Backend],
@@ -539,6 +555,7 @@ with gr.Blocks() as demo_leaderboard:
539
  filter_columns_add_special_tokens.change,
540
  filter_columns_num_few_shots.change,
541
  filter_columns_version.change,
 
542
  # filter_columns_backend.change,
543
  search_bar.submit,
544
  ]
@@ -551,6 +568,7 @@ with gr.Blocks() as demo_leaderboard:
551
  filter_columns_add_special_tokens,
552
  filter_columns_num_few_shots,
553
  filter_columns_version,
 
554
  # filter_columns_backend,
555
  search_bar,
556
  ]
 
34
  NumFewShots,
35
  Precision,
36
  Version,
37
+ VllmVersion,
38
  fields,
39
  )
40
  from src.envs import API, EVAL_REQUESTS_PATH, EVAL_RESULTS_PATH, QUEUE_REPO, REPO_ID, RESULTS_REPO
 
109
  add_special_tokens_query: list,
110
  num_few_shots_query: list,
111
  version_query: list,
112
+ vllm_query: list,
113
  # backend_query: list,
114
  ) -> pd.DataFrame:
115
  print(f"Initial df shape: {df.shape}")
 
148
  filtered_df = filtered_df[filtered_df["llm-jp-eval version"].isin(version_query)]
149
  print(f"After version filter: {filtered_df.shape}")
150
 
151
+ # Vllm Version フィルタリング
152
+ filtered_df = filtered_df[filtered_df["vllm version"].isin(vllm_query)]
153
+ print(f"After vllm version filter: {filtered_df.shape}")
154
+
155
  # Backend フィルタリング
156
  # filtered_df = filtered_df[filtered_df["Backend Library"].isin(backend_query)]
157
  # print(f"After backend filter: {filtered_df.shape}")
 
205
  add_special_tokens_query: list,
206
  num_few_shots_query: list,
207
  version_query: list,
208
+ vllm_query: list,
209
  # backend_query: list,
210
  query: str,
211
  *columns,
 
223
  add_special_tokens_query,
224
  num_few_shots_query,
225
  version_query,
226
+ vllm_query,
227
  # backend_query,
228
  )
229
  print(f"filtered_df shape after filter_models: {filtered_df.shape}")
 
256
  [i.value.name for i in AddSpecialTokens],
257
  [i.value.name for i in NumFewShots],
258
  [i.value.name for i in Version],
259
+ [i.value.name for i in VllmVersion],
260
  # [i.value.name for i in Backend],
261
  )
262
  # DataFrameの初期化部分のみを修正
 
501
  value=[i.value.name for i in Version],
502
  elem_id="filter-columns-version",
503
  )
504
+ filter_columns_vllm = gr.CheckboxGroup(
505
+ label="vllm version",
506
+ choices=[i.value.name for i in VllmVersion],
507
+ value=[i.value.name for i in VllmVersion],
508
+ elem_id="filter-columns-vllm",
509
+ )
510
+
511
  # filter_columns_backend = gr.CheckboxGroup(
512
  # label="Backend Library",
513
  # choices=[i.value.name for i in Backend],
 
555
  filter_columns_add_special_tokens.change,
556
  filter_columns_num_few_shots.change,
557
  filter_columns_version.change,
558
+ filter_columns_vllm.change,
559
  # filter_columns_backend.change,
560
  search_bar.submit,
561
  ]
 
568
  filter_columns_add_special_tokens,
569
  filter_columns_num_few_shots,
570
  filter_columns_version,
571
+ filter_columns_vllm,
572
  # filter_columns_backend,
573
  search_bar,
574
  ]
src/display/utils.py CHANGED
@@ -60,6 +60,7 @@ auto_eval_column_dict.append(["add_special_tokens", ColumnContent, ColumnContent
60
  auto_eval_column_dict.append(
61
  ["llm_jp_eval_version", ColumnContent, ColumnContent("llm-jp-eval version", "str", False)]
62
  )
 
63
  auto_eval_column_dict.append(["backend", ColumnContent, ColumnContent("Backend Library", "str", False, dummy=True)])
64
  auto_eval_column_dict.append(["dummy", ColumnContent, ColumnContent("model_name_for_query", "str", False, dummy=True)])
65
  auto_eval_column_dict.append(["row_id", ColumnContent, ColumnContent("ID", "number", False, dummy=True)])
 
60
  auto_eval_column_dict.append(
61
  ["llm_jp_eval_version", ColumnContent, ColumnContent("llm-jp-eval version", "str", False)]
62
  )
63
+ auto_eval_column_dict.append(["vllm_version", ColumnContent, ColumnContent("vllm version", "str", False)])
64
  auto_eval_column_dict.append(["backend", ColumnContent, ColumnContent("Backend Library", "str", False, dummy=True)])
65
  auto_eval_column_dict.append(["dummy", ColumnContent, ColumnContent("model_name_for_query", "str", False, dummy=True)])
66
  auto_eval_column_dict.append(["row_id", ColumnContent, ColumnContent("ID", "number", False, dummy=True)])
src/leaderboard/read_evals.py CHANGED
@@ -34,6 +34,7 @@ class EvalResult:
34
  num_few_shots: str = "0"
35
  add_special_tokens: str = ""
36
  llm_jp_eval_version: str = ""
 
37
  backend: str = ""
38
 
39
  @classmethod
@@ -67,6 +68,10 @@ class EvalResult:
67
  )
68
 
69
  version = Version.from_str(metainfo.get("version", "?")).value.name
 
 
 
 
70
  backend = Backend.from_str(model_config.get("_target_", "?").split(".")[0]).value.name
71
  revision = model_config.get("revision", "")
72
 
@@ -114,6 +119,7 @@ class EvalResult:
114
  num_few_shots=num_few_shots,
115
  add_special_tokens=add_special_tokens,
116
  llm_jp_eval_version=version,
 
117
  backend=backend,
118
  )
119
 
@@ -153,6 +159,7 @@ class EvalResult:
153
  AutoEvalColumn.num_few_shots.name: self.num_few_shots,
154
  AutoEvalColumn.add_special_tokens.name: self.add_special_tokens,
155
  AutoEvalColumn.llm_jp_eval_version.name: self.llm_jp_eval_version,
 
156
  AutoEvalColumn.backend.name: self.backend,
157
  }
158
 
 
34
  num_few_shots: str = "0"
35
  add_special_tokens: str = ""
36
  llm_jp_eval_version: str = ""
37
+ vllm_version: str = ""
38
  backend: str = ""
39
 
40
  @classmethod
 
68
  )
69
 
70
  version = Version.from_str(metainfo.get("version", "?")).value.name
71
+
72
+ # Get vllm version from metainfo
73
+ vllm_version = metainfo.get("vllm-version", "")
74
+
75
  backend = Backend.from_str(model_config.get("_target_", "?").split(".")[0]).value.name
76
  revision = model_config.get("revision", "")
77
 
 
119
  num_few_shots=num_few_shots,
120
  add_special_tokens=add_special_tokens,
121
  llm_jp_eval_version=version,
122
+ vllm_version=vllm_version,
123
  backend=backend,
124
  )
125
 
 
159
  AutoEvalColumn.num_few_shots.name: self.num_few_shots,
160
  AutoEvalColumn.add_special_tokens.name: self.add_special_tokens,
161
  AutoEvalColumn.llm_jp_eval_version.name: self.llm_jp_eval_version,
162
+ AutoEvalColumn.vllm_version.name: self.vllm_version,
163
  AutoEvalColumn.backend.name: self.backend,
164
  }
165