Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
shigeki Ishida
committed on
Commit
·
f4d3c9c
1
Parent(s):
1071b04
Add vLLM version filter
Browse files
- app.py +18 -0
- src/display/utils.py +1 -0
- src/leaderboard/read_evals.py +7 -0
app.py
CHANGED
|
@@ -34,6 +34,7 @@ from src.display.utils import (
|
|
| 34 |
NumFewShots,
|
| 35 |
Precision,
|
| 36 |
Version,
|
|
|
|
| 37 |
fields,
|
| 38 |
)
|
| 39 |
from src.envs import API, EVAL_REQUESTS_PATH, EVAL_RESULTS_PATH, QUEUE_REPO, REPO_ID, RESULTS_REPO
|
|
@@ -108,6 +109,7 @@ def filter_models(
|
|
| 108 |
add_special_tokens_query: list,
|
| 109 |
num_few_shots_query: list,
|
| 110 |
version_query: list,
|
|
|
|
| 111 |
# backend_query: list,
|
| 112 |
) -> pd.DataFrame:
|
| 113 |
print(f"Initial df shape: {df.shape}")
|
|
@@ -146,6 +148,10 @@ def filter_models(
|
|
| 146 |
filtered_df = filtered_df[filtered_df["llm-jp-eval version"].isin(version_query)]
|
| 147 |
print(f"After version filter: {filtered_df.shape}")
|
| 148 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 149 |
# Backend フィルタリング
|
| 150 |
# filtered_df = filtered_df[filtered_df["Backend Library"].isin(backend_query)]
|
| 151 |
# print(f"After backend filter: {filtered_df.shape}")
|
|
@@ -199,6 +205,7 @@ def update_table(
|
|
| 199 |
add_special_tokens_query: list,
|
| 200 |
num_few_shots_query: list,
|
| 201 |
version_query: list,
|
|
|
|
| 202 |
# backend_query: list,
|
| 203 |
query: str,
|
| 204 |
*columns,
|
|
@@ -216,6 +223,7 @@ def update_table(
|
|
| 216 |
add_special_tokens_query,
|
| 217 |
num_few_shots_query,
|
| 218 |
version_query,
|
|
|
|
| 219 |
# backend_query,
|
| 220 |
)
|
| 221 |
print(f"filtered_df shape after filter_models: {filtered_df.shape}")
|
|
@@ -248,6 +256,7 @@ leaderboard_df = filter_models(
|
|
| 248 |
[i.value.name for i in AddSpecialTokens],
|
| 249 |
[i.value.name for i in NumFewShots],
|
| 250 |
[i.value.name for i in Version],
|
|
|
|
| 251 |
# [i.value.name for i in Backend],
|
| 252 |
)
|
| 253 |
# DataFrameの初期化部分のみを修正
|
|
@@ -492,6 +501,13 @@ with gr.Blocks() as demo_leaderboard:
|
|
| 492 |
value=[i.value.name for i in Version],
|
| 493 |
elem_id="filter-columns-version",
|
| 494 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 495 |
# filter_columns_backend = gr.CheckboxGroup(
|
| 496 |
# label="Backend Library",
|
| 497 |
# choices=[i.value.name for i in Backend],
|
|
@@ -539,6 +555,7 @@ with gr.Blocks() as demo_leaderboard:
|
|
| 539 |
filter_columns_add_special_tokens.change,
|
| 540 |
filter_columns_num_few_shots.change,
|
| 541 |
filter_columns_version.change,
|
|
|
|
| 542 |
# filter_columns_backend.change,
|
| 543 |
search_bar.submit,
|
| 544 |
]
|
|
@@ -551,6 +568,7 @@ with gr.Blocks() as demo_leaderboard:
|
|
| 551 |
filter_columns_add_special_tokens,
|
| 552 |
filter_columns_num_few_shots,
|
| 553 |
filter_columns_version,
|
|
|
|
| 554 |
# filter_columns_backend,
|
| 555 |
search_bar,
|
| 556 |
]
|
|
|
|
| 34 |
NumFewShots,
|
| 35 |
Precision,
|
| 36 |
Version,
|
| 37 |
+
VllmVersion,
|
| 38 |
fields,
|
| 39 |
)
|
| 40 |
from src.envs import API, EVAL_REQUESTS_PATH, EVAL_RESULTS_PATH, QUEUE_REPO, REPO_ID, RESULTS_REPO
|
|
|
|
| 109 |
add_special_tokens_query: list,
|
| 110 |
num_few_shots_query: list,
|
| 111 |
version_query: list,
|
| 112 |
+
vllm_query: list,
|
| 113 |
# backend_query: list,
|
| 114 |
) -> pd.DataFrame:
|
| 115 |
print(f"Initial df shape: {df.shape}")
|
|
|
|
| 148 |
filtered_df = filtered_df[filtered_df["llm-jp-eval version"].isin(version_query)]
|
| 149 |
print(f"After version filter: {filtered_df.shape}")
|
| 150 |
|
| 151 |
+
# Vllm Version フィルタリング
|
| 152 |
+
filtered_df = filtered_df[filtered_df["vllm version"].isin(vllm_query)]
|
| 153 |
+
print(f"After vllm version filter: {filtered_df.shape}")
|
| 154 |
+
|
| 155 |
# Backend フィルタリング
|
| 156 |
# filtered_df = filtered_df[filtered_df["Backend Library"].isin(backend_query)]
|
| 157 |
# print(f"After backend filter: {filtered_df.shape}")
|
|
|
|
| 205 |
add_special_tokens_query: list,
|
| 206 |
num_few_shots_query: list,
|
| 207 |
version_query: list,
|
| 208 |
+
vllm_query: list,
|
| 209 |
# backend_query: list,
|
| 210 |
query: str,
|
| 211 |
*columns,
|
|
|
|
| 223 |
add_special_tokens_query,
|
| 224 |
num_few_shots_query,
|
| 225 |
version_query,
|
| 226 |
+
vllm_query,
|
| 227 |
# backend_query,
|
| 228 |
)
|
| 229 |
print(f"filtered_df shape after filter_models: {filtered_df.shape}")
|
|
|
|
| 256 |
[i.value.name for i in AddSpecialTokens],
|
| 257 |
[i.value.name for i in NumFewShots],
|
| 258 |
[i.value.name for i in Version],
|
| 259 |
+
[i.value.name for i in VllmVersion],
|
| 260 |
# [i.value.name for i in Backend],
|
| 261 |
)
|
| 262 |
# DataFrameの初期化部分のみを修正
|
|
|
|
| 501 |
value=[i.value.name for i in Version],
|
| 502 |
elem_id="filter-columns-version",
|
| 503 |
)
|
| 504 |
+
filter_columns_vllm = gr.CheckboxGroup(
|
| 505 |
+
label="vllm version",
|
| 506 |
+
choices=[i.value.name for i in VllmVersion],
|
| 507 |
+
value=[i.value.name for i in VllmVersion],
|
| 508 |
+
elem_id="filter-columns-vllm",
|
| 509 |
+
)
|
| 510 |
+
|
| 511 |
# filter_columns_backend = gr.CheckboxGroup(
|
| 512 |
# label="Backend Library",
|
| 513 |
# choices=[i.value.name for i in Backend],
|
|
|
|
| 555 |
filter_columns_add_special_tokens.change,
|
| 556 |
filter_columns_num_few_shots.change,
|
| 557 |
filter_columns_version.change,
|
| 558 |
+
filter_columns_vllm.change,
|
| 559 |
# filter_columns_backend.change,
|
| 560 |
search_bar.submit,
|
| 561 |
]
|
|
|
|
| 568 |
filter_columns_add_special_tokens,
|
| 569 |
filter_columns_num_few_shots,
|
| 570 |
filter_columns_version,
|
| 571 |
+
filter_columns_vllm,
|
| 572 |
# filter_columns_backend,
|
| 573 |
search_bar,
|
| 574 |
]
|
src/display/utils.py
CHANGED
|
@@ -60,6 +60,7 @@ auto_eval_column_dict.append(["add_special_tokens", ColumnContent, ColumnContent
|
|
| 60 |
auto_eval_column_dict.append(
|
| 61 |
["llm_jp_eval_version", ColumnContent, ColumnContent("llm-jp-eval version", "str", False)]
|
| 62 |
)
|
|
|
|
| 63 |
auto_eval_column_dict.append(["backend", ColumnContent, ColumnContent("Backend Library", "str", False, dummy=True)])
|
| 64 |
auto_eval_column_dict.append(["dummy", ColumnContent, ColumnContent("model_name_for_query", "str", False, dummy=True)])
|
| 65 |
auto_eval_column_dict.append(["row_id", ColumnContent, ColumnContent("ID", "number", False, dummy=True)])
|
|
|
|
| 60 |
auto_eval_column_dict.append(
|
| 61 |
["llm_jp_eval_version", ColumnContent, ColumnContent("llm-jp-eval version", "str", False)]
|
| 62 |
)
|
| 63 |
+
auto_eval_column_dict.append(["vllm_version", ColumnContent, ColumnContent("vllm version", "str", False)])
|
| 64 |
auto_eval_column_dict.append(["backend", ColumnContent, ColumnContent("Backend Library", "str", False, dummy=True)])
|
| 65 |
auto_eval_column_dict.append(["dummy", ColumnContent, ColumnContent("model_name_for_query", "str", False, dummy=True)])
|
| 66 |
auto_eval_column_dict.append(["row_id", ColumnContent, ColumnContent("ID", "number", False, dummy=True)])
|
src/leaderboard/read_evals.py
CHANGED
|
@@ -34,6 +34,7 @@ class EvalResult:
|
|
| 34 |
num_few_shots: str = "0"
|
| 35 |
add_special_tokens: str = ""
|
| 36 |
llm_jp_eval_version: str = ""
|
|
|
|
| 37 |
backend: str = ""
|
| 38 |
|
| 39 |
@classmethod
|
|
@@ -67,6 +68,10 @@ class EvalResult:
|
|
| 67 |
)
|
| 68 |
|
| 69 |
version = Version.from_str(metainfo.get("version", "?")).value.name
|
|
|
|
|
|
|
|
|
|
|
|
|
| 70 |
backend = Backend.from_str(model_config.get("_target_", "?").split(".")[0]).value.name
|
| 71 |
revision = model_config.get("revision", "")
|
| 72 |
|
|
@@ -114,6 +119,7 @@ class EvalResult:
|
|
| 114 |
num_few_shots=num_few_shots,
|
| 115 |
add_special_tokens=add_special_tokens,
|
| 116 |
llm_jp_eval_version=version,
|
|
|
|
| 117 |
backend=backend,
|
| 118 |
)
|
| 119 |
|
|
@@ -153,6 +159,7 @@ class EvalResult:
|
|
| 153 |
AutoEvalColumn.num_few_shots.name: self.num_few_shots,
|
| 154 |
AutoEvalColumn.add_special_tokens.name: self.add_special_tokens,
|
| 155 |
AutoEvalColumn.llm_jp_eval_version.name: self.llm_jp_eval_version,
|
|
|
|
| 156 |
AutoEvalColumn.backend.name: self.backend,
|
| 157 |
}
|
| 158 |
|
|
|
|
| 34 |
num_few_shots: str = "0"
|
| 35 |
add_special_tokens: str = ""
|
| 36 |
llm_jp_eval_version: str = ""
|
| 37 |
+
vllm_version: str = ""
|
| 38 |
backend: str = ""
|
| 39 |
|
| 40 |
@classmethod
|
|
|
|
| 68 |
)
|
| 69 |
|
| 70 |
version = Version.from_str(metainfo.get("version", "?")).value.name
|
| 71 |
+
|
| 72 |
+
# Get vllm version from metainfo
|
| 73 |
+
vllm_version = metainfo.get("vllm-version", "")
|
| 74 |
+
|
| 75 |
backend = Backend.from_str(model_config.get("_target_", "?").split(".")[0]).value.name
|
| 76 |
revision = model_config.get("revision", "")
|
| 77 |
|
|
|
|
| 119 |
num_few_shots=num_few_shots,
|
| 120 |
add_special_tokens=add_special_tokens,
|
| 121 |
llm_jp_eval_version=version,
|
| 122 |
+
vllm_version=vllm_version,
|
| 123 |
backend=backend,
|
| 124 |
)
|
| 125 |
|
|
|
|
| 159 |
AutoEvalColumn.num_few_shots.name: self.num_few_shots,
|
| 160 |
AutoEvalColumn.add_special_tokens.name: self.add_special_tokens,
|
| 161 |
AutoEvalColumn.llm_jp_eval_version.name: self.llm_jp_eval_version,
|
| 162 |
+
AutoEvalColumn.vllm_version.name: self.vllm_version,
|
| 163 |
AutoEvalColumn.backend.name: self.backend,
|
| 164 |
}
|
| 165 |
|