Spaces:
Running
Running
Commit
Β·
4f5bf6c
1
Parent(s):
5345cba
update
Browse files- app.py +2 -0
- src/assets.py +3 -0
- src/map.py +2 -1
- src/panel.py +30 -3
- src/utils.py +1 -1
app.py
CHANGED
@@ -40,6 +40,7 @@ with demo:
|
|
40 |
datatype_checkboxes,
|
41 |
optimization_checkboxes,
|
42 |
quantization_checkboxes,
|
|
|
43 |
) = create_control_panel(machine=machine)
|
44 |
####################### HARDWARE SUBTABS #######################
|
45 |
with gr.Tabs(elem_classes="subtabs"):
|
@@ -73,6 +74,7 @@ with demo:
|
|
73 |
datatype_checkboxes,
|
74 |
optimization_checkboxes,
|
75 |
quantization_checkboxes,
|
|
|
76 |
# interactive
|
77 |
columns_checkboxes,
|
78 |
search_bar,
|
|
|
40 |
datatype_checkboxes,
|
41 |
optimization_checkboxes,
|
42 |
quantization_checkboxes,
|
43 |
+
kernels_checkboxes,
|
44 |
) = create_control_panel(machine=machine)
|
45 |
####################### HARDWARE SUBTABS #######################
|
46 |
with gr.Tabs(elem_classes="subtabs"):
|
|
|
74 |
datatype_checkboxes,
|
75 |
optimization_checkboxes,
|
76 |
quantization_checkboxes,
|
77 |
+
kernels_checkboxes,
|
78 |
# interactive
|
79 |
columns_checkboxes,
|
80 |
search_bar,
|
src/assets.py
CHANGED
@@ -48,6 +48,9 @@ custom_css = """
|
|
48 |
#quantization-checkboxes span {
|
49 |
font-size: 16px !important;
|
50 |
}
|
|
|
|
|
|
|
51 |
|
52 |
#leaderboard-table td:first-child,
|
53 |
#leaderboard-table th:first-child {
|
|
|
48 |
#quantization-checkboxes span {
|
49 |
font-size: 16px !important;
|
50 |
}
|
51 |
+
#kernel-checkboxes span {
|
52 |
+
font-size: 16px !important;
|
53 |
+
}
|
54 |
|
55 |
#leaderboard-table td:first-child,
|
56 |
#leaderboard-table th:first-child {
|
src/map.py
CHANGED
@@ -54,7 +54,7 @@ def get_lat_score_mem_fig(llm_perf_df):
|
|
54 |
height=600,
|
55 |
)
|
56 |
# update x range with 95 percentile of
|
57 |
-
fig.update_xaxes(range=[0, copy_df["End-to-End (s)"].quantile(0.
|
58 |
|
59 |
return fig
|
60 |
|
@@ -62,6 +62,7 @@ def get_lat_score_mem_fig(llm_perf_df):
|
|
62 |
def create_lat_score_mem_plot(llm_perf_df):
|
63 |
# descriptive text
|
64 |
gr.HTML("π Hover over the points π for additional information. ", elem_id="text")
|
|
|
65 |
# get figure
|
66 |
fig = get_lat_score_mem_fig(llm_perf_df)
|
67 |
# create plot
|
|
|
54 |
height=600,
|
55 |
)
|
56 |
# update x range with 95 percentile of
|
57 |
+
fig.update_xaxes(range=[-0.5, copy_df["End-to-End (s)"].quantile(0.90)])
|
58 |
|
59 |
return fig
|
60 |
|
|
|
62 |
def create_lat_score_mem_plot(llm_perf_df):
|
63 |
# descriptive text
|
64 |
gr.HTML("π Hover over the points π for additional information. ", elem_id="text")
|
65 |
+
gr.HTML("π We only show the top 90% LLMs based on latency β", elem_id="text")
|
66 |
# get figure
|
67 |
fig = get_lat_score_mem_fig(llm_perf_df)
|
68 |
# create plot
|
src/panel.py
CHANGED
@@ -13,14 +13,14 @@ def create_control_panel(machine: str):
|
|
13 |
machine_textbox = gr.Textbox(value=machine, visible=False)
|
14 |
with gr.Accordion("Control Panel ποΈ", open=False, elem_id="control-panel"):
|
15 |
with gr.Row():
|
16 |
-
with gr.Column(scale=
|
17 |
score_slider = gr.Slider(
|
18 |
label="Open LLM Score (%) π",
|
19 |
info="ποΈ Slide to minimum Open LLM score",
|
20 |
value=0,
|
21 |
elem_id="threshold-slider",
|
22 |
)
|
23 |
-
with gr.Column(scale=
|
24 |
memory_slider = gr.Slider(
|
25 |
label="Peak Memory (MB) π",
|
26 |
info="ποΈ Slide to maximum Peak Memory",
|
@@ -54,7 +54,8 @@ def create_control_panel(machine: str):
|
|
54 |
info="βοΈ Select the optimization",
|
55 |
elem_id="optimization-checkboxes",
|
56 |
)
|
57 |
-
|
|
|
58 |
quantization_checkboxes = gr.CheckboxGroup(
|
59 |
label="Quantizations ποΈ",
|
60 |
choices=[
|
@@ -75,6 +76,27 @@ def create_control_panel(machine: str):
|
|
75 |
elem_id="quantization-checkboxes",
|
76 |
elem_classes="boxed-option",
|
77 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
78 |
with gr.Row():
|
79 |
filter_button = gr.Button(
|
80 |
value="Filter π",
|
@@ -91,6 +113,7 @@ def create_control_panel(machine: str):
|
|
91 |
datatype_checkboxes,
|
92 |
optimization_checkboxes,
|
93 |
quantization_checkboxes,
|
|
|
94 |
)
|
95 |
|
96 |
|
@@ -103,6 +126,7 @@ def filter_rows_fn(
|
|
103 |
precisions,
|
104 |
attentions,
|
105 |
quantizations,
|
|
|
106 |
# interactive
|
107 |
columns,
|
108 |
search,
|
@@ -116,6 +140,7 @@ def filter_rows_fn(
|
|
116 |
& llm_perf_df["Precision π₯"].isin(precisions)
|
117 |
& llm_perf_df["Attention ποΈ"].isin(attentions)
|
118 |
& llm_perf_df["Quantization ποΈ"].isin(quantizations)
|
|
|
119 |
& (llm_perf_df["Open LLM Score (%)"] >= score)
|
120 |
& (llm_perf_df["Memory (MB)"] <= memory)
|
121 |
]
|
@@ -154,6 +179,7 @@ def create_control_callback(
|
|
154 |
datatype_checkboxes,
|
155 |
optimization_checkboxes,
|
156 |
quantization_checkboxes,
|
|
|
157 |
# interactive
|
158 |
columns_checkboxes,
|
159 |
search_bar,
|
@@ -179,6 +205,7 @@ def create_control_callback(
|
|
179 |
datatype_checkboxes,
|
180 |
optimization_checkboxes,
|
181 |
quantization_checkboxes,
|
|
|
182 |
# interactive
|
183 |
columns_checkboxes,
|
184 |
search_bar,
|
|
|
13 |
machine_textbox = gr.Textbox(value=machine, visible=False)
|
14 |
with gr.Accordion("Control Panel ποΈ", open=False, elem_id="control-panel"):
|
15 |
with gr.Row():
|
16 |
+
with gr.Column(scale=2, variant="panel"):
|
17 |
score_slider = gr.Slider(
|
18 |
label="Open LLM Score (%) π",
|
19 |
info="ποΈ Slide to minimum Open LLM score",
|
20 |
value=0,
|
21 |
elem_id="threshold-slider",
|
22 |
)
|
23 |
+
with gr.Column(scale=2, variant="panel"):
|
24 |
memory_slider = gr.Slider(
|
25 |
label="Peak Memory (MB) π",
|
26 |
info="ποΈ Slide to maximum Peak Memory",
|
|
|
54 |
info="βοΈ Select the optimization",
|
55 |
elem_id="optimization-checkboxes",
|
56 |
)
|
57 |
+
with gr.Row():
|
58 |
+
with gr.Column(scale=1, variant="panel"):
|
59 |
quantization_checkboxes = gr.CheckboxGroup(
|
60 |
label="Quantizations ποΈ",
|
61 |
choices=[
|
|
|
76 |
elem_id="quantization-checkboxes",
|
77 |
elem_classes="boxed-option",
|
78 |
)
|
79 |
+
with gr.Column(scale=1, variant="panel"):
|
80 |
+
kernels_checkboxes = gr.CheckboxGroup(
|
81 |
+
label="Kernels βοΈ",
|
82 |
+
choices=[
|
83 |
+
"No Kernel",
|
84 |
+
"GPTQ.ExllamaV1",
|
85 |
+
"GPTQ.ExllamaV2",
|
86 |
+
"AWQ.GEMM",
|
87 |
+
"AWQ.GEMV",
|
88 |
+
],
|
89 |
+
value=[
|
90 |
+
"No Kernel",
|
91 |
+
"GPTQ.ExllamaV1",
|
92 |
+
"GPTQ.ExllamaV2",
|
93 |
+
"AWQ.GEMM",
|
94 |
+
"AWQ.GEMV",
|
95 |
+
],
|
96 |
+
info="βοΈ Select the custom kernels",
|
97 |
+
elem_id="kernel-checkboxes",
|
98 |
+
elem_classes="boxed-option",
|
99 |
+
)
|
100 |
with gr.Row():
|
101 |
filter_button = gr.Button(
|
102 |
value="Filter π",
|
|
|
113 |
datatype_checkboxes,
|
114 |
optimization_checkboxes,
|
115 |
quantization_checkboxes,
|
116 |
+
kernels_checkboxes,
|
117 |
)
|
118 |
|
119 |
|
|
|
126 |
precisions,
|
127 |
attentions,
|
128 |
quantizations,
|
129 |
+
kernels,
|
130 |
# interactive
|
131 |
columns,
|
132 |
search,
|
|
|
140 |
& llm_perf_df["Precision π₯"].isin(precisions)
|
141 |
& llm_perf_df["Attention ποΈ"].isin(attentions)
|
142 |
& llm_perf_df["Quantization ποΈ"].isin(quantizations)
|
143 |
+
& llm_perf_df["Kernel βοΈ"].isin(kernels)
|
144 |
& (llm_perf_df["Open LLM Score (%)"] >= score)
|
145 |
& (llm_perf_df["Memory (MB)"] <= memory)
|
146 |
]
|
|
|
179 |
datatype_checkboxes,
|
180 |
optimization_checkboxes,
|
181 |
quantization_checkboxes,
|
182 |
+
kernels_checkboxes,
|
183 |
# interactive
|
184 |
columns_checkboxes,
|
185 |
search_bar,
|
|
|
205 |
datatype_checkboxes,
|
206 |
optimization_checkboxes,
|
207 |
quantization_checkboxes,
|
208 |
+
kernels_checkboxes,
|
209 |
# interactive
|
210 |
columns_checkboxes,
|
211 |
search_bar,
|
src/utils.py
CHANGED
@@ -97,7 +97,7 @@ def process_kernels(x):
|
|
97 |
):
|
98 |
return "AWQ.GEMV"
|
99 |
else:
|
100 |
-
return "
|
101 |
|
102 |
|
103 |
# def change_tab(query_param):
|
|
|
97 |
):
|
98 |
return "AWQ.GEMV"
|
99 |
else:
|
100 |
+
return "No Kernel"
|
101 |
|
102 |
|
103 |
# def change_tab(query_param):
|