Spaces:
Running
Running
BenchmarkBot
committed on
Commit
•
18468e8
1
Parent(s):
9b1f5f8
allow slower models on the plot
Browse files
app.py
CHANGED
@@ -70,11 +70,10 @@ def get_benchmark_df(benchmark="1xA100-80GB"):
|
|
70 |
].apply(
|
71 |
lambda x: ", ".join(
|
72 |
[
|
73 |
-
optimization
|
74 |
for optimization, value in zip(
|
75 |
["BetterTransformer", "LLM.int8", "NF4"], x.values
|
76 |
)
|
77 |
-
if value
|
78 |
]
|
79 |
),
|
80 |
)
|
@@ -100,7 +99,7 @@ def get_benchmark_table(bench_df):
|
|
100 |
|
101 |
def get_benchmark_plot(bench_df):
|
102 |
# untill falcon gets fixed / natively supported
|
103 |
-
bench_df = bench_df[bench_df["generate.latency(s)"] <
|
104 |
|
105 |
fig = px.scatter(
|
106 |
bench_df,
|
|
|
70 |
].apply(
|
71 |
lambda x: ", ".join(
|
72 |
[
|
73 |
+
optimization if value == True else "None"
|
74 |
for optimization, value in zip(
|
75 |
["BetterTransformer", "LLM.int8", "NF4"], x.values
|
76 |
)
|
|
|
77 |
]
|
78 |
),
|
79 |
)
|
|
|
99 |
|
100 |
def get_benchmark_plot(bench_df):
|
101 |
# untill falcon gets fixed / natively supported
|
102 |
+
bench_df = bench_df[bench_df["generate.latency(s)"] < 200]
|
103 |
|
104 |
fig = px.scatter(
|
105 |
bench_df,
|