BenchmarkBot committed on
Commit
35afb9b
1 Parent(s): 18b69eb
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -20,7 +20,7 @@ COLUMNS_MAPPING = {
20
  "num_parameters": "#Parameters 📏",
21
  "forward.peak_memory(MB)": "Peak Memory (MB) ⬇️",
22
  "generate.throughput(tokens/s)": "Throughput (tokens/s) ⬆️",
23
- "h4_score": "Average Open LLM Score ⬆️",
24
  }
25
  COLUMNS_DATATYPES = ["markdown", "str", "str",
26
  "number", "number", "number", "markdown"]
@@ -67,7 +67,7 @@ def get_benchmark_plot(bench_df):
67
  bench_df = bench_df[bench_df["generate.latency(s)"] < 100]
68
 
69
  fig = px.scatter(
70
- bench_df, x="generate.latency(s)", y="h4_score",
71
  color='model_type', symbol='backend.name', size='forward.peak_memory(MB)',
72
  custom_data=['model', 'backend.name', 'backend.torch_dtype',
73
  'forward.peak_memory(MB)', 'generate.throughput(tokens/s)'],
@@ -120,7 +120,7 @@ def filter_query(text, backends, datatypes, threshold, benchmark="1xA100-80GB"):
120
  raw_df["model"].str.lower().str.contains(text.lower()) &
121
  raw_df["backend.name"].isin(backends) &
122
  raw_df["backend.torch_dtype"].isin(datatypes) &
123
- (raw_df["h4_score"] >= threshold)
124
  ]
125
 
126
  filtered_table = get_benchmark_table(filtered_df)
 
20
  "num_parameters": "#Parameters 📏",
21
  "forward.peak_memory(MB)": "Peak Memory (MB) ⬇️",
22
  "generate.throughput(tokens/s)": "Throughput (tokens/s) ⬆️",
23
+ "average": "Average Open LLM Score ⬆️",
24
  }
25
  COLUMNS_DATATYPES = ["markdown", "str", "str",
26
  "number", "number", "number", "markdown"]
 
67
  bench_df = bench_df[bench_df["generate.latency(s)"] < 100]
68
 
69
  fig = px.scatter(
70
+ bench_df, x="generate.latency(s)", y="average",
71
  color='model_type', symbol='backend.name', size='forward.peak_memory(MB)',
72
  custom_data=['model', 'backend.name', 'backend.torch_dtype',
73
  'forward.peak_memory(MB)', 'generate.throughput(tokens/s)'],
 
120
  raw_df["model"].str.lower().str.contains(text.lower()) &
121
  raw_df["backend.name"].isin(backends) &
122
  raw_df["backend.torch_dtype"].isin(datatypes) &
123
+ (raw_df["average"] >= threshold)
124
  ]
125
 
126
  filtered_table = get_benchmark_table(filtered_df)