BenchmarkBot committed on
Commit
75b2595
·
1 Parent(s): 18468e8
Files changed (1) hide show
  1. app.py +7 -12
app.py CHANGED
@@ -68,14 +68,10 @@ def get_benchmark_df(benchmark="1xA100-80GB"):
68
  bench_df["optimizations"] = bench_df[
69
  ["backend.bettertransformer", "backend.load_in_8bit", "backend.load_in_4bit"]
70
  ].apply(
71
- lambda x: ", ".join(
72
- [
73
- optimization if value == True else "None"
74
- for optimization, value in zip(
75
- ["BetterTransformer", "LLM.int8", "NF4"], x.values
76
- )
77
- ]
78
- ),
79
  )
80
 
81
  return bench_df
@@ -99,7 +95,7 @@ def get_benchmark_table(bench_df):
99
 
100
  def get_benchmark_plot(bench_df):
101
  # untill falcon gets fixed / natively supported
102
- bench_df = bench_df[bench_df["generate.latency(s)"] < 200]
103
 
104
  fig = px.scatter(
105
  bench_df,
@@ -117,7 +113,6 @@ def get_benchmark_plot(bench_df):
117
  "generate.throughput(tokens/s)",
118
  ],
119
  symbol_sequence=["triangle-up", "circle"],
120
- # as many distinct colors as there are model_type,backend.name couples
121
  color_discrete_sequence=px.colors.qualitative.Light24,
122
  )
123
 
@@ -254,8 +249,8 @@ with demo:
254
  with gr.Column(scale=2):
255
  optimizations_checkboxes = gr.CheckboxGroup(
256
  label="Optimizations ๐Ÿ› ๏ธ",
257
- choices=["None", "BetterTransformer", "LLM.int8", "NF4"],
258
- value=["None", "BetterTransformer", "LLM.int8", "NF4"],
259
  info="โ˜‘๏ธ Select the optimizations",
260
  elem_id="optimizations-checkboxes",
261
  )
 
68
  bench_df["optimizations"] = bench_df[
69
  ["backend.bettertransformer", "backend.load_in_8bit", "backend.load_in_4bit"]
70
  ].apply(
71
+ lambda x: "BetterTransformer"
72
+ if x[0] == True
73
+ else ("LLM.int8" if x[1] == True else ("LLM.fp4" if x[2] == True else "None")),
74
+ axis=1,
 
 
 
 
75
  )
76
 
77
  return bench_df
 
95
 
96
  def get_benchmark_plot(bench_df):
97
  # untill falcon gets fixed / natively supported
98
+ bench_df = bench_df[bench_df["generate.latency(s)"] < 100]
99
 
100
  fig = px.scatter(
101
  bench_df,
 
113
  "generate.throughput(tokens/s)",
114
  ],
115
  symbol_sequence=["triangle-up", "circle"],
 
116
  color_discrete_sequence=px.colors.qualitative.Light24,
117
  )
118
 
 
249
  with gr.Column(scale=2):
250
  optimizations_checkboxes = gr.CheckboxGroup(
251
  label="Optimizations ๐Ÿ› ๏ธ",
252
+ choices=["None", "BetterTransformer", "LLM.int8", "LLM.fp4"],
253
+ value=["None", "BetterTransformer", "LLM.int8", "LLM.fp4"],
254
  info="โ˜‘๏ธ Select the optimizations",
255
  elem_id="optimizations-checkboxes",
256
  )