BenchmarkBot committed on
Commit
f2d0515
•
1 Parent(s): 75b2595
Files changed (1) hide show
  1. app.py +13 -4
app.py CHANGED
@@ -68,9 +68,18 @@ def get_benchmark_df(benchmark="1xA100-80GB"):
68
  bench_df["optimizations"] = bench_df[
69
  ["backend.bettertransformer", "backend.load_in_8bit", "backend.load_in_4bit"]
70
  ].apply(
71
- lambda x: "BetterTransformer"
72
- if x[0] == True
73
- else ("LLM.int8" if x[1] == True else ("LLM.fp4" if x[2] == True else "None")),
 
 
 
 
 
 
 
 
 
74
  axis=1,
75
  )
76
 
@@ -95,7 +104,7 @@ def get_benchmark_table(bench_df):
95
 
96
  def get_benchmark_plot(bench_df):
97
  # untill falcon gets fixed / natively supported
98
- bench_df = bench_df[bench_df["generate.latency(s)"] < 100]
99
 
100
  fig = px.scatter(
101
  bench_df,
 
68
  bench_df["optimizations"] = bench_df[
69
  ["backend.bettertransformer", "backend.load_in_8bit", "backend.load_in_4bit"]
70
  ].apply(
71
+ lambda x: ", ".join(
72
+ sum(
73
+ [
74
+ ["BetterTransformer"] if x[0] == True else [],
75
+ ["LLM.int8"] if x[1] == True else [],
76
+ ["LLM.fp4"] if x[2] == True else [],
77
+ ],
78
+ [],
79
+ )
80
+ )
81
+ if any(x)
82
+ else "None",
83
  axis=1,
84
  )
85
 
 
104
 
105
  def get_benchmark_plot(bench_df):
106
  # untill falcon gets fixed / natively supported
107
+ bench_df = bench_df[bench_df["generate.latency(s)"] < 150]
108
 
109
  fig = px.scatter(
110
  bench_df,