Spaces:
Running
Running
BenchmarkBot
committed on
Commit
•
6640b32
1
Parent(s):
a62bffd
add benchmark description
Browse files
app.py
CHANGED
@@ -16,11 +16,11 @@ OLD_COLUMNS = ["model", "backend.name", "backend.torch_dtype", "backend.quantiza
|
|
16 |
"generate.latency(s)", "generate.throughput(tokens/s)"]
|
17 |
|
18 |
NEW_COLUMNS = ["Model", "Backend 🏭", "Load Datatype", "Quantization 🗜️",
|
19 |
-
"
|
20 |
|
21 |
COLUMNS_DATATYPES = ["markdown", "str", "str", "str", "number", "number"]
|
22 |
|
23 |
-
SORTING_COLUMN = ["
|
24 |
|
25 |
|
26 |
llm_perf_dataset_repo = load_dataset_repo(LLM_PERF_DATASET_REPO, OPTIMUM_TOKEN)
|
@@ -58,9 +58,12 @@ with demo:
|
|
58 |
gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
|
59 |
|
60 |
with gr.Tabs(elem_classes="tab-buttons") as tabs:
|
61 |
-
with gr.TabItem("
|
62 |
-
|
63 |
vanilla_benchmark_df = get_vanilla_benchmark_df()
|
|
|
|
|
|
|
|
|
64 |
leaderboard_table_lite = gr.components.Dataframe(
|
65 |
value=vanilla_benchmark_df,
|
66 |
datatype=COLUMNS_DATATYPES,
|
|
|
16 |
"generate.latency(s)", "generate.throughput(tokens/s)"]
|
17 |
|
18 |
NEW_COLUMNS = ["Model", "Backend 🏭", "Load Datatype", "Quantization 🗜️",
|
19 |
+
"Latency (s) ⬇️", "Throughput (tokens/s) ⬆️"]
|
20 |
|
21 |
COLUMNS_DATATYPES = ["markdown", "str", "str", "str", "number", "number"]
|
22 |
|
23 |
+
SORTING_COLUMN = ["Throughput (tokens/s) ⬆️"]
|
24 |
|
25 |
|
26 |
llm_perf_dataset_repo = load_dataset_repo(LLM_PERF_DATASET_REPO, OPTIMUM_TOKEN)
|
|
|
58 |
gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
|
59 |
|
60 |
with gr.Tabs(elem_classes="tab-buttons") as tabs:
|
61 |
+
with gr.TabItem("A100 Benchmark", elem_id="vanilla-benchmark", id=0):
|
|
|
62 |
vanilla_benchmark_df = get_vanilla_benchmark_df()
|
63 |
+
|
64 |
+
A100_text = "Machine: 4x A100 80GB<br>Batches: 1<br>Number of tokens: 100<br>"
|
65 |
+
gr.HTML(A100_text)
|
66 |
+
|
67 |
leaderboard_table_lite = gr.components.Dataframe(
|
68 |
value=vanilla_benchmark_df,
|
69 |
datatype=COLUMNS_DATATYPES,
|