BenchmarkBot committed
Commit 483e3a1 • 1 Parent(s): e89d633

added example config

Files changed (2)
  1. app.py +2 -0
  2. src/assets/text_content.py +46 -1
app.py CHANGED
@@ -9,6 +9,7 @@ from src.assets.text_content import (
     TITLE,
     INTRODUCTION_TEXT,
     ABOUT_TEXT,
+    EXAMPLE_CONFIG_TEXT,
     CITATION_BUTTON_LABEL,
     CITATION_BUTTON_TEXT,
 )
@@ -335,6 +336,7 @@ with demo:
 
     with gr.TabItem("About 📖", id=3):
         gr.HTML(ABOUT_TEXT, elem_classes="descriptive-text")
+        gr.Markdown(EXAMPLE_CONFIG_TEXT, elem_classes="descriptive-text")
 
     demo.load(
         change_tab,
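The pattern this hunk applies is worth seeing in isolation: the About tab renders static HTML first, then a Markdown component right under it, which is what lets the fenced YAML inside EXAMPLE_CONFIG_TEXT come out as a highlighted code block. Below is a minimal, self-contained sketch of that pattern, assuming Gradio 3.x; the placeholder strings and the launch call are stand-ins for illustration, not the leaderboard's actual content or wiring.

```python
import gradio as gr

# Stand-in strings; the real app imports these from src/assets/text_content.py.
ABOUT_TEXT = "<h3>About the leaderboard</h3>"
EXAMPLE_CONFIG_TEXT = "Example config:\n```yaml\ndevice: cuda\n```"

with gr.Blocks() as demo:
    with gr.Tabs():
        with gr.TabItem("About 📖", id=3):
            # HTML for the prose, Markdown for the config so the fenced
            # YAML block is rendered with code formatting.
            gr.HTML(ABOUT_TEXT, elem_classes="descriptive-text")
            gr.Markdown(EXAMPLE_CONFIG_TEXT, elem_classes="descriptive-text")

if __name__ == "__main__":
    demo.launch()
```

Using gr.Markdown rather than a second gr.HTML is what makes the triple-backtick YAML render as a code block instead of raw text.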
src/assets/text_content.py CHANGED
@@ -15,10 +15,55 @@ ABOUT_TEXT = """<h3>About the 🤗 Open LLM-Perf Leaderboard 🏋️</h3>
 <li>Peak memory is measured in MB during the first forward pass of the LLM (no warmup).</li>
 <li>Each pair of (Model Type, Weight Class) is represented by the best scored model. This LLM is the one used for all the hardware/backend/optimization experiments.</li>
 <li>Score is the average evaluation score obtained from the <a href="https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard">🤗 Open LLM Leaderboard</a>.</li>
-<li>Ranking is based on the euclidean distance from the "Perfect LLM" (i.e. 0 latency and 100% accuracy).</li>
+<li>Ranking is based on a composite metric which is the euclidean distance from the "Perfect LLM" (i.e. 0 latency and 100% accuracy).</li>
 </ul>
 """
 
+EXAMPLE_CONFIG_TEXT = """
+Here's an example of the configuration file used to benchmark the models with Optimum-Benchmark:
+```yaml
+defaults:
+  - backend: pytorch # default backend
+  - benchmark: inference # default benchmark
+  - experiment # inheriting from experiment config
+  - _self_ # for hydra 1.1 compatibility
+  - override hydra/job_logging: colorlog # colorful logging
+  - override hydra/hydra_logging: colorlog # colorful logging
+
+hydra:
+  run:
+    dir: llm-experiments/{experiment_name}
+  job:
+    chdir: true
+
+experiment_name: {experiment_name}
+
+model: {model}
+hub_kwargs:
+  revision: {revision}
+  trust_remote_code: {trust_remote_code}
+
+device: cuda
+
+backend:
+  no_weights: true
+  delete_cache: true
+  torch_dtype: float16
+  load_in_4bit: true
+  bettertransformer: true
+
+benchmark:
+  memory: true
+
+  input_shapes:
+    batch_size: 1
+    sequence_length: 1
+
+  new_tokens: 1000
+```
+"""
+
+
 CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results."
 CITATION_BUTTON_TEXT = r"""@misc{open-llm-perf-leaderboard,
     author = {Ilyas Moutawwakil, Régis Pierrard},
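The reworded ranking bullet pins down a concrete computation: each model is scored by its Euclidean distance from a hypothetical "Perfect LLM" at zero latency and 100% accuracy, and smaller distances rank higher. Here is a minimal sketch of that composite metric; the rescaling of latency onto a 0-100 axis and the sample numbers are assumptions for illustration, since the commit does not show how the leaderboard actually normalizes latency against accuracy.

```python
import math

# Hypothetical (latency_ms, score_pct) pairs; illustrative numbers only.
models = {
    "model-a": (120.0, 62.5),
    "model-b": (45.0, 55.0),
    "model-c": (80.0, 60.0),
}

# Assumption: rescale latency so both axes share a 0-100 range; the actual
# leaderboard normalization is not part of this commit.
max_latency = max(latency for latency, _ in models.values())

def distance_to_perfect(latency: float, score: float) -> float:
    """Euclidean distance from the "Perfect LLM" (0 latency, 100% accuracy)."""
    latency_pct = 100.0 * latency / max_latency
    return math.sqrt(latency_pct ** 2 + (100.0 - score) ** 2)

# Smaller distance means closer to the Perfect LLM, i.e. a better rank.
ranking = sorted(models, key=lambda name: distance_to_perfect(*models[name]))
print(ranking)
```

With these toy numbers model-b ranks first: its middling score is more than offset by having the lowest latency of the three.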