import os
import time
from huggingface_hub import create_repo, whoami
import gradio as gr
from config_store import (
    get_inference_config,
    get_onnxruntime_config,
    get_openvino_config,
    get_pytorch_config,
    get_process_config,
)
from optimum_benchmark.backends.openvino.utils import TASKS_TO_OVMODEL
from optimum_benchmark.backends.transformers_utils import TASKS_TO_MODEL_LOADERS
from optimum_benchmark.backends.onnxruntime.utils import TASKS_TO_ORTMODELS
from optimum_benchmark.backends.ipex.utils import TASKS_TO_IPEXMODEL
from optimum_benchmark import (
    BenchmarkConfig,
    PyTorchConfig,
    OVConfig,
    ORTConfig,
    IPEXConfig,
    ProcessConfig,
    InferenceConfig,
    Benchmark,
)
from optimum_benchmark.logging_utils import setup_logging

os.environ["LOG_TO_FILE"] = "0"
os.environ["LOG_LEVEL"] = "INFO"
setup_logging(level="INFO", prefix="MAIN-PROCESS")

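# All backend configs below target the CPU.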
DEVICE = "cpu"
BACKENDS = ["pytorch", "onnxruntime", "openvino", "ipex"]

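# Hand-picked models, plus the tasks supported by every backend (intersection of their task maps).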
CHOSEN_MODELS = ["bert-base-uncased", "gpt2"]
CHOSEN_TASKS = sorted(
    set(TASKS_TO_OVMODEL.keys())
    & set(TASKS_TO_ORTMODELS.keys())
    & set(TASKS_TO_IPEXMODEL.keys())
    & set(TASKS_TO_MODEL_LOADERS.keys())
)


def run_benchmark(kwargs, oauth_token: gr.OAuthToken):
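    """Run optimum-benchmark for each backend on the selected model/task and
    push every run to the user's `benchmarks` dataset repo on the Hub."""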
    # The token (or the whole OAuth object) is missing when the user is not logged in.
    if oauth_token is None or oauth_token.token is None:
        return "You must be logged in to use this space"

    username = whoami(oauth_token.token)["name"]
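    # Ensure the user's `benchmarks` dataset repo exists before pushing results.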
    create_repo(
        f"{username}/benchmarks",
        token=oauth_token.token,
        repo_type="dataset",
        exist_ok=True,
    )

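    # Per-section keyword arguments collected from the UI components.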
    configs = {
        "process": {},
        "inference": {},
        "onnxruntime": {},
        "openvino": {},
        "pytorch": {},
        "ipex": {},
    }

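    # Gradio passes a dict mapping each input component to its value;
    # route values by component label ("model", "task", or "<backend>.<argument>").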
    for key, value in kwargs.items():
        if key.label == "model":
            model = value
        elif key.label == "task":
            task = value
        elif "." in key.label:
            backend, argument = key.label.split(".")
            configs[backend][argument] = value
        else:
            continue

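    # Launcher (process) and scenario (inference) configs are shared by all backends.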
    process_config = ProcessConfig(**configs.pop("process"))
    inference_config = InferenceConfig(**configs.pop("inference"))

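    # One backend config per runtime, all pointing at the same model, task and device.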
    configs["onnxruntime"] = ORTConfig(
        task=task,
        model=model,
        device=DEVICE,
        **configs["onnxruntime"],
    )
    configs["openvino"] = OVConfig(
        task=task,
        model=model,
        device=DEVICE,
        **configs["openvino"],
    )
    configs["pytorch"] = PyTorchConfig(
        task=task,
        model=model,
        device=DEVICE,
        **configs["pytorch"],
    )
    configs["ipex"] = IPEXConfig(
        task=task,
        model=model,
        device=DEVICE,
        **configs["ipex"],
    )

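    # Benchmark each backend and push its config + report to the Hub under a timestamped subfolder.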
    for backend in configs:
        benchmark_name = (
            f"{model}-{task}-{backend}-{time.strftime('%Y-%m-%d-%H-%M-%S')}"
        )
        benchmark_config = BenchmarkConfig(
            name=benchmark_name,
            launcher=process_config,
            scenario=inference_config,
            backend=configs[backend],
        )
        benchmark_report = Benchmark.run(benchmark_config)
        benchmark = Benchmark(config=benchmark_config, report=benchmark_report)
        benchmark.push_to_hub(
            repo_id=f"{username}/benchmarks",
            subfolder=benchmark_name,
            token=oauth_token.token,
        )

    return f"πŸš€ Benchmark {benchmark_name} has been pushed to {username}/benchmarks"


with gr.Blocks() as demo:
    # add login button
    gr.LoginButton(min_width=250)

    # add image
    gr.Markdown(
        """<img src="https://huggingface.co/spaces/optimum/optimum-benchmark-ui/resolve/main/huggy_bench.png" style="display: block; margin-left: auto; margin-right: auto; width: 30%;">"""
    )

    # title text
    gr.Markdown("<h1 style='text-align: center'>πŸ€— Optimum-Benchmark Interface πŸ‹οΈ</h1>")

    # explanation text
    gr.HTML(
        "<h3 style='text-align: center'>"
        "Zero code Gradio interface of "
        "<a href='https://github.com/huggingface/optimum-benchmark.git'>"
        "Optimum-Benchmark"
        "</a>"
        "<br>"
        "</h3>"
    )

    model = gr.Dropdown(
        label="model",
        choices=CHOSEN_MODELS,
        value="bert-base-uncased",
        info="Model to run the benchmark on.",
    )
    task = gr.Dropdown(
        label="task",
        choices=CHOSEN_TASKS,
        value="feature-extraction",
        info="Task to run the benchmark on.",
    )

    with gr.Row():
        with gr.Accordion(label="Process Config", open=False, visible=True):
            process_config = get_process_config()

    with gr.Row():
        with gr.Accordion(label="PyTorch Config", open=True, visible=True):
            pytorch_config = get_pytorch_config()
        with gr.Accordion(label="OpenVINO Config", open=True, visible=True):
            openvino_config = get_openvino_config()
        with gr.Accordion(label="OnnxRuntime Config", open=True, visible=True):
            onnxruntime_config = get_onnxruntime_config()

    with gr.Row():
        with gr.Accordion(label="Scenario Config", open=False, visible=True):
            inference_config = get_inference_config()

    button = gr.Button(value="Run Benchmark", variant="primary")

    html_output = gr.HTML()

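    # Passing the inputs as a set makes Gradio hand run_benchmark a single dict
    # mapping each component to its current value (see the kwargs loop above).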
    button.click(
        fn=run_benchmark,
        inputs={
            task,
            model,
            *process_config.values(),
            *inference_config.values(),
            *onnxruntime_config.values(),
            *openvino_config.values(),
            *pytorch_config.values(),
        },
        outputs=[html_output],
        concurrency_limit=1,
    )


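# Queue up to 10 pending requests; the click handler's concurrency_limit=1 runs one benchmark at a time.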
demo.queue(max_size=10).launch()