IlyasMoutawwakil (HF staff) committed
Commit 0f9db6d
1 Parent(s): 9a78645
Files changed (5)
  1. app.py +138 -85
  2. benchmark.log +41 -0
  3. config_store.py +4 -0
  4. packages.txt +0 -0
  5. pyproject.toml +0 -3
app.py CHANGED
@@ -3,12 +3,14 @@ import time
 from huggingface_hub import create_repo, whoami
 import gradio as gr
 from config_store import (
+    get_process_config,
     get_inference_config,
     get_onnxruntime_config,
     get_openvino_config,
     get_pytorch_config,
-    get_process_config,
+    get_ipex_config,
 )
+from optimum_benchmark.launchers.base import Launcher  # noqa
 from optimum_benchmark.backends.openvino.utils import TASKS_TO_OVMODEL
 from optimum_benchmark.backends.transformers_utils import TASKS_TO_MODEL_LOADERS
 from optimum_benchmark.backends.onnxruntime.utils import TASKS_TO_ORTMODELS
@@ -25,15 +27,17 @@ from optimum_benchmark import (
 )
 from optimum_benchmark.logging_utils import setup_logging
 
-os.environ["LOG_TO_FILE"] = "0"
-os.environ["LOG_LEVEL"] = "INFO"
-setup_logging(level="INFO", prefix="MAIN-PROCESS")
 
 DEVICE = "cpu"
-BACKENDS = ["pytorch", "onnxruntime", "openvino", "ipex"]
-
-CHOSEN_MODELS = ["bert-base-uncased", "gpt2"]
-CHOSEN_TASKS = (
+LAUNCHER = "process"
+SCENARIO = "inference"
+BACKENDS = ["onnxruntime", "openvino", "pytorch", "ipex"]
+MODELS = [
+    "hf-internal-testing/tiny-random-bert",
+    "google-bert/bert-base-uncased",
+    "openai-community/gpt2",
+]
+TASKS = (
     set(TASKS_TO_OVMODEL.keys())
     & set(TASKS_TO_ORTMODELS.keys())
     & set(TASKS_TO_IPEXMODEL.keys())
@@ -67,14 +71,16 @@ def run_benchmark(kwargs, oauth_token: gr.OAuthToken):
             model = value
         elif key.label == "task":
             task = value
+        elif key.label == "backends":
+            backends = value
         elif "." in key.label:
            backend, argument = key.label.split(".")
            configs[backend][argument] = value
         else:
             continue
 
-    process_config = ProcessConfig(**configs.pop("process"))
-    inference_config = InferenceConfig(**configs.pop("inference"))
+    configs["process"] = ProcessConfig(**configs.pop("process"))
+    configs["inference"] = InferenceConfig(**configs.pop("inference"))
 
     configs["onnxruntime"] = ORTConfig(
         task=task,
@@ -101,17 +107,31 @@ def run_benchmark(kwargs, oauth_token: gr.OAuthToken):
         **configs["ipex"],
     )
 
-    for backend in configs:
-        benchmark_name = (
-            f"{model}-{task}-{backend}-{time.strftime('%Y-%m-%d-%H-%M-%S')}"
-        )
+    html_output = f"<h3>Running benchmark for model {model} on task {task} with backends {backends}</h3>"
+
+    yield html_output
+
+    timestamp = time.strftime("%Y-%m-%d-%H-%M-%S")
+
+    for backend in backends:
+        benchmark_name = f"{timestamp}/{backend}"
         benchmark_config = BenchmarkConfig(
             name=benchmark_name,
-            launcher=process_config,
-            scenario=inference_config,
             backend=configs[backend],
+            launcher=configs[LAUNCHER],
+            scenario=configs[SCENARIO],
+        )
+        benchmark_config.push_to_hub(
+            repo_id=f"{username}/benchmarks",
+            subfolder=benchmark_name,
+            token=oauth_token.token,
+        )
+        benchmark_report = Benchmark.launch(benchmark_config)
+        benchmark_report.push_to_hub(
+            repo_id=f"{username}/benchmarks",
+            subfolder=benchmark_name,
+            token=oauth_token.token,
         )
-        benchmark_report = Benchmark.run(benchmark_config)
         benchmark = Benchmark(config=benchmark_config, report=benchmark_report)
         benchmark.push_to_hub(
             repo_id=f"{username}/benchmarks",
@@ -119,79 +139,112 @@ def run_benchmark(kwargs, oauth_token: gr.OAuthToken):
             token=oauth_token.token,
         )
 
-    return f"🚀 Benchmark {benchmark_name} has been pushed to {username}/benchmarks"
+        html_output += f"<br>📊 Benchmark report for {backend} backend in the folder {benchmark_name} of your benchmarks dataset"
+
+        yield html_output
 
 
-with gr.Blocks() as demo:
-    # add login button
-    gr.LoginButton(min_width=250)
+def build_demo():
+    with gr.Blocks() as demo:
+        # add login button
+        gr.LoginButton(min_width=250)
 
-    # add image
-    gr.Markdown(
-        """<img src="https://huggingface.co/spaces/optimum/optimum-benchmark-ui/resolve/main/huggy_bench.png" style="display: block; margin-left: auto; margin-right: auto; width: 30%;">"""
-    )
+        # add image
+        gr.Markdown(
+            """<img src="https://huggingface.co/spaces/optimum/optimum-benchmark-ui/resolve/main/huggy_bench.png" style="display: block; margin-left: auto; margin-right: auto; width: 30%;">"""
+        )
 
-    # title text
-    gr.Markdown("<h1 style='text-align: center'>🤗 Optimum-Benchmark Interface 🏋️</h1>")
-
-    # explanation text
-    gr.HTML(
-        "<h3 style='text-align: center'>"
-        "Zero code Gradio interface of "
-        "<a href='https://github.com/huggingface/optimum-benchmark.git'>"
-        "Optimum-Benchmark"
-        "</a>"
-        "<br>"
-        "</h3>"
-    )
+        # title text
+        gr.Markdown(
+            "<h1 style='text-align: center'>🤗 Optimum-Benchmark Interface 🏋️</h1>"
+        )
+
+        # explanation text
+        gr.HTML(
+            "<h3 style='text-align: center'>"
+            "Zero code Gradio interface of "
+            "<a href='https://github.com/huggingface/optimum-benchmark.git'>"
+            "Optimum-Benchmark"
+            "</a>"
+            "<br>"
+            "</h3>"
+        )
 
-    model = gr.Dropdown(
-        label="model",
-        choices=CHOSEN_MODELS,
-        value="bert-base-uncased",
-        info="Model to run the benchmark on.",
-    )
-    task = gr.Dropdown(
-        label="task",
-        choices=CHOSEN_TASKS,
-        value="feature-extraction",
-        info="Task to run the benchmark on.",
-    )
+        model = gr.Dropdown(
+            label="model",
+            choices=MODELS,
+            value=MODELS[0],
+            info="Model to run the benchmark on.",
+        )
+        task = gr.Dropdown(
+            label="task",
+            choices=TASKS,
+            value="feature-extraction",
+            info="Task to run the benchmark on.",
+        )
+        backends = gr.CheckboxGroup(
+            interactive=True,
+            label="backends",
+            choices=BACKENDS,
+            value=BACKENDS,
+            info="Backends to run the benchmark on.",
+        )
 
-    with gr.Row():
-        with gr.Accordion(label="Process Config", open=False, visible=True):
-            process_config = get_process_config()
-
-    with gr.Row():
-        with gr.Accordion(label="PyTorch Config", open=True, visible=True):
-            pytorch_config = get_pytorch_config()
-        with gr.Accordion(label="OpenVINO Config", open=True, visible=True):
-            openvino_config = get_openvino_config()
-        with gr.Accordion(label="OnnxRuntime Config", open=True, visible=True):
-            onnxruntime_config = get_onnxruntime_config()
-
-    with gr.Row():
-        with gr.Accordion(label="Scenario Config", open=False, visible=True):
-            inference_config = get_inference_config()
-
-    button = gr.Button(value="Run Benchmark", variant="primary")
-
-    html_output = gr.HTML()
-
-    button.click(
-        fn=run_benchmark,
-        inputs={
-            task,
-            model,
-            *process_config.values(),
-            *inference_config.values(),
-            *onnxruntime_config.values(),
-            *openvino_config.values(),
-            *pytorch_config.values(),
-        },
-        outputs=[html_output],
-        concurrency_limit=1,
-    )
+        with gr.Row():
+            with gr.Accordion(label="Process Config", open=False, visible=True):
+                process_config = get_process_config()
+
+        with gr.Row() as backend_configs:
+            with gr.Accordion(label="OnnxRuntime Config", open=False, visible=True):
+                onnxruntime_config = get_onnxruntime_config()
+            with gr.Accordion(label="OpenVINO Config", open=False, visible=True):
+                openvino_config = get_openvino_config()
+            with gr.Accordion(label="PyTorch Config", open=False, visible=True):
+                pytorch_config = get_pytorch_config()
+            with gr.Accordion(label="IPEX Config", open=False, visible=True):
+                ipex_config = get_ipex_config()
+
+        backends.change(
+            inputs=backends,
+            outputs=backend_configs.children,
+            fn=lambda values: [
+                gr.update(visible=value in values) for value in BACKENDS
+            ],
+        )
+
+        with gr.Row():
+            with gr.Accordion(label="Scenario Config", open=False, visible=True):
+                inference_config = get_inference_config()
+
+        button = gr.Button(value="Run Benchmark", variant="primary")
+
+        with gr.Row():
+            html_output = gr.HTML(label="Output", value="")
+
+        button.click(
+            fn=run_benchmark,
+            inputs={
+                task,
+                model,
+                backends,
+                *process_config.values(),
+                *inference_config.values(),
+                *onnxruntime_config.values(),
+                *openvino_config.values(),
+                *pytorch_config.values(),
+                *ipex_config.values(),
+            },
+            outputs=[html_output],
+            concurrency_limit=1,
        )
+
+    return demo
 
 
-demo.queue(max_size=10).launch()
+if __name__ == "__main__":
+    os.environ["LOG_TO_FILE"] = "0"
+    os.environ["LOG_LEVEL"] = "INFO"
+    setup_logging(level="INFO", prefix="MAIN-PROCESS")
+
+    demo = build_demo()
+    demo.queue(max_size=10).launch()
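For context, the per-backend flow that `run_benchmark` now implements (configure, launch in an isolated process, then push the config, report, and bundled benchmark to the Hub) can be reproduced outside Gradio. A minimal sketch, assuming optimum-benchmark's top-level Python API as imported in app.py; the config values are illustrative:

```python
# Minimal standalone sketch of the flow app.py runs per backend.
# Assumes optimum-benchmark's top-level API; config values are illustrative.
from optimum_benchmark import (
    Benchmark,
    BenchmarkConfig,
    InferenceConfig,
    ProcessConfig,
    PyTorchConfig,
)

launcher = ProcessConfig()  # run the benchmark in an isolated process
scenario = InferenceConfig(memory=True, latency=True)
backend = PyTorchConfig(
    device="cpu",
    model="google-bert/bert-base-uncased",
    task="feature-extraction",
)

benchmark_config = BenchmarkConfig(
    name="pytorch",
    launcher=launcher,
    scenario=scenario,
    backend=backend,
)
benchmark_report = Benchmark.launch(benchmark_config)

# Bundle config + report and push, as run_benchmark does for each backend.
benchmark = Benchmark(config=benchmark_config, report=benchmark_report)
benchmark.push_to_hub(repo_id="<username>/benchmarks", subfolder="pytorch")
```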
benchmark.log ADDED
@@ -0,0 +1,41 @@
+[ISOLATED-PROCESS][2024-09-25 18:53:27,439][pytorch][INFO] - Allocating pytorch backend
+[ISOLATED-PROCESS][2024-09-25 18:53:27,439][pytorch][INFO] - + Seeding backend with 42
+[ISOLATED-PROCESS][2024-09-25 18:53:27,440][pytorch][INFO] - + Benchmarking a Transformers model
+[ISOLATED-PROCESS][2024-09-25 18:53:28,549][inference][INFO] - Allocating inference scenario
+[ISOLATED-PROCESS][2024-09-25 18:53:28,549][inference][INFO] - + Creating input generator
+[ISOLATED-PROCESS][2024-09-25 18:53:28,550][inference][INFO] - + Generating Inference inputs
+[ISOLATED-PROCESS][2024-09-25 18:53:28,550][inference][INFO] - + Initializing Inference report
+[ISOLATED-PROCESS][2024-09-25 18:53:28,551][inference][INFO] - + Preparing input shapes for Inference
+[ISOLATED-PROCESS][2024-09-25 18:53:28,551][inference][INFO] - + Running model loading tracking
+[ISOLATED-PROCESS][2024-09-25 18:53:28,551][latency][INFO] - + Tracking latency using CPU performance counter
+[ISOLATED-PROCESS][2024-09-25 18:53:28,551][inference][INFO] - + Loading model for Inference
+[ISOLATED-PROCESS][2024-09-25 18:53:28,552][pytorch][INFO] - + Creating backend temporary directory
+[ISOLATED-PROCESS][2024-09-25 18:53:28,553][pytorch][INFO] - + Loading model with pretrained weights
+[ISOLATED-PROCESS][2024-09-25 18:53:28,554][pytorch][INFO] - + Loading Transformers model
+[ISOLATED-PROCESS][2024-09-25 18:53:28,881][pytorch][INFO] - + Enabling eval mode
+[ISOLATED-PROCESS][2024-09-25 18:53:28,883][pytorch][INFO] - + Cleaning up backend temporary directory
+[ISOLATED-PROCESS][2024-09-25 18:53:28,884][inference][INFO] - + Preparing inputs for Inference
+[ISOLATED-PROCESS][2024-09-25 18:53:28,885][inference][INFO] - + Warming up backend for Inference
+[ISOLATED-PROCESS][2024-09-25 18:53:29,252][inference][INFO] - + Running Inference latency tracking
+[ISOLATED-PROCESS][2024-09-25 18:53:29,252][latency][INFO] - + Tracking latency using CPU performance counter
+[ISOLATED-PROCESS][2024-09-25 18:53:39,282][latency][INFO] - + load latency:
+[ISOLATED-PROCESS][2024-09-25 18:53:39,282][latency][INFO] - - count: 1
+[ISOLATED-PROCESS][2024-09-25 18:53:39,283][latency][INFO] - - total: 0.331631 s
+[ISOLATED-PROCESS][2024-09-25 18:53:39,283][latency][INFO] - - mean: 0.331631 s
+[ISOLATED-PROCESS][2024-09-25 18:53:39,283][latency][INFO] - - stdev: 0.000000 s (0.00%)
+[ISOLATED-PROCESS][2024-09-25 18:53:39,284][latency][INFO] - - p50: 0.331631 s
+[ISOLATED-PROCESS][2024-09-25 18:53:39,284][latency][INFO] - - p90: 0.331631 s
+[ISOLATED-PROCESS][2024-09-25 18:53:39,284][latency][INFO] - - p95: 0.331631 s
+[ISOLATED-PROCESS][2024-09-25 18:53:39,284][latency][INFO] - - p99: 0.331631 s
+[ISOLATED-PROCESS][2024-09-25 18:53:39,285][latency][INFO] - + forward latency:
+[ISOLATED-PROCESS][2024-09-25 18:53:39,285][latency][INFO] - - count: 266
+[ISOLATED-PROCESS][2024-09-25 18:53:39,285][latency][INFO] - - total: 10.021863 s
+[ISOLATED-PROCESS][2024-09-25 18:53:39,285][latency][INFO] - - mean: 0.037676 s
+[ISOLATED-PROCESS][2024-09-25 18:53:39,286][latency][INFO] - - stdev: 0.008922 s (23.68%)
+[ISOLATED-PROCESS][2024-09-25 18:53:39,286][latency][INFO] - - p50: 0.035970 s
+[ISOLATED-PROCESS][2024-09-25 18:53:39,286][latency][INFO] - - p90: 0.043994 s
+[ISOLATED-PROCESS][2024-09-25 18:53:39,286][latency][INFO] - - p95: 0.046884 s
+[ISOLATED-PROCESS][2024-09-25 18:53:39,287][latency][INFO] - - p99: 0.073021 s
+[ISOLATED-PROCESS][2024-09-25 18:53:39,288][latency][INFO] - + forward throughput: 53.083941 samples/s
+[ISOLATED-PROCESS][2024-09-25 18:53:39,296][process][INFO] - + Sending report to main process
+[ISOLATED-PROCESS][2024-09-25 18:53:39,297][process][INFO] - + Exiting isolated process
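A quick consistency check on the statistics above: mean latency is total / count, and the reported throughput works out to batch_size × count / total, which matches if the generated inputs had a batch size of 2 (an inference from the numbers, not stated in the log):

```python
# Sanity check of the forward-latency statistics logged above.
count = 266             # forward passes
total = 10.021863       # seconds
throughput = 53.083941  # samples/s, as logged

mean = total / count                        # 0.037676 s, matches the log
implied_batch = throughput * total / count  # 2.0 samples per forward pass
print(f"mean={mean:.6f} s, implied batch size={implied_batch:.2f}")
```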
config_store.py CHANGED
@@ -88,6 +88,10 @@ def get_openvino_config():
     }
 
 
+def get_ipex_config():
+    return {}
+
+
 def get_inference_config():
     return {
         "inference.warmup_runs": gr.Slider(
packages.txt ADDED
(empty file)
pyproject.toml DELETED
@@ -1,3 +0,0 @@
-[tool.black]
-line-length = 119
-target-version = ['py37']