Spaces:

optimum
/

llm-perf-leaderboard

Running

App Files Community

BenchmarkBot committed on Jun 27, 2023

Commit

a18f8de

1 Parent(s): bee5389

added single and multi gpu inference

Browse files

Files changed (1) hide show

app.py +27 -15

app.py CHANGED Viewed

@@ -26,16 +26,13 @@ SORTING_COLUMN = ["Throughput (tokens/s) ⬆️"]
 llm_perf_dataset_repo = load_dataset_repo(LLM_PERF_DATASET_REPO, OPTIMUM_TOKEN)
-def get_benchmark_df():
     if llm_perf_dataset_repo:
         llm_perf_dataset_repo.git_pull()
     # load
     df = pd.read_csv(
-        "./llm-perf-dataset/reports/cuda_1_100/inference_report.csv")
-    # remove quantized models
-    df = df[df["backend.quantization"].isnull()]
     # preprocess
     df["model"] = df["model"].apply(make_clickable_model)
@@ -61,19 +58,34 @@ with demo:
     gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
     with gr.Tabs(elem_classes="tab-buttons") as tabs:
-        with gr.TabItem("📊 A100-80GB Benchmark 🏋️", elem_id="a100-benchmark", id=0):
-            dataframe_text = """<h4>Specifications:</h4>
-            - Single and Multi-GPU Setup
-            - Batch Size: 1
-            - Generated Tokens: 100"""
-            gr.Markdown(dataframe_text, elem_classes="markdown-text")
-            benchmark_df = get_benchmark_df()
             leaderboard_table_lite = gr.components.Dataframe(
-                value=benchmark_df,
                 datatype=COLUMNS_DATATYPES,
                 headers=NEW_COLUMNS,
-                elem_id="pytorch-A100-benchmark",
             )
     with gr.Row():

 llm_perf_dataset_repo = load_dataset_repo(LLM_PERF_DATASET_REPO, OPTIMUM_TOKEN)
+def get_benchmark_df(benchmark):
     if llm_perf_dataset_repo:
         llm_perf_dataset_repo.git_pull()
     # load
     df = pd.read_csv(
+        f"./llm-perf-dataset/reports/{benchmark}/inference_report.csv")
     # preprocess
     df["model"] = df["model"].apply(make_clickable_model)
     gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
     with gr.Tabs(elem_classes="tab-buttons") as tabs:
+        with gr.TabItem("🖥️ A100-80GB Benchmark 🏋️", elem_id="A100-benchmark", id=0):
+            SINGLE_A100_TEXT = """<h4>Specifications:</h4>
+            - Single-GPU (1)
+            - Singleton Batch (1)
+            - Thousand Tokens (1000)"""
+            gr.HTML(SINGLE_A100_TEXT)
+            single_A100_df = get_benchmark_df(benchmark="1xA100-80GB")
             leaderboard_table_lite = gr.components.Dataframe(
+                value=single_A100_df,
+                datatype=COLUMNS_DATATYPES,
+                headers=NEW_COLUMNS,
+                elem_id="1xA100-table",
+            )
+            MULTI_A100_TEXT = """<h4>Specifications:</h4>
+            - Multi-GPU (4)
+            - Singleton Batch (1)
+            - Thousand Tokens (1000)"""
+            gr.HTML(MULTI_A100_TEXT)
+            multi_A100_df = get_benchmark_df(benchmark="4xA100-80GB")
+            leaderboard_table_full = gr.components.Dataframe(
+                value=multi_A100_df,
                 datatype=COLUMNS_DATATYPES,
                 headers=NEW_COLUMNS,
+                elem_id="4xA100-table",
             )
     with gr.Row():