BenchmarkBot commited on
Commit
a18f8de
Β·
1 Parent(s): bee5389

added single and multi gpu inference

Browse files
Files changed (1) hide show
  1. app.py +27 -15
app.py CHANGED
@@ -26,16 +26,13 @@ SORTING_COLUMN = ["Throughput (tokens/s) ⬆️"]
26
  llm_perf_dataset_repo = load_dataset_repo(LLM_PERF_DATASET_REPO, OPTIMUM_TOKEN)
27
 
28
 
29
- def get_benchmark_df():
30
  if llm_perf_dataset_repo:
31
  llm_perf_dataset_repo.git_pull()
32
 
33
  # load
34
  df = pd.read_csv(
35
- "./llm-perf-dataset/reports/cuda_1_100/inference_report.csv")
36
-
37
- # remove quantized models
38
- df = df[df["backend.quantization"].isnull()]
39
 
40
  # preprocess
41
  df["model"] = df["model"].apply(make_clickable_model)
@@ -61,19 +58,34 @@ with demo:
61
  gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
62
 
63
  with gr.Tabs(elem_classes="tab-buttons") as tabs:
64
- with gr.TabItem("πŸ“Š A100-80GB Benchmark πŸ‹οΈ", elem_id="a100-benchmark", id=0):
65
- dataframe_text = """<h4>Specifications:</h4>
66
- - Single and Multi-GPU Setup
67
- - Batch Size: 1
68
- - Generated Tokens: 100"""
69
-
70
- gr.Markdown(dataframe_text, elem_classes="markdown-text")
71
- benchmark_df = get_benchmark_df()
 
72
  leaderboard_table_lite = gr.components.Dataframe(
73
- value=benchmark_df,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
74
  datatype=COLUMNS_DATATYPES,
75
  headers=NEW_COLUMNS,
76
- elem_id="pytorch-A100-benchmark",
77
  )
78
 
79
  with gr.Row():
 
26
  llm_perf_dataset_repo = load_dataset_repo(LLM_PERF_DATASET_REPO, OPTIMUM_TOKEN)
27
 
28
 
29
+ def get_benchmark_df(benchmark):
30
  if llm_perf_dataset_repo:
31
  llm_perf_dataset_repo.git_pull()
32
 
33
  # load
34
  df = pd.read_csv(
35
+ f"./llm-perf-dataset/reports/{benchmark}/inference_report.csv")
 
 
 
36
 
37
  # preprocess
38
  df["model"] = df["model"].apply(make_clickable_model)
 
58
  gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
59
 
60
  with gr.Tabs(elem_classes="tab-buttons") as tabs:
61
+ with gr.TabItem("πŸ–₯️ A100-80GB Benchmark πŸ‹οΈ", elem_id="A100-benchmark", id=0):
62
+
63
+ SINGLE_A100_TEXT = """<h4>Specifications:</h4>
64
+ - Single-GPU (1)
65
+ - Singleton Batch (1)
66
+ - Thousand Tokens (1000)"""
67
+ gr.HTML(SINGLE_A100_TEXT)
68
+
69
+ single_A100_df = get_benchmark_df(benchmark="1xA100-80GB")
70
  leaderboard_table_lite = gr.components.Dataframe(
71
+ value=single_A100_df,
72
+ datatype=COLUMNS_DATATYPES,
73
+ headers=NEW_COLUMNS,
74
+ elem_id="1xA100-table",
75
+ )
76
+
77
+ MULTI_A100_TEXT = """<h4>Specifications:</h4>
78
+ - Multi-GPU (4)
79
+ - Singleton Batch (1)
80
+ - Thousand Tokens (1000)"""
81
+ gr.HTML(MULTI_A100_TEXT)
82
+
83
+ multi_A100_df = get_benchmark_df(benchmark="4xA100-80GB")
84
+ leaderboard_table_full = gr.components.Dataframe(
85
+ value=multi_A100_df,
86
  datatype=COLUMNS_DATATYPES,
87
  headers=NEW_COLUMNS,
88
+ elem_id="4xA100-table",
89
  )
90
 
91
  with gr.Row():