|
1 |
| -import os |
2 | 1 | from contextlib import ExitStack
|
3 | 2 | from dataclasses import dataclass
|
4 |
| -from typing import Tuple, List |
| 3 | +from typing import List |
5 | 4 |
|
6 | 5 | import click
|
7 | 6 | import gradio as gr
|
8 | 7 | import pandas as pd
|
9 |
| -from github import Github, Auth |
10 | 8 |
|
11 | 9 | from parse_results import build_results
|
12 | 10 |
|
@@ -69,7 +67,7 @@ def update_bench(model, percentiles):
|
69 | 67 | return res + [summary_table()]
|
70 | 68 |
|
71 | 69 | def summary_table() -> pd.DataFrame:
|
72 |
| - data = df_bench.groupby(['model', 'run_id','rate']).agg( |
| 70 | + data = df_bench.groupby(['model', 'run_id', 'rate']).agg( |
73 | 71 | {'inter_token_latency_ms_p90': 'mean', 'time_to_first_token_ms_p90': 'mean',
|
74 | 72 | 'e2e_latency_ms_p90': 'mean', 'token_throughput_secs': 'mean',
|
75 | 73 | 'successful_requests': 'mean', 'error_rate': 'mean'}).reset_index()
|
@@ -196,7 +194,7 @@ def load_datasource(datasource, fn):
|
196 | 194 | demo.load(load_demo, [model, percentiles_bench],
|
197 | 195 | [item["component"] for item in line_plots_bench] + [table])
|
198 | 196 |
|
199 |
| - demo.launch(server_port=port) |
| 197 | + demo.launch(server_port=port, server_name="0.0.0.0") |
200 | 198 |
|
201 | 199 |
|
202 | 200 | @click.command()
|
|
0 commit comments