|
1 | | -import os |
2 | 1 | from contextlib import ExitStack |
3 | 2 | from dataclasses import dataclass |
4 | | -from typing import Tuple, List |
| 3 | +from typing import List |
5 | 4 |
|
6 | 5 | import click |
7 | 6 | import gradio as gr |
8 | 7 | import pandas as pd |
9 | | -from github import Github, Auth |
10 | 8 |
|
11 | 9 | from parse_results import build_results |
12 | 10 |
|
@@ -69,7 +67,7 @@ def update_bench(model, percentiles): |
69 | 67 | return res + [summary_table()] |
70 | 68 |
|
71 | 69 | def summary_table() -> pd.DataFrame: |
72 | | - data = df_bench.groupby(['model', 'run_id','rate']).agg( |
| 70 | + data = df_bench.groupby(['model', 'run_id', 'rate']).agg( |
73 | 71 | {'inter_token_latency_ms_p90': 'mean', 'time_to_first_token_ms_p90': 'mean', |
74 | 72 | 'e2e_latency_ms_p90': 'mean', 'token_throughput_secs': 'mean', |
75 | 73 | 'successful_requests': 'mean', 'error_rate': 'mean'}).reset_index() |
@@ -196,7 +194,7 @@ def load_datasource(datasource, fn): |
196 | 194 | demo.load(load_demo, [model, percentiles_bench], |
197 | 195 | [item["component"] for item in line_plots_bench] + [table]) |
198 | 196 |
|
199 | | - demo.launch(server_port=port) |
| 197 | + demo.launch(server_port=port, server_name="0.0.0.0") |
200 | 198 |
|
201 | 199 |
|
202 | 200 | @click.command() |
|
0 commit comments