@@ -101,15 +101,17 @@ def run_pipeline(
101
101
args .output_len_std ,
102
102
)
103
103
request_records = pipeline (request_records )
104
- assert len (request_records ) == args .num_requests
105
- sorted_requests : List [RequestRecord ] = [None ] * args .num_requests
104
+ assert len (request_records ) == args .num_requests * args . num_gpus
105
+ sorted_requests : List [RequestRecord ] = [None ] * args .num_requests * args . num_gpus
106
106
for request_record in request_records :
107
107
assert request_record .request_id is not None
108
108
assert sorted_requests [request_record .request_id ] is None
109
109
sorted_requests [request_record .request_id ] = request_record
110
110
111
111
request_records = MetricAnalyzer (tokenizer )(request_records )
112
- report = generate_metrics_summary (request_records , args .num_requests , args .num_gpus )
112
+ report = generate_metrics_summary (
113
+ request_records , args .num_requests * args .num_gpus , args .num_gpus
114
+ )
113
115
return report , sorted_requests
114
116
115
117
@@ -135,7 +137,7 @@ def _main():
135
137
tokenizer = AutoTokenizer .from_pretrained (args .tokenizer )
136
138
dataset = create_dataset (args , tokenizer )
137
139
f_create_api_endpoint = functools .partial (create_api_endpoint , args )
138
- pipelines = create_pipelines (args , f_create_api_endpoint )
140
+ pipelines = create_pipelines (args , f_create_api_endpoint , dataset )
139
141
reports = []
140
142
alltime_records = {}
141
143
for i , pipeline in enumerate (pipelines ):
@@ -291,6 +293,7 @@ def _main():
291
293
parser .add_argument (
292
294
"--timeout" ,
293
295
type = float ,
296
+ default = 3 * 60 * 60 ,
294
297
help = "The timeout limit of each request." ,
295
298
)
296
299
parser .add_argument (
@@ -380,4 +383,8 @@ def _main():
380
383
"The --num-concurrent-requests should be provided when enabling this option." ,
381
384
)
382
385
386
+ parser .add_argument (
387
+ "--testset-name" , type = str , help = "The name of the testset. Only used for Loogle dataset"
388
+ )
389
+
383
390
main (parser .parse_args ())
0 commit comments