Skip to content

Commit ae76754

Browse files
committed
update docs
1 parent 22cbcaa commit ae76754

File tree

2 files changed

+11
-2
lines changed

2 files changed

+11
-2
lines changed

docs/EN/source/getting_started/quickstart.rst

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -81,4 +81,11 @@ In a new terminal, use the following command to test the model service:
8181
$ }'
8282
8383
84+
For the DeepSeek-R1 benchmark, use the following command to test the model service:
85+
86+
.. code-block:: console
87+
88+
$ cd test
89+
$ python benchmark_client.py --num_clients 100 --input_num 2000 --tokenizer_path /nvme/DeepSeek-R1/ --url http://127.0.0.1:8000/generate_stream
90+
8491

test/benchmark_client.py

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -60,6 +60,7 @@ def gen_random_data(
6060
prompts.append(input_text)
6161
input_lens.append(input_len)
6262
output_lens.append(output_len)
63+
print("Generate random data finish.")
6364
return prompts, input_lens, output_lens
6465

6566

@@ -143,8 +144,8 @@ def post_stream_triton(url: str, text_input: str, max_new_tokens: int) -> List[f
143144

144145
def main():
145146
parser = argparse.ArgumentParser()
146-
parser.add_argument("--url", type=str, default="")
147-
parser.add_argument("--num_clients", type=int, default=0)
147+
parser.add_argument("--url", type=str, default="http://127.0.0.1:8000/generate_stream")
148+
parser.add_argument("--num_clients", type=int, default=100)
148149
parser.add_argument("--tokenizer_path", type=str, default=None)
149150
parser.add_argument("--input_num", type=int, default=2000)
150151
parser.add_argument("--input_len", type=int, default=1024)
@@ -161,6 +162,7 @@ def main():
161162
print(json.dumps(content, indent=4))
162163
return
163164

165+
assert args.tokenizer_path is not None
164166
model_name.append(args.tokenizer_path)
165167
seed_all(args.seed)
166168
url = args.url

0 commit comments

Comments
 (0)