Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 2 additions & 2 deletions docs/run.md
Original file line number Diff line number Diff line change
Expand Up @@ -76,13 +76,13 @@ data:
min: 10 # min length of the synthetic prompts
max: 100 # max length of the synthetic prompts
mean: 50 # mean length of the synthetic prompts
std: 10 # standard deviation of the length of the synthetic prompts
std_dev: 10 # standard deviation of the length of the synthetic prompts
total_count: 100 # total number of prompts to generate to fit the above mentioned distribution constraints
output_distribution:
min: 10 # min length of the output to be generated
max: 100 # max length of the output to be generated
mean: 50 # mean length of the output to be generated
std: 10 # standard deviation of the length of the output to be generated
std_dev: 10 # standard deviation of the length of the output to be generated
total_count: 100 # total number of output lengths to generate to fit the above mentioned distribution constraints
report:
request_lifecycle:
Expand Down
4 changes: 2 additions & 2 deletions existing_stack/config_template.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -51,13 +51,13 @@ workload: # yaml configuration for harness workload(s)
min: 10 # min length of the synthetic prompts
max: 100 # max length of the synthetic prompts
mean: 50 # mean length of the synthetic prompts
std: 10 # standard deviation of the length of the synthetic prompts
std_dev: 10 # standard deviation of the length of the synthetic prompts
total_count: 100 # total number of prompts to generate to fit the above mentioned distribution constraints
output_distribution:
min: 10 # min length of the output to be generated
max: 100 # max length of the output to be generated
mean: 50 # mean length of the output to be generated
std: 10 # standard deviation of the length of the output to be generated
std_dev: 10 # standard deviation of the length of the output to be generated
total_count: 100 # total number of output lengths to generate to fit the above mentioned distribution constraints
report:
request_lifecycle:
Expand Down
4 changes: 2 additions & 2 deletions workload/profiles/inference-perf/chatbot_synthetic.yaml.in
Original file line number Diff line number Diff line change
Expand Up @@ -25,13 +25,13 @@ data:
min: 10 # min length of the synthetic prompts
max: 8192 # max length of the synthetic prompts
mean: 4096 # mean length of the synthetic prompts
std: 2048 # standard deviation of the length of the synthetic prompts
std_dev: 2048 # standard deviation of the length of the synthetic prompts
total_count: 1000 # total number of prompts to generate to fit the above mentioned distribution constraints
output_distribution:
min: 10 # min length of the output to be generated
max: 2048 # max length of the output to be generated
mean: 1024 # mean length of the output to be generated
std: 512 # standard deviation of the length of the output to be generated
std_dev: 512 # standard deviation of the length of the output to be generated
total_count: 1000 # total number of output lengths to generate to fit the above mentioned distribution constraints
report:
request_lifecycle:
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -25,13 +25,13 @@ data:
min: 10 # min length of the synthetic prompts
max: 4096 # max length of the synthetic prompts
mean: 2048 # mean length of the synthetic prompts
std: 1024 # standard deviation of the length of the synthetic prompts
std_dev: 1024 # standard deviation of the length of the synthetic prompts
total_count: 1000 # total number of prompts to generate to fit the above mentioned distribution constraints
output_distribution:
min: 10 # min length of the output to be generated
max: 256 # max length of the output to be generated
mean: 128 # mean length of the output to be generated
std: 64 # standard deviation of the length of the output to be generated
std_dev: 64 # standard deviation of the length of the output to be generated
total_count: 1000 # total number of output lengths to generate to fit the above mentioned distribution constraints
report:
request_lifecycle:
Expand Down
4 changes: 2 additions & 2 deletions workload/profiles/inference-perf/sanity_random.yaml.in
Original file line number Diff line number Diff line change
Expand Up @@ -19,13 +19,13 @@ data:
min: 10 # min length of the synthetic prompts
max: 100 # max length of the synthetic prompts
mean: 50 # mean length of the synthetic prompts
std: 10 # standard deviation of the length of the synthetic prompts
std_dev: 10 # standard deviation of the length of the synthetic prompts
total_count: 100 # total number of prompts to generate to fit the above mentioned distribution constraints
output_distribution:
min: 10 # min length of the output to be generated
max: 100 # max length of the output to be generated
mean: 50 # mean length of the output to be generated
std: 10 # standard deviation of the length of the output to be generated
std_dev: 10 # standard deviation of the length of the output to be generated
total_count: 100 # total number of output lengths to generate to fit the above mentioned distribution constraints
report:
request_lifecycle:
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -25,13 +25,13 @@ data:
min: 10 # min length of the synthetic prompts
max: 4096 # max length of the synthetic prompts
mean: 2048 # mean length of the synthetic prompts
std: 1024 # standard deviation of the length of the synthetic prompts
std_dev: 1024 # standard deviation of the length of the synthetic prompts
total_count: 1000 # total number of prompts to generate to fit the above mentioned distribution constraints
output_distribution:
min: 10 # min length of the output to be generated
max: 512 # max length of the output to be generated
mean: 256 # mean length of the output to be generated
std: 128 # standard deviation of the length of the output to be generated
std_dev: 128 # standard deviation of the length of the output to be generated
total_count: 1000 # total number of output lengths to generate to fit the above mentioned distribution constraints
report:
request_lifecycle:
Expand Down