Update performance config files (#5)

dbarbuzzi · web-flow · commit 1bb8483e9e3c · 2025-04-08T15:58:02.000-04:00
* Drop `model` key from server config

* Drop unused perf client fields (`target`, `model`, `output_path`)

* Add data-type to client config

* Fix data sub-arg (rename `output_tokens` to `generated_tokens`)
diff --git a/meta-llama/Llama-3.1-8B-Instruct/performance/client.yml b/meta-llama/Llama-3.1-8B-Instruct/performance/client.yml
@@ -1,8 +1,6 @@
-target: "http://localhost:8000/v1"
-model: "meta-llama/Llama-3.1-8B-Instruct"
 data:
   prompt_tokens: 64
-  output_tokens: 16
+  generated_tokens: 16
+data-type: emulated
 rate-type: throughput
 max-seconds: 400
-output_path: ""
diff --git a/meta-llama/Llama-3.1-8B-Instruct/performance/server.yml b/meta-llama/Llama-3.1-8B-Instruct/performance/server.yml
@@ -1,6 +1,5 @@
 # server configs for https://huggingface.co/meta-llama/Meta-Llama-3.1-8B-Instruct
 # config.yaml
-model: meta-llama/Llama-3.1-8B-Instruct
 uvicorn-log-level: "debug"
 trust-remote-code: true
 enable-chunked-prefill: true