Skip to content
6 changes: 6 additions & 0 deletions Qwen/Qwen2.5-7B-Instruct/accuracy/server-rocm.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
# common/accuracy/server.yml
# The marker above names the shared config the next three settings
# correspond to (presumably copied from it; confirm they are kept in sync).
trust-remote-code: true
tensor-parallel-size: 1
max-model-len: 16384
# override
# Setting specific to this file. The key is hyphenated so it follows the same
# naming convention as every other key here.
gpu-memory-utilization: 0.6
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
# common/accuracy/server.yml
# The marker above names the shared config the next three settings
# correspond to (presumably copied from it; confirm they are kept in sync).
trust-remote-code: true
tensor-parallel-size: 1
max-model-len: 16384
# override
# Setting specific to this file, applied in addition to the values above.
enforce-eager: true
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
# common/accuracy/server.yml
# The marker above names the shared config the next three settings
# correspond to (presumably copied from it; confirm they are kept in sync).
trust-remote-code: true
tensor-parallel-size: 1
max-model-len: 16384
# override
# Setting specific to this file, applied in addition to the values above.
enforce-eager: true
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
# common/accuracy/server.yml
# The marker above names the shared config the next three settings
# correspond to (presumably copied from it; confirm they are kept in sync).
trust-remote-code: true
tensor-parallel-size: 1
max-model-len: 16384
# override
# Setting specific to this file, applied in addition to the values above.
enforce-eager: true
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
# common/accuracy/server.yml
# The marker above names the shared config the next three settings
# correspond to (presumably copied from it; confirm they are kept in sync).
trust-remote-code: true
tensor-parallel-size: 1
max-model-len: 16384
# override
# Setting specific to this file, applied in addition to the values above.
enforce-eager: true
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
# common/accuracy/server.yml
# The marker above names the shared config the next three settings
# correspond to (presumably copied from it; confirm they are kept in sync).
trust-remote-code: true
tensor-parallel-size: 1
max-model-len: 16384
# override
# Setting specific to this file, applied in addition to the values above.
enforce-eager: true
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
# common/accuracy/server.yml
# The marker above names the shared config the next three settings
# correspond to (presumably copied from it; confirm they are kept in sync).
trust-remote-code: true
tensor-parallel-size: 1
max-model-len: 16384
# override
# Setting specific to this file, applied in addition to the values above.
enforce-eager: true
6 changes: 6 additions & 0 deletions RedHatAI/phi-4-FP8-dynamic/accuracy/server-rocm.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
# common/accuracy/server.yml
# The marker above names the shared config the next three settings
# correspond to (presumably copied from it; confirm they are kept in sync).
trust-remote-code: true
tensor-parallel-size: 1
max-model-len: 16384
# override
# Setting specific to this file, applied in addition to the values above.
enforce-eager: true
6 changes: 6 additions & 0 deletions ibm-granite/granite-3.1-8b-instruct/accuracy/server-rocm.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
# common/accuracy/server.yml
# The marker above names the shared config the next three settings
# correspond to (presumably copied from it; confirm they are kept in sync).
trust-remote-code: true
tensor-parallel-size: 1
max-model-len: 16384
# override
# Setting specific to this file, applied in addition to the values above.
enforce-eager: true
6 changes: 6 additions & 0 deletions meta-llama/Llama-3.1-8B-Instruct/accuracy/server-rocm.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
# common/accuracy/server.yml
# The marker above names the shared config the next three settings
# correspond to (presumably copied from it; confirm they are kept in sync).
trust-remote-code: true
tensor-parallel-size: 1
max-model-len: 16384
# override
# Setting specific to this file, applied in addition to the values above.
enforce-eager: true
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
# common/accuracy/server.yml
# The marker above names the shared config the next three settings
# correspond to (presumably copied from it; confirm they are kept in sync).
trust-remote-code: true
tensor-parallel-size: 1
max-model-len: 16384
# override
# Setting specific to this file. The key is hyphenated so it follows the same
# naming convention as every other key here.
gpu-memory-utilization: 0.6
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
# common/accuracy/server.yml
# The marker above names the shared config the next three settings
# correspond to (presumably copied from it; confirm they are kept in sync).
trust-remote-code: true
tensor-parallel-size: 1
max-model-len: 16384
# override
# Setting specific to this file. The key is hyphenated so it follows the same
# naming convention as every other key here.
gpu-memory-utilization: 0.6
7 changes: 7 additions & 0 deletions mistralai/Mixtral-8x7B-Instruct-v0.1/accuracy/server-rocm.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,7 @@
# https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1
# No `model` key is set in this file: review feedback asked for it to be
# removed. NOTE(review): presumably the harness derives the model from the
# directory path; confirm before merging.
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

The model config here can be removed.

# Server settings for this model; note tensor-parallel-size is 2 here.
trust-remote-code: true
tensor-parallel-size: 2
max-model-len: 16384
# override
# Setting specific to this file, applied in addition to the values above.
enforce-eager: true