We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent e3e0adb; commit ab2c023 (Copy full SHA for ab2c023)
tutorials/assets/values-16-disagg-prefill.yaml
@@ -23,7 +23,7 @@ servingEngineSpec:
23
kvRole: "kv_producer"
24
enableNixl: true
25
nixlRole: "sender"
26
- nixlPeerHost: "vllm-llama-decode-engine-service"
+ nixlPeerHost: "pd-llama-decode-engine-service"
27
nixlPeerPort: "55555"
28
nixlBufferSize: "1073741824" # 1GB
29
nixlBufferDevice: "cuda"
0 commit comments