|
| 1 | +# vLLM Production Stack configuration using the official Helm chart |
| 2 | +CONFIG_KDEVOPS_FIRST_RUN=n |
| 3 | +CONFIG_LIBVIRT=y |
| 4 | +CONFIG_LIBVIRT_URI="qemu:///system" |
| 5 | +CONFIG_LIBVIRT_HOST_PASSTHROUGH=y |
| 6 | +CONFIG_LIBVIRT_MACHINE_TYPE_DEFAULT=y |
| 7 | +CONFIG_LIBVIRT_CPU_MODEL_PASSTHROUGH=y |
| 8 | +CONFIG_LIBVIRT_VCPUS=64 |
| 9 | +CONFIG_LIBVIRT_MEM_64G=y |
| 10 | +CONFIG_LIBVIRT_OS_VARIANT="generic" |
| 11 | +CONFIG_LIBVIRT_IMAGE_SIZE="100G" |
| 12 | +CONFIG_LIBVIRT_LVM_GROUP="" |
| 13 | +CONFIG_TARGET_ARCH_X86_64=y |
| 14 | +CONFIG_KDEVOPS_LOCAL_QCOW2_DEVELOPMENT=y |
| 15 | +CONFIG_KDEVOPS_SETUP_WORKFLOWS=y |
| 16 | + |
| 17 | +# Target kernel configuration |
| 18 | +CONFIG_TARGET_LINUX_UPSTREAM=y |
| 19 | +CONFIG_TARGET_LINUX_UPSTREAM_LINUS=y |
| 20 | +CONFIG_TARGET_LINUX_VERSION="linus" |
| 21 | + |
| 22 | +# Network, inventory (hosts/nodes), and SSH configuration |
| 23 | +CONFIG_GUESTFS_DEFAULT_BRIDGE=y |
| 24 | +CONFIG_GUESTFS_NETWORK="default" |
| 25 | +CONFIG_KDEVOPS_HOSTS="hosts" |
| 26 | +CONFIG_KDEVOPS_NODES="nodes" |
| 27 | +CONFIG_SSH_NO_VERIFY_KNOWNHOSTS=y |
| 28 | + |
| 29 | +# Workflow configuration |
| 30 | +CONFIG_WORKFLOWS=y |
| 31 | +CONFIG_WORKFLOWS_TESTS=y |
| 32 | +CONFIG_WORKFLOWS_LINUX_TESTS=y |
| 33 | +CONFIG_WORKFLOWS_DEDICATED_WORKFLOW=y |
| 34 | +CONFIG_KDEVOPS_WORKFLOW_DEDICATE_VLLM=y |
| 35 | + |
| 36 | +# vLLM Production Stack specific configuration |
| 37 | +CONFIG_VLLM_PRODUCTION_STACK=y |
| 38 | +CONFIG_VLLM_K8S_MINIKUBE=y |
| 39 | +CONFIG_VLLM_VERSION_LATEST=y |
| 40 | +CONFIG_VLLM_HELM_RELEASE_NAME="vllm-prod" |
| 41 | +CONFIG_VLLM_HELM_NAMESPACE="vllm-system" |
| 42 | +CONFIG_VLLM_PROD_STACK_REPO="https://vllm-project.github.io/production-stack" |
| 43 | +CONFIG_VLLM_PROD_STACK_CHART_VERSION="latest" |
| 44 | +CONFIG_VLLM_PROD_STACK_ROUTER_IMAGE="ghcr.io/vllm-project/production-stack/router" |
| 45 | +CONFIG_VLLM_PROD_STACK_ROUTER_TAG="latest" |
| 46 | +CONFIG_VLLM_PROD_STACK_ENABLE_MONITORING=y |
| 47 | +CONFIG_VLLM_PROD_STACK_ENABLE_AUTOSCALING=n |
| 48 | +CONFIG_VLLM_MODEL_URL="facebook/opt-125m" |
| 49 | +CONFIG_VLLM_MODEL_NAME="opt-125m" |
| 50 | +CONFIG_VLLM_REPLICA_COUNT=2 |
| 51 | +CONFIG_VLLM_USE_CPU_INFERENCE=y |
| 52 | +CONFIG_VLLM_REQUEST_CPU=8 |
| 53 | +CONFIG_VLLM_REQUEST_MEMORY="20Gi" |
| 54 | +CONFIG_VLLM_REQUEST_GPU=0 |
| 55 | +CONFIG_VLLM_MAX_MODEL_LEN=2048 |
| 56 | +CONFIG_VLLM_DTYPE="float32" |
| 57 | +CONFIG_VLLM_TENSOR_PARALLEL_SIZE=1 |
| 58 | +CONFIG_VLLM_ROUTER_ENABLED=y |
| 59 | +CONFIG_VLLM_ROUTER_ROUND_ROBIN=y |
| 60 | +CONFIG_VLLM_OBSERVABILITY_ENABLED=y |
| 61 | +CONFIG_VLLM_GRAFANA_PORT=3000 |
| 62 | +CONFIG_VLLM_PROMETHEUS_PORT=9090 |
| 63 | +CONFIG_VLLM_API_PORT=8000 |
| 64 | +CONFIG_VLLM_BENCHMARK_ENABLED=y |
| 65 | +CONFIG_VLLM_BENCHMARK_DURATION=60 |
| 66 | +CONFIG_VLLM_BENCHMARK_CONCURRENT_USERS=10 |
| 67 | +CONFIG_VLLM_BENCHMARK_RESULTS_DIR="/data/vllm-benchmark" |
0 commit comments