components/README.md
This directory contains the core components that make up the Dynamo inference framework. Each component serves a specific role in the distributed LLM serving architecture, enabling high-throughput, low-latency inference across multiple nodes and GPUs.
## Core Components
### Backends

Dynamo supports multiple inference engines, each with its own deployment configurations and capabilities:
- **[vLLM](/docs/backends/vllm/README.md)** - Full-featured vLLM integration with disaggregated serving, KV-aware routing, SLA-based planning, native KV cache events, and NIXL-based transfer mechanisms
- **[SGLang](/docs/backends/sglang/README.md)** - SGLang engine integration with ZMQ-based communication, supporting disaggregated serving and KV-aware routing
- **[TensorRT-LLM](/docs/backends/trtllm/README.md)** - TensorRT-LLM integration with disaggregated serving capabilities and TensorRT acceleration
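Whichever backend is deployed, clients interact with Dynamo through its OpenAI-compatible HTTP frontend, so the request shape is the same across engines. The sketch below builds such a request; the endpoint URL, port, and model name are illustrative assumptions, not values taken from this README.

```python
import json
import urllib.request

# Assumed endpoint: a Dynamo frontend serving an OpenAI-compatible
# API on localhost port 8000 (both are illustrative assumptions).
DYNAMO_URL = "http://localhost:8000/v1/chat/completions"


def build_chat_request(model: str, prompt: str, max_tokens: int = 64) -> dict:
    """Build an OpenAI-compatible chat completion payload.

    The same payload works regardless of which engine (vLLM, SGLang,
    TensorRT-LLM) is serving the model behind the frontend.
    """
    return {
        "model": model,
        "messages": [{"role": "user", "content": prompt}],
        "max_tokens": max_tokens,
        "stream": False,
    }


if __name__ == "__main__":
    # "Qwen/Qwen3-0.6B" is a placeholder model name for illustration.
    payload = build_chat_request("Qwen/Qwen3-0.6B", "Hello!")
    req = urllib.request.Request(
        DYNAMO_URL,
        data=json.dumps(payload).encode(),
        headers={"Content-Type": "application/json"},
    )
    with urllib.request.urlopen(req) as resp:
        print(json.load(resp)["choices"][0]["message"]["content"])
```

Because the frontend abstracts the engine away, switching backends requires no client-side changes beyond, at most, the model name.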