diff --git a/website/docs/overview/categories/overview.md b/website/docs/overview/categories/overview.md index 2d3fa116..9976b1ca 100644 --- a/website/docs/overview/categories/overview.md +++ b/website/docs/overview/categories/overview.md @@ -1,4 +1,4 @@ -# Category Overview +# Overview The Category system is the intelligence core of vLLM Semantic Router, enabling intelligent query classification and routing decisions based on semantic understanding of user inputs. diff --git a/website/docs/overview/semantic-router-overview.md b/website/docs/overview/semantic-router-overview.md index 5aaab1a6..958f04d6 100644 --- a/website/docs/overview/semantic-router-overview.md +++ b/website/docs/overview/semantic-router-overview.md @@ -1,4 +1,4 @@ -# Semantic Router Overview +# What is Semantic Router? Semantic routers represent a paradigm shift in how we deploy and utilize large language models at scale. By intelligently routing queries to the most appropriate model based on semantic understanding, these systems optimize the critical balance between performance, cost, and quality. diff --git a/docs/design/additional-prompt-classification-routing.md b/website/docs/proposals/prompt-classification-routing.md similarity index 98% rename from docs/design/additional-prompt-classification-routing.md rename to website/docs/proposals/prompt-classification-routing.md index a527b648..653d8b59 100644 --- a/docs/design/additional-prompt-classification-routing.md +++ b/website/docs/proposals/prompt-classification-routing.md @@ -1,4 +1,4 @@ -# Additional Prompt Classification Routing for vLLM Semantic Router +# Prompt Classification Routing **Related Issues:** [#313](https://github.com/vllm-project/semantic-router/issues/313), [#200](https://github.com/vllm-project/semantic-router/issues/200) @@ -212,7 +212,7 @@ The Regex Scanner uses regular expression patterns to detect structured data and - **Performance:** ~2-5ms for dozens of patterns - **Use Case:** PII patterns (SSN, credit cards), CVE IDs, email addresses, structured data - **Safety:** RE2 engine prevents catastrophic backtracking (ReDoS protection) -- **Limitations:** Best for <100 patterns; for larger rule sets, use MCP with Hyperscan +- **Limitations:** Best for fewer than 100 patterns; for larger rule sets, use MCP with Hyperscan **Example Use:** Detect and block Social Security Numbers, route CVE IDs to security models. @@ -347,7 +347,7 @@ The Signal Fusion Layer is the decision-making engine that combines all signals - **Priority-Based**: Rules evaluated from highest to lowest priority (200 → 0) - **Short-Circuit**: First matching rule wins, no further evaluation - **Boolean Expressions**: Combine multiple signal conditions with AND, OR, NOT -- **Flexible Comparisons**: Support ==, !=, >, <, >=, <= for numeric thresholds +- **Flexible Comparisons**: Support `==`, `!=`, `>`, `<`, `>=`, `<=` for numeric thresholds **Expression Capabilities:** diff --git a/website/sidebars.ts b/website/sidebars.ts index f324e817..2bde9dda 100644 --- a/website/sidebars.ts +++ b/website/sidebars.ts @@ -54,7 +54,7 @@ const sidebars: SidebarsConfig = { }, { type: 'category', - label: 'Tutorials', + label: 'Capacities', items: [ { type: 'category', @@ -92,6 +92,13 @@ const sidebars: SidebarsConfig = { }, ], }, + { + type: 'category', + label: 'Proposals', + items: [ + 'proposals/prompt-classification-routing', + ], + }, { type: 'category', label: 'Model Training',