-{"version":{"pluginId":"default","version":"current","label":"Next","banner":null,"badge":false,"noIndex":false,"className":"docs-version-current","isLast":true,"docsSidebars":{"tutorialSidebar":[{"type":"link","label":"LLM Semantic Router","href":"/docs/intro","docId":"intro","unlisted":false},{"type":"category","label":"Overview","items":[{"type":"link","label":"Semantic Router Overview","href":"/docs/overview/semantic-router-overview","docId":"overview/semantic-router-overview","unlisted":false},{"type":"link","label":"Why Mixture of Models?","href":"/docs/overview/mixture-of-models","docId":"overview/mixture-of-models","unlisted":false}],"collapsed":true,"collapsible":true},{"type":"category","label":"Architecture","items":[{"type":"link","label":"System Architecture","href":"/docs/architecture/system-architecture","docId":"architecture/system-architecture","unlisted":false},{"type":"link","label":"Envoy ExtProc Integration","href":"/docs/architecture/envoy-extproc","docId":"architecture/envoy-extproc","unlisted":false},{"type":"link","label":"Router Implementation Details","href":"/docs/architecture/router-implementation","docId":"architecture/router-implementation","unlisted":false}],"collapsed":true,"collapsible":true},{"type":"category","label":"Model Training","items":[{"type":"link","label":"Model Training Overview","href":"/docs/training/training-overview","docId":"training/training-overview","unlisted":false},{"type":"link","label":"Classification Models","href":"/docs/training/classification-models","docId":"training/classification-models","unlisted":false},{"type":"link","label":"Datasets and Purposes","href":"/docs/training/datasets","docId":"training/datasets","unlisted":false}],"collapsed":true,"collapsible":true},{"type":"category","label":"Getting Started","items":[{"type":"link","label":"Installation Guide","href":"/docs/getting-started/installation","docId":"getting-started/installation","unlisted":false},{"type":"link","label":"Quick Start Guide","href":"/docs/getting-started/quick-start","docId":"getting-started/quick-start","unlisted":false},{"type":"link","label":"Configuration Guide","href":"/docs/getting-started/configuration","docId":"getting-started/configuration","unlisted":false}],"collapsed":true,"collapsible":true},{"type":"category","label":"API Reference","items":[{"type":"link","label":"Router API Reference","href":"/docs/api/router","docId":"api/router","unlisted":false},{"type":"link","label":"Classification API Reference","href":"/docs/api/classification","docId":"api/classification","unlisted":false}],"collapsed":true,"collapsible":true}]},"docs":{"api/classification":{"id":"api/classification","title":"Classification API Reference","description":"The Classification API provides direct access to the Semantic Router's classification models for intent detection, PII identification, and security analysis. This API is useful for testing, debugging, and standalone classification tasks.","sidebar":"tutorialSidebar"},"api/router":{"id":"api/router","title":"Router API Reference","description":"The Semantic Router provides a gRPC-based API that integrates seamlessly with Envoy's External Processing (ExtProc) protocol. This document covers the API endpoints, request/response formats, and integration patterns.","sidebar":"tutorialSidebar"},"architecture/envoy-extproc":{"id":"architecture/envoy-extproc","title":"Envoy ExtProc Integration","description":"The Semantic Router leverages Envoy's External Processing (ExtProc) filter to implement intelligent routing decisions. This integration provides a clean separation between traffic management (Envoy) and business logic (Semantic Router), enabling sophisticated routing capabilities while maintaining high performance.","sidebar":"tutorialSidebar"},"architecture/router-implementation":{"id":"architecture/router-implementation","title":"Router Implementation Details","description":"This document provides detailed insights into the core routing algorithms, classification logic, and implementation specifics of the Semantic Router.","sidebar":"tutorialSidebar"},"architecture/system-architecture":{"id":"architecture/system-architecture","title":"System Architecture","description":"The Semantic Router implements a sophisticated Mixture-of-Models (MoM) architecture using Envoy Proxy as the foundation, with an External Processor (ExtProc) service that provides intelligent routing capabilities. This design ensures high performance, scalability, and maintainability for production LLM deployments.","sidebar":"tutorialSidebar"},"getting-started/configuration":{"id":"getting-started/configuration","title":"Configuration Guide","description":"This guide covers all configuration options available in the Semantic Router, from basic setup to advanced customization for production deployments.","sidebar":"tutorialSidebar"},"getting-started/installation":{"id":"getting-started/installation","title":"Installation Guide","description":"This guide will help you set up and install the Semantic Router on your system. The installation process includes setting up dependencies, downloading models, and configuring the routing system.","sidebar":"tutorialSidebar"},"getting-started/quick-start":{"id":"getting-started/quick-start","title":"Quick Start Guide","description":"This guide will get you up and running with the Semantic Router in just a few minutes. Follow these steps to see the router in action with intelligent model selection.","sidebar":"tutorialSidebar"},"intro":{"id":"intro","title":"LLM Semantic Router","description":"License","sidebar":"tutorialSidebar"},"overview/mixture-of-models":{"id":"overview/mixture-of-models","title":"Why Mixture of Models?","description":"The Mixture of Models (MoM) approach represents a fundamental shift from traditional single-model deployment to a more intelligent, cost-effective, and performance-optimized architecture. This section explores the compelling reasons why MoM has become the preferred approach for production LLM deployments.","sidebar":"tutorialSidebar"},"overview/semantic-router-overview":{"id":"overview/semantic-router-overview","title":"Semantic Router Overview","description":"Semantic routers represent a paradigm shift in how we deploy and utilize large language models at scale. By intelligently routing queries to the most appropriate model based on semantic understanding, these systems optimize the critical balance between performance, cost, and quality.","sidebar":"tutorialSidebar"},"training/classification-models":{"id":"training/classification-models","title":"Classification Models","description":"This document provides in-depth technical details about each classification model used in the Semantic Router, including architecture specifics, training procedures, and performance characteristics.","sidebar":"tutorialSidebar"},"training/datasets":{"id":"training/datasets","title":"Datasets and Purposes","description":"This document provides comprehensive details about the datasets used to train each classification model in the Semantic Router, including data sources, preprocessing methods, and the specific purposes each dataset serves in the routing pipeline.","sidebar":"tutorialSidebar"},"training/training-overview":{"id":"training/training-overview","title":"Model Training Overview","description":"The Semantic Router relies on multiple specialized classification models to make intelligent routing decisions. This section provides a comprehensive overview of the training process, datasets used, and the purpose of each model in the routing pipeline.","sidebar":"tutorialSidebar"}}}}
0 commit comments