redis
diff --git a/redisvl/schema/fields.py b/redisvl/schema/fields.py
Lines changed: 25 additions & 6 deletions
diff --git a/redisvl/utils/__init__.py b/redisvl/utils/__init__.py
Lines changed: 3 additions & 0 deletions
diff --git a/redisvl/utils/compression.py b/redisvl/utils/compression.py
Lines changed: 216 additions & 0 deletions
@@ -16,8 +16,11 @@
 from redis.commands.search.field import TextField as RedisTextField
 from redis.commands.search.field import VectorField as RedisVectorField
 
+from redisvl.utils.log import get_logger
 from redisvl.utils.utils import norm_cosine_distance, norm_l2_distance
 
+logger = get_logger(__name__)
+
 VECTOR_NORM_MAP = {
     "COSINE": norm_cosine_distance,
     "L2": norm_l2_distance,
@@ -241,12 +244,28 @@ def validate_svs_params(self):
                     f"Either use LeanVec4x8/LeanVec8x8 or remove the reduce parameter."
                 )
 
-        # Phase C: Add warning for LeanVec without reduce
-        # if self.compression and self.compression.value.startswith("LeanVec") and not self.reduce:
-        #     logger.warning(
-        #         f"LeanVec compression selected without 'reduce'. "
-        #         f"Consider setting reduce={self.dims//2} for better performance"
-        #     )
+        # LeanVec without reduce is not recommended
+        if (
+            self.compression
+            and self.compression.value.startswith("LeanVec")
+            and not self.reduce
+        ):
+            logger.warning(
+                f"LeanVec compression selected without 'reduce'. "
+                f"Consider setting reduce={self.dims//2} for better performance"
+            )
+
+        if self.graph_max_degree and self.graph_max_degree < 32:
+            logger.warning(
+                f"graph_max_degree={self.graph_max_degree} is low. "
+                f"Consider values between 32-64 for better recall."
+            )
+
+        if self.search_window_size and self.search_window_size > 100:
+            logger.warning(
+                f"search_window_size={self.search_window_size} is high. "
+                f"This may impact query latency. Consider values between 20-50."
+            )
 
         return self
 
 
@@ -0,0 +1,3 @@
+from redisvl.utils.compression import CompressionAdvisor
+
+__all__ = ["CompressionAdvisor"]
@@ -0,0 +1,216 @@
+"""SVS-VAMANA compression configuration utilities."""
+
+from typing import Literal, Optional, TypedDict, cast
+
+
class SVSConfig(TypedDict, total=False):
    """Typed dictionary describing an SVS-VAMANA index configuration.

    The dictionary is declared with ``total=False``, so every key is
    optional and a config may carry only the settings that apply to it
    (for example, ``reduce`` is meaningful for LeanVec compression only).

    Keys:
        algorithm: Index algorithm; always ``"svs-vamana"``.
        datatype: Vector datatype (float16, float32).
        compression: Compression type (LVQ4, LeanVec4x8, etc.).
        reduce: Reduced dimensionality (LeanVec only).
        graph_max_degree: Maximum number of edges per graph node.
        construction_window_size: Number of build-time candidates.
        search_window_size: Number of query-time candidates.
    """

    # Index algorithm identifier; the only allowed value is "svs-vamana".
    algorithm: Literal["svs-vamana"]
    # Vector element type, e.g. "float16" or "float32".
    datatype: str
    # Compression scheme name, e.g. "LVQ4" or "LeanVec4x8".
    compression: str
    # Target dimensionality after reduction; only for LeanVec.
    reduce: int
    # Max edges per node.
    graph_max_degree: int
    # Build-time candidates.
    construction_window_size: int
    # Query-time candidates.
    search_window_size: int
+
+
class CompressionAdvisor:
    """Helper to recommend compression settings based on vector characteristics.

    This class provides utilities to:
    - Recommend SVS-VAMANA configurations based on vector dimensions and priorities
    - Estimate memory savings from compression and dimensionality reduction

    All methods are static; the class only serves as a namespace.

    Examples:
        >>> # Get recommendations for high-dimensional vectors
        >>> config = CompressionAdvisor.recommend(dims=1536, priority="balanced")
        >>> config["compression"]
        'LeanVec4x8'
        >>> config["reduce"]
        768

        >>> # Estimate memory savings
        >>> savings = CompressionAdvisor.estimate_memory_savings(
        ...     compression="LeanVec4x8",
        ...     dims=1536,
        ...     reduce=768
        ... )
        >>> savings
        81.2
    """

    # Vectors with at least this many dimensions are recommended LeanVec;
    # anything smaller is recommended an LVQ variant.
    HIGH_DIM_THRESHOLD = 1024

    # Compression bit rates (bits per dimension)
    COMPRESSION_BITS = {
        "LVQ4": 4,
        "LVQ4x4": 8,
        "LVQ4x8": 12,
        "LVQ8": 8,
        "LeanVec4x8": 12,
        "LeanVec8x8": 16,
    }

    # Accepted values for the ``priority`` argument of ``recommend``.
    _PRIORITIES = ("speed", "memory", "balanced")

    # LVQ variant recommended for low-dimensional vectors, keyed by priority.
    _LVQ_BY_PRIORITY = {
        "memory": "LVQ4",
        "speed": "LVQ4x8",
        "balanced": "LVQ4x4",
    }

    @staticmethod
    def recommend(
        dims: int,
        priority: Literal["speed", "memory", "balanced"] = "balanced",
        datatype: Optional[str] = None,
    ) -> "SVSConfig":
        """Recommend compression settings based on dimensions and priorities.

        Args:
            dims: Vector dimensionality (must be > 0)
            priority: Optimization priority:
                - "memory": Maximize memory savings
                - "speed": Optimize for query speed
                - "balanced": Balance between memory and speed
            datatype: Override datatype (default: float16 for high-dim, float32 for low-dim)

        Returns:
            dict: Complete SVS-VAMANA configuration including:
                - algorithm: "svs-vamana"
                - datatype: Recommended datatype
                - compression: Compression type
                - reduce: Dimensionality reduction (for LeanVec only)
                - graph_max_degree: Graph connectivity
                - construction_window_size: Build-time candidates
                - search_window_size: Query-time candidates

        Raises:
            ValueError: If dims <= 0, or if priority is not one of
                "speed", "memory" or "balanced".

        Examples:
            >>> # High-dimensional embeddings (e.g., OpenAI ada-002)
            >>> config = CompressionAdvisor.recommend(dims=1536, priority="memory")
            >>> config["compression"]
            'LeanVec4x8'
            >>> config["reduce"]
            768

            >>> # Lower-dimensional embeddings
            >>> config = CompressionAdvisor.recommend(dims=384, priority="speed")
            >>> config["compression"]
            'LVQ4x8'
        """
        if dims <= 0:
            raise ValueError(f"dims must be positive, got {dims}")
        # Reject typos such as "Memory" instead of silently treating them
        # as "balanced".
        if priority not in CompressionAdvisor._PRIORITIES:
            raise ValueError(
                f"priority must be one of {CompressionAdvisor._PRIORITIES}, "
                f"got {priority!r}"
            )

        # High-dimensional vectors (>= HIGH_DIM_THRESHOLD) - use LeanVec
        if dims >= CompressionAdvisor.HIGH_DIM_THRESHOLD:
            # priority -> (reduced dimensionality, search window size)
            reduced_dims, search_window = {
                "memory": (dims // 2, 20),
                "speed": (max(256, dims // 4), 40),
                "balanced": (dims // 2, 30),
            }[priority]
            return cast(
                "SVSConfig",
                {
                    "algorithm": "svs-vamana",
                    "datatype": datatype or "float16",
                    "graph_max_degree": 64,
                    "construction_window_size": 300,
                    "compression": "LeanVec4x8",
                    "reduce": reduced_dims,
                    "search_window_size": search_window,
                },
            )

        # Lower-dimensional vectors - use LVQ (no dimensionality reduction)
        return cast(
            "SVSConfig",
            {
                "algorithm": "svs-vamana",
                "datatype": datatype or "float32",
                "graph_max_degree": 40,
                "construction_window_size": 250,
                "search_window_size": 20,
                "compression": CompressionAdvisor._LVQ_BY_PRIORITY[priority],
            },
        )

    @staticmethod
    def estimate_memory_savings(
        compression: str, dims: int, reduce: Optional[int] = None
    ) -> float:
        """Estimate memory savings percentage from compression.

        Calculates the percentage of memory saved compared to uncompressed float32 vectors.

        Args:
            compression: Compression type (e.g., "LVQ4", "LeanVec4x8"). A name
                missing from ``COMPRESSION_BITS`` is treated as uncompressed
                float32 (32 bits per dimension).
            dims: Original vector dimensionality (must be > 0)
            reduce: Reduced dimensionality. Only taken into account for
                LeanVec compression; ignored for every other compression
                type. ``None`` or ``0`` means no reduction.

        Returns:
            float: Memory savings percentage (0-100), rounded to one decimal place

        Raises:
            ValueError: If dims <= 0, or if reduce is negative or greater
                than dims for a LeanVec compression.

        Examples:
            >>> # LeanVec with dimensionality reduction
            >>> CompressionAdvisor.estimate_memory_savings(
            ...     compression="LeanVec4x8",
            ...     dims=1536,
            ...     reduce=768
            ... )
            81.2

            >>> # LVQ without dimensionality reduction
            >>> CompressionAdvisor.estimate_memory_savings(
            ...     compression="LVQ4",
            ...     dims=384
            ... )
            87.5
        """
        # Validate up front: dims == 0 would otherwise surface as a
        # ZeroDivisionError and negative dims as a meaningless percentage.
        if dims <= 0:
            raise ValueError(f"dims must be positive, got {dims}")

        # Base bits per dimension (float32)
        base_bits = 32

        # Compressed bits per dimension; unknown names count as uncompressed
        compression_bits = CompressionAdvisor.COMPRESSION_BITS.get(
            compression, base_bits
        )

        # Dimensionality reduction only exists for LeanVec, so applying
        # `reduce` to any other compression would overstate the savings.
        effective_dims = dims
        if reduce and compression.startswith("LeanVec"):
            if reduce < 0 or reduce > dims:
                raise ValueError(
                    f"reduce must be between 1 and dims ({dims}), got {reduce}"
                )
            effective_dims = reduce

        # Calculate savings relative to the uncompressed float32 footprint
        original_size = dims * base_bits
        compressed_size = effective_dims * compression_bits
        savings = (1 - compressed_size / original_size) * 100

        return round(savings, 1)
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+from redisvl.utils.compression import CompressionAdvisor`
	`2`	`+`
	`3`	`+__all__ = ["CompressionAdvisor"]`