fix(cockroachdb): Handle 30s timeout and ensure vector index usage

viragtripathi · viragtripathi · commit de2f2a38c633 · 2025-11-25T23:06:45.000-05:00
Two critical fixes for multi-node CockroachDB clusters:

1. Connection Timeout Handling:
   On multi-node v25.4 clusters, CREATE VECTOR INDEX from subprocess
   contexts experiences a 30-second connection timeout. The index
   creation continues successfully in the background. This fix detects
   the timeout and polls for completion (up to 5 minutes).

2. Vector Index Usage:
   Fixed vector_search_beam_size not being set on pooled connections,
   causing queries to use full table scan instead of the vector index.
   Now configures every connection from the pool with proper beam size.

Testing:
- Single-node: Works without timeout (178s index creation)
- Multi-node: Successfully handles timeout and completes (131s total)
- Vector index: Now properly used for all searches (verified with EXPLAIN)
- Both achieve ~83% recall with good QPS

Fixes issues where:
- Benchmarks would fail despite successful index creation
- Searches were slow due to full table scans instead of index usage
diff --git a/vectordb_bench/backend/clients/cockroachdb/cockroachdb.py b/vectordb_bench/backend/clients/cockroachdb/cockroachdb.py
@@ -154,14 +154,25 @@ def _create_connection_pool(self) -> ConnectionPool:
         # Add statement timeout for long-running vector index operations
         conninfo += " options='-c statement_timeout=600s'"
 
+        # Configure each connection with vector support and search parameters
+        def configure_connection(conn):
+            register_vector(conn)
+            # Set vector_search_beam_size on every connection for index usage
+            if self.case_config is not None:
+                search_param = self.case_config.search_param()
+                beam_size = search_param.get("vector_search_beam_size", 32)
+                with conn.cursor() as cur:
+                    cur.execute(f"SET vector_search_beam_size = {beam_size}")
+                conn.commit()
+
         return ConnectionPool(
             conninfo=conninfo,
             min_size=self.pool_size,
             max_size=self.pool_size + self.max_overflow,
             max_lifetime=self.pool_recycle,
             max_idle=300,
             reconnect_timeout=10.0,
-            configure=lambda conn: register_vector(conn),
+            configure=configure_connection,
         )
 
     @contextmanager
@@ -307,38 +318,105 @@ def _create_index(self):
     def optimize(self, data_size: int | None = None):
         """Post-insert optimization: create index if needed.
 
-        Note: Uses connection pool instead of creating new connection to avoid
-        subprocess timeout issues in CockroachDB.
+        Note: On multi-node clusters, CockroachDB v25.4 may close connections
+        at 30s during CREATE VECTOR INDEX from subprocess contexts. The index
+        creation continues in background. We handle this gracefully by checking
+        if the index was created successfully after timeout.
         """
         log.info(f"{self.name} post-insert optimization")
         if self.case_config is not None and self.case_config.create_index_after_load:
-            # Use existing pool connection instead of creating new one
-            with self.pool.connection() as conn:
-                register_vector(conn)
-                conn.autocommit = True
-                cursor = conn.cursor()
-
-                try:
-                    # Build CREATE INDEX SQL (SKIP DROP to avoid timeouts)
-                    index_param = self.case_config.index_param()
-                    options_list = []
-                    for option in index_param["index_creation_with_options"]:
-                        if option["val"] is not None:
-                            options_list.append(f"{option['option_name']} = {option['val']}")
-
-                    with_clause = f" WITH ({', '.join(options_list)})" if options_list else ""
-                    sql_str = (
-                        f"CREATE VECTOR INDEX IF NOT EXISTS {self._index_name} "
-                        f"ON {self.table_name} ({self._vector_field} {index_param['metric']})"
-                        f"{with_clause}"
-                    )
-
-                    log.info(f"{self.name} creating vector index: {self._index_name}")
-                    log.info(f"Index SQL: {sql_str}")
-                    cursor.execute(sql_str)
-
-                finally:
-                    cursor.close()
+            import time
+
+            # Build CREATE INDEX SQL
+            index_param = self.case_config.index_param()
+            options_list = []
+            for option in index_param["index_creation_with_options"]:
+                if option["val"] is not None:
+                    options_list.append(f"{option['option_name']} = {option['val']}")
+
+            with_clause = f" WITH ({', '.join(options_list)})" if options_list else ""
+            sql_str = (
+                f"CREATE VECTOR INDEX IF NOT EXISTS {self._index_name} "
+                f"ON {self.table_name} ({self._vector_field} {index_param['metric']})"
+                f"{with_clause}"
+            )
+
+            log.info(f"{self.name} creating vector index: {self._index_name}")
+            log.info(f"Index SQL: {sql_str}")
+
+            start_time = time.time()
+            connection_closed = False
+
+            # Try to create index
+            try:
+                with self.pool.connection() as conn:
+                    register_vector(conn)
+                    conn.autocommit = True
+                    cursor = conn.cursor()
+                    try:
+                        cursor.execute(sql_str)
+                        elapsed = time.time() - start_time
+                        log.info(f"{self.name} index created successfully in {elapsed:.1f}s")
+                        return  # Success!
+                    finally:
+                        cursor.close()
+            except Exception as e:
+                elapsed = time.time() - start_time
+                # Check if this is the expected 30s timeout on multi-node clusters
+                if "server closed the connection" in str(e) or "connection" in str(e).lower():
+                    log.warning(f"Connection closed after {elapsed:.1f}s during index creation: {e}")
+                    log.info(f"This is expected on multi-node clusters - checking if index was created...")
+                    connection_closed = True
+                else:
+                    # Unexpected error, re-raise
+                    raise
+
+            # Connection closed - wait for background index creation to complete
+            if connection_closed:
+                max_wait = 300  # 5 minutes max
+                poll_interval = 5
+                waited = 0
+
+                while waited < max_wait:
+                    time.sleep(poll_interval)
+                    waited += poll_interval
+
+                    # Create fresh connection to check status
+                    try:
+                        check_conn = psycopg.connect(**self.connect_config)
+                        check_cursor = check_conn.cursor()
+                        try:
+                            # Check if index exists
+                            check_cursor.execute(
+                                "SELECT 1 FROM pg_indexes WHERE tablename = %s AND indexname = %s",
+                                (self.table_name, self._index_name),
+                            )
+                            if check_cursor.fetchone():
+                                # Index exists! Verify it's usable by doing a quick test query
+                                try:
+                                    check_cursor.execute(f"SELECT 1 FROM {self.table_name} LIMIT 1")
+                                    check_cursor.fetchone()
+                                    total_time = time.time() - start_time
+                                    log.info(
+                                        f"✅ Index {self._index_name} created successfully (total time: {total_time:.1f}s)"
+                                    )
+                                    return
+                                except Exception as query_error:
+                                    # Index not yet usable
+                                    log.info(
+                                        f"Index exists but not yet usable... ({waited}s elapsed, error: {query_error})"
+                                    )
+                        finally:
+                            check_cursor.close()
+                            check_conn.close()
+                    except Exception as check_error:
+                        log.warning(f"Error checking index status: {check_error}")
+                        # Continue waiting
+
+                # Timeout waiting for index
+                msg = f"Timeout waiting for index {self._index_name} after {waited}s"
+                log.error(msg)
+                raise RuntimeError(msg)
 
     @db_retry(max_attempts=3, initial_delay=0.5, backoff_factor=2.0)
     def insert_embeddings(