TileDB-Inc
diff --git a/apis/python/src/tiledb/vector_search/index.py b/apis/python/src/tiledb/vector_search/index.py
Lines changed: 5 additions & 7 deletions
diff --git a/apis/python/src/tiledb/vector_search/module.cc b/apis/python/src/tiledb/vector_search/module.cc
Lines changed: 9 additions & 19 deletions
diff --git a/apis/python/src/tiledb/vector_search/module.py b/apis/python/src/tiledb/vector_search/module.py
Lines changed: 0 additions & 8 deletions
diff --git a/apis/python/test/test_ingestion.py b/apis/python/test/test_ingestion.py
Lines changed: 24 additions & 24 deletions
@@ -100,9 +100,9 @@ def query(
         assert targets.dtype == np.float32
 
         targets_m = array_to_matrix(np.transpose(targets))
-        r = query_vq_heap(self._db, targets_m, self._ids, k, nthreads)
+        _, r = query_vq_heap(self._db, targets_m, self._ids, k, nthreads)
 
-        return np.transpose(np.array(r))
+        return np.transpose(np.array(_)), np.transpose(np.array(r))
 
 
 class IVFFlatIndex(Index):
@@ -222,7 +222,7 @@ def query(
         if mode is None:
             queries_m = array_to_matrix(np.transpose(queries))
             if self.memory_budget == -1:
-                r = ivf_query_ram(
+                _, r = ivf_query_ram(
                     self.dtype,
                     self._db,
                     self._centroids,
@@ -231,13 +231,12 @@ def query(
                     self._ids,
                     nprobe=nprobe,
                     k_nn=k,
-                    nth=True,  # ??
                     nthreads=nthreads,
                     ctx=self.ctx,
                     use_nuv_implementation=use_nuv_implementation,
                 )
             else:
-                r = ivf_query(
+                _, r = ivf_query(
                     self.dtype,
                     self.parts_db_uri,
                     self._centroids,
@@ -247,13 +246,12 @@ def query(
                     nprobe=nprobe,
                     k_nn=k,
                     memory_budget=self.memory_budget,
-                    nth=True,  # ??
                     nthreads=nthreads,
                     ctx=self.ctx,
                     use_nuv_implementation=use_nuv_implementation,
                 )
 
-            return np.transpose(np.array(r))
+            return np.transpose(np.array(_)), np.transpose(np.array(r))
         else:
             return self.taskgraph_query(
                 queries=queries,
 
@@ -5,15 +5,13 @@
 #include <pybind11/stl.h>
 
 #include "linalg.h"
-#include "ivf_index.h"
 #include "ivf_query.h"
 #include "flat_query.h"
 
 namespace py = pybind11;
 using Ctx = tiledb::Context;
 
 bool global_debug = false;
-double global_time_of_interest;
 
 bool enable_stats = false;
 std::vector<json> core_stats;
@@ -113,8 +111,7 @@ static void declare_qv_query_heap_infinite_ram(py::module& m, const std::string&
          std::vector<Id_Type>& ids,
          size_t nprobe,
          size_t k_nn,
-         bool nth,
-         size_t nthreads) -> ColMajorMatrix<size_t> { // TODO change return type
+         size_t nthreads) -> std::tuple<ColMajorMatrix<float>, ColMajorMatrix<size_t>> { // TODO change return type
 
         auto r = detail::ivf::qv_query_heap_infinite_ram(
             parts,
@@ -124,7 +121,6 @@ static void declare_qv_query_heap_infinite_ram(py::module& m, const std::string&
             ids,
             nprobe,
             k_nn,
-            nth,
             nthreads);
         return r;
         }, py::keep_alive<1,2>());
@@ -142,8 +138,7 @@ static void declare_qv_query_heap_finite_ram(py::module& m, const std::string& s
          size_t nprobe,
          size_t k_nn,
          size_t upper_bound,
-         bool nth,
-         size_t nthreads) -> ColMajorMatrix<size_t> { // TODO change return type
+         size_t nthreads) -> std::tuple<ColMajorMatrix<float>, ColMajorMatrix<size_t>> { // TODO change return type
 
         auto r = detail::ivf::qv_query_heap_finite_ram<T, Id_Type>(
             ctx,
@@ -155,7 +150,6 @@ static void declare_qv_query_heap_finite_ram(py::module& m, const std::string& s
             nprobe,
             k_nn,
             upper_bound,
-            nth,
             nthreads);
         return r;
         }, py::keep_alive<1,2>());
@@ -171,8 +165,7 @@ static void declare_nuv_query_heap_infinite_ram(py::module& m, const std::string
          std::vector<Id_Type>& ids,
          size_t nprobe,
          size_t k_nn,
-         bool nth,
-         size_t nthreads) -> ColMajorMatrix<size_t> { // TODO change return type
+         size_t nthreads) -> std::tuple<ColMajorMatrix<float>, ColMajorMatrix<size_t>> { // TODO change return type
 
         auto r = detail::ivf::nuv_query_heap_infinite_ram_reg_blocked(
             parts,
@@ -182,7 +175,6 @@ static void declare_nuv_query_heap_infinite_ram(py::module& m, const std::string
             ids,
             nprobe,
             k_nn,
-            nth,
             nthreads);
         return r;
         }, py::keep_alive<1,2>());
@@ -200,8 +192,7 @@ static void declare_nuv_query_heap_finite_ram(py::module& m, const std::string&
          size_t nprobe,
          size_t k_nn,
          size_t upper_bound,
-         bool nth,
-         size_t nthreads) -> ColMajorMatrix<size_t> { // TODO change return type
+         size_t nthreads) -> std::tuple<ColMajorMatrix<float>, ColMajorMatrix<size_t>> { // TODO change return type
 
         auto r = detail::ivf::nuv_query_heap_finite_ram_reg_blocked<T, Id_Type>(
             ctx,
@@ -213,7 +204,6 @@ static void declare_nuv_query_heap_finite_ram(py::module& m, const std::string&
             nprobe,
             k_nn,
             upper_bound,
-            nth,
             nthreads);
         return r;
         }, py::keep_alive<1,2>());
@@ -394,7 +384,7 @@ static void declare_vq_query_heap(py::module& m, const std::string& suffix) {
            ColMajorMatrix<float>& query_vectors,
            const std::vector<uint64_t> &ids,
            int k,
-           size_t nthreads) -> ColMajorMatrix<size_t> {
+           size_t nthreads) -> std::tuple<ColMajorMatrix<float>, ColMajorMatrix<size_t>> {
           auto r = detail::flat::vq_query_heap(data, query_vectors, ids, k, nthreads);
           return r;
         });
@@ -477,17 +467,17 @@ PYBIND11_MODULE(_tiledbvspy, m) {
         [](ColMajorMatrix<float>& data,
            ColMajorMatrix<float>& query_vectors,
            int k,
-           size_t nthreads) -> ColMajorMatrix<size_t> {
-          auto r = detail::flat::vq_query_nth(data, query_vectors, k, true, nthreads);
+           size_t nthreads) -> std::tuple<ColMajorMatrix<float>, ColMajorMatrix<size_t>> {
+          auto r = detail::flat::vq_query_heap(data, query_vectors, k, nthreads);
           return r;
         });
 
   m.def("query_vq_u8",
         [](tdbColMajorMatrix<uint8_t>& data,
            ColMajorMatrix<float>& query_vectors,
            int k,
-           size_t nthreads) -> ColMajorMatrix<size_t> {
-          auto r = detail::flat::vq_query_nth(data, query_vectors, k, true, nthreads);
+           size_t nthreads) -> std::tuple<ColMajorMatrix<float>, ColMajorMatrix<size_t>> {
+          auto r = detail::flat::vq_query_heap(data, query_vectors, k, nthreads);
           return r;
         });
 
 
@@ -188,7 +188,6 @@ def ivf_query_ram(
     ids: "Vector",
     nprobe: int,
     k_nn: int,
-    nth: bool,
     nthreads: int,
     ctx: "Ctx" = None,
     use_nuv_implementation: bool = False,
@@ -214,8 +213,6 @@ def ivf_query_ram(
         Number of probs
     k_nn: int
         Number of nn
-    nth: bool
-        Return nth records
     nthreads: int
         Number of theads
     ctx: Ctx
@@ -233,7 +230,6 @@ def ivf_query_ram(
             ids,
             nprobe,
             k_nn,
-            nth,
             nthreads,
         ]
     )
@@ -262,7 +258,6 @@ def ivf_query(
     nprobe: int,
     k_nn: int,
     memory_budget: int,
-    nth: bool,
     nthreads: int,
     ctx: "Ctx" = None,
     use_nuv_implementation: bool = False,
@@ -290,8 +285,6 @@ def ivf_query(
         Number of nn
     memory_budget: int
         Main memory budget
-    nth: bool
-        Return nth records
     nthreads: int
         Number of theads
     ctx: Ctx
@@ -311,7 +304,6 @@ def ivf_query(
             nprobe,
             k_nn,
             memory_budget,
-            nth,
             nthreads,
         ]
     )
 
@@ -25,7 +25,7 @@ def test_flat_ingestion_u8(tmp_path):
         index_uri=index_uri,
         source_uri=os.path.join(dataset_dir, "data.u8bin"),
     )
-    result = index.query(query_vectors, k=k)
+    _, result = index.query(query_vectors, k=k)
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
 
@@ -44,11 +44,11 @@ def test_flat_ingestion_f32(tmp_path):
         index_uri=index_uri,
         source_uri=os.path.join(dataset_dir, "data.f32bin"),
     )
-    result = index.query(query_vectors, k=k)
+    _, result = index.query(query_vectors, k=k)
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
     index_ram = FlatIndex(uri=index_uri)
-    result = index_ram.query(query_vectors, k=k)
+    _, result = index_ram.query(query_vectors, k=k)
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
 
@@ -71,7 +71,7 @@ def test_flat_ingestion_external_id_u8(tmp_path):
         source_uri=os.path.join(dataset_dir, "data.u8bin"),
         external_ids=external_ids
     )
-    result = index.query(query_vectors, k=k)
+    _, result = index.query(query_vectors, k=k)
     assert accuracy(result, gt_i, external_ids_offset=external_ids_offset) > MINIMUM_ACCURACY
 
 
@@ -96,22 +96,22 @@ def test_ivf_flat_ingestion_u8(tmp_path):
         partitions=partitions,
         input_vectors_per_work_item=int(size / 10),
     )
-    result = index.query(query_vectors, k=k, nprobe=nprobe)
+    _, result = index.query(query_vectors, k=k, nprobe=nprobe)
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
     index_ram = IVFFlatIndex(uri=index_uri, memory_budget=int(size / 10))
-    result = index_ram.query(query_vectors, k=k, nprobe=nprobe)
+    _, result = index_ram.query(query_vectors, k=k, nprobe=nprobe)
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
-    result = index_ram.query(
+    _, result = index_ram.query(
         query_vectors,
         k=k,
         nprobe=nprobe,
         use_nuv_implementation=True,
     )
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
-    result = index_ram.query(
+    _, result = index_ram.query(
         query_vectors,
         k=k,
         nprobe=nprobe,
@@ -144,26 +144,26 @@ def test_ivf_flat_ingestion_f32(tmp_path):
         input_vectors_per_work_item=int(size / 10),
     )
 
-    result = index.query(query_vectors, k=k, nprobe=nprobe)
+    _, result = index.query(query_vectors, k=k, nprobe=nprobe)
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
     index_ram = IVFFlatIndex(uri=index_uri, memory_budget=int(size / 10))
-    result = index_ram.query(query_vectors, k=k, nprobe=nprobe)
+    _, result = index_ram.query(query_vectors, k=k, nprobe=nprobe)
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
     index_ram = IVFFlatIndex(uri=index_uri, memory_budget=int(size / 10))
-    result = index_ram.query(query_vectors, k=k, nprobe=nprobe)
+    _, result = index_ram.query(query_vectors, k=k, nprobe=nprobe)
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
-    result = index_ram.query(
+    _, result = index_ram.query(
         query_vectors,
         k=k,
         nprobe=nprobe,
         use_nuv_implementation=True,
     )
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
-    result = index_ram.query(query_vectors, k=k, nprobe=nprobe, mode=Mode.LOCAL)
+    _, result = index_ram.query(query_vectors, k=k, nprobe=nprobe, mode=Mode.LOCAL)
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
 
@@ -186,26 +186,26 @@ def test_ivf_flat_ingestion_fvec(tmp_path):
         source_uri=source_uri,
         partitions=partitions,
     )
-    result = index.query(query_vectors, k=k, nprobe=nprobe)
+    _, result = index.query(query_vectors, k=k, nprobe=nprobe)
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
     # Test single query vector handling
-    result1 = index.query(query_vectors[10], k=k, nprobe=nprobe)
+    _, result1 = index.query(query_vectors[10], k=k, nprobe=nprobe)
     assert accuracy(result1, np.array([gt_i[10]])) > MINIMUM_ACCURACY
 
     index_ram = IVFFlatIndex(uri=index_uri)
-    result = index_ram.query(query_vectors, k=k, nprobe=nprobe)
+    _, result = index_ram.query(query_vectors, k=k, nprobe=nprobe)
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
-    result = index_ram.query(
+    _, result = index_ram.query(
         query_vectors,
         k=k,
         nprobe=nprobe,
         use_nuv_implementation=True,
     )
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
-    result = index_ram.query(query_vectors, k=k, nprobe=nprobe, mode=Mode.LOCAL)
+    _, result = index_ram.query(query_vectors, k=k, nprobe=nprobe, mode=Mode.LOCAL)
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
 
@@ -230,26 +230,26 @@ def test_ivf_flat_ingestion_numpy(tmp_path):
         input_vectors=input_vectors,
         partitions=partitions,
     )
-    result = index.query(query_vectors, k=k, nprobe=nprobe)
+    _, result = index.query(query_vectors, k=k, nprobe=nprobe)
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
     # Test single query vector handling
-    result1 = index.query(query_vectors[10], k=k, nprobe=nprobe)
+    _, result1 = index.query(query_vectors[10], k=k, nprobe=nprobe)
     assert accuracy(result1, np.array([gt_i[10]])) > MINIMUM_ACCURACY
 
     index_ram = IVFFlatIndex(uri=index_uri)
-    result = index_ram.query(query_vectors, k=k, nprobe=nprobe)
+    _, result = index_ram.query(query_vectors, k=k, nprobe=nprobe)
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
-    result = index_ram.query(
+    _, result = index_ram.query(
         query_vectors,
         k=k,
         nprobe=nprobe,
         use_nuv_implementation=True,
     )
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 
-    result = index_ram.query(query_vectors, k=k, nprobe=nprobe, mode=Mode.LOCAL)
+    _, result = index_ram.query(query_vectors, k=k, nprobe=nprobe, mode=Mode.LOCAL)
     assert accuracy(result, gt_i) > MINIMUM_ACCURACY
 def test_ivf_flat_ingestion_external_ids_numpy(tmp_path):
     source_uri = "test/data/siftsmall/siftsmall_base.fvecs"
@@ -275,5 +275,5 @@ def test_ivf_flat_ingestion_external_ids_numpy(tmp_path):
         partitions=partitions,
         external_ids=external_ids
     )
-    result = index.query(query_vectors, k=k, nprobe=nprobe)
+    _, result = index.query(query_vectors, k=k, nprobe=nprobe)
     assert accuracy(result, gt_i, external_ids_offset) > MINIMUM_ACCURACY