Merge pull request #80 from TileDB-Inc/npapa/fix_query

NikolaosPapailiou · web-flow · commit a4436be5561e · 2023-07-06T18:37:25.000+03:00
Fix segfault in finite ram queries
diff --git a/apis/python/test/common.py b/apis/python/test/common.py
@@ -181,3 +181,11 @@ def create_array(path: str, data):
     tiledb.Array.create(path, schema)
     with tiledb.open(path, "w") as A:
         A[:] = data
+
+def accuracy(result, gt):  # Fraction of ids in the rows of `result` that also occur in the same-index row of `gt`.
+    found = 0  # running count of ids common to a result row and its ground-truth row
+    total = 0  # running count of ids returned across all result rows
+    for i in range(len(result)):
+        total+=len(result[i])
+        found+=len(np.intersect1d(result[i], gt[i]))  # intersect1d yields the unique common values, so duplicate ids count once
+    return found/total  # NOTE(review): raises ZeroDivisionError when no ids were returned (total == 0)
diff --git a/apis/python/test/test_ingestion.py b/apis/python/test/test_ingestion.py
@@ -22,7 +22,7 @@ def test_flat_ingestion_u8(tmp_path):
         source_type=source_type,
     )
     result = np.transpose(index.query(np.transpose(query_vectors), k=k))
-    assert np.array_equal(np.sort(result, axis=1), np.sort(gt_i, axis=1))
+    assert accuracy(result, gt_i) > 0.98
 
 
 def test_flat_ingestion_f32(tmp_path):
@@ -43,7 +43,7 @@ def test_flat_ingestion_f32(tmp_path):
         source_type=source_type,
     )
     result = np.transpose(index.query(np.transpose(query_vectors), k=k))
-    assert np.array_equal(np.sort(result, axis=1), np.sort(gt_i, axis=1))
+    assert accuracy(result, gt_i) > 0.98
 
 
 def test_ivf_flat_ingestion_u8(tmp_path):
@@ -52,13 +52,12 @@ def test_ivf_flat_ingestion_u8(tmp_path):
     k = 10
     size = 100000
     partitions = 100
-    create_random_dataset_u8(nb=size, d=100, nq=2, k=k, path=dataset_dir)
+    create_random_dataset_u8(nb=size, d=100, nq=10, k=k, path=dataset_dir)
     source_type = "U8BIN"
     dtype = np.uint8
 
     query_vectors = get_queries(dataset_dir, dtype=dtype)
     gt_i, gt_d = get_groundtruth(dataset_dir, k)
-
     index = ingest(
         index_type="IVF_FLAT",
         array_uri=array_uri,
@@ -68,15 +67,15 @@ def test_ivf_flat_ingestion_u8(tmp_path):
         input_vectors_per_work_item=int(size / 10),
     )
     result = np.transpose(
-        index.query(np.transpose(query_vectors), k=k, nprobe=partitions)
+        index.query(np.transpose(query_vectors), k=k, nprobe=10)
     )
-    assert np.array_equal(np.sort(result, axis=1), np.sort(gt_i, axis=1))
+    assert accuracy(result, gt_i) > 0.98
 
-    index_ram = IVFFlatIndex(uri=array_uri, dtype=dtype)
+    index_ram = IVFFlatIndex(uri=array_uri, dtype=dtype, memory_budget=int(size / 10))
     result = np.transpose(
         index_ram.query(np.transpose(query_vectors), k=k, nprobe=partitions)
     )
-    assert np.array_equal(np.sort(result, axis=1), np.sort(gt_i, axis=1))
+    assert accuracy(result, gt_i) > 0.98
     result = np.transpose(
         index_ram.query(
             np.transpose(query_vectors),
@@ -85,7 +84,7 @@ def test_ivf_flat_ingestion_u8(tmp_path):
             use_nuv_implementation=True,
         )
     )
-    assert np.array_equal(np.sort(result, axis=1), np.sort(gt_i, axis=1))
+    assert accuracy(result, gt_i) > 0.98
 
 
 def test_ivf_flat_ingestion_f32(tmp_path):
@@ -112,13 +111,13 @@ def test_ivf_flat_ingestion_f32(tmp_path):
     result = np.transpose(
         index.query(np.transpose(query_vectors), k=k, nprobe=partitions)
     )
-    assert np.array_equal(np.sort(result, axis=1), np.sort(gt_i, axis=1))
+    assert accuracy(result, gt_i) > 0.98
 
-    index_ram = IVFFlatIndex(uri=array_uri, dtype=dtype)
+    index_ram = IVFFlatIndex(uri=array_uri, dtype=dtype, memory_budget=int(size / 10))
     result = np.transpose(
         index_ram.query(np.transpose(query_vectors), k=k, nprobe=partitions)
     )
-    assert np.array_equal(np.sort(result, axis=1), np.sort(gt_i, axis=1))
+    assert accuracy(result, gt_i) > 0.98
     result = np.transpose(
         index_ram.query(
             np.transpose(query_vectors),
@@ -127,7 +126,7 @@ def test_ivf_flat_ingestion_f32(tmp_path):
             use_nuv_implementation=True,
         )
     )
-    assert np.array_equal(np.sort(result, axis=1), np.sort(gt_i, axis=1))
+    assert accuracy(result, gt_i) > 0.98
 
 
 def test_ivf_flat_ingestion_fvec(tmp_path):
@@ -157,13 +156,13 @@ def test_ivf_flat_ingestion_fvec(tmp_path):
     result = np.transpose(
         index.query(np.transpose(query_vectors), k=k, nprobe=partitions)
     )
-    assert np.array_equal(np.sort(result, axis=1), np.sort(gt_i, axis=1))
+    assert accuracy(result, gt_i) > 0.98
 
     index_ram = IVFFlatIndex(uri=array_uri, dtype=dtype)
     result = np.transpose(
         index_ram.query(np.transpose(query_vectors), k=k, nprobe=partitions)
     )
-    assert np.array_equal(np.sort(result, axis=1), np.sort(gt_i, axis=1))
+    assert accuracy(result, gt_i) > 0.98
     result = np.transpose(
         index_ram.query(
             np.transpose(query_vectors),
@@ -172,4 +171,4 @@ def test_ivf_flat_ingestion_fvec(tmp_path):
             use_nuv_implementation=True,
         )
     )
-    assert np.array_equal(np.sort(result, axis=1), np.sort(gt_i, axis=1))
+    assert accuracy(result, gt_i) > 0.98
diff --git a/src/include/detail/ivf/qv.h b/src/include/detail/ivf/qv.h
@@ -609,16 +609,16 @@ auto nuv_query_heap_finite_ram(
     _i.start();
 
     size_t parts_per_thread =
-        (size(active_partitions) + nthreads - 1) / nthreads;
+        (shuffled_db.num_col_parts() + nthreads - 1) / nthreads;
 
     std::vector<std::future<void>> futs;
     futs.reserve(nthreads);
 
     for (size_t n = 0; n < nthreads; ++n) {
       auto first_part =
-          std::min<size_t>(n * parts_per_thread, size(active_partitions));
+          std::min<size_t>(n * parts_per_thread, shuffled_db.num_col_parts());
       auto last_part =
-          std::min<size_t>((n + 1) * parts_per_thread, size(active_partitions));
+          std::min<size_t>((n + 1) * parts_per_thread, shuffled_db.num_col_parts());
 
       if (first_part != last_part) {
         futs.emplace_back(std::async(
@@ -794,16 +794,16 @@ auto qv_query_heap_finite_ram(
 
     // size_t block_size = (size(active_partitions) + nthreads - 1) / nthreads;
     size_t parts_per_thread =
-        (size(active_partitions) + nthreads - 1) / nthreads;
+        (shuffled_db.num_col_parts() + nthreads - 1) / nthreads;
 
     std::vector<std::future<void>> futs;
     futs.reserve(nthreads);
 
     for (size_t n = 0; n < nthreads; ++n) {
       auto first_part =
-          std::min<size_t>(n * parts_per_thread, size(active_partitions));
+          std::min<size_t>(n * parts_per_thread, shuffled_db.num_col_parts());
       auto last_part =
-          std::min<size_t>((n + 1) * parts_per_thread, size(active_partitions));
+          std::min<size_t>((n + 1) * parts_per_thread, shuffled_db.num_col_parts());
 
       if (first_part != last_part) {
         futs.emplace_back(