Skip to content

Commit 902a4ac

Browse files
Michael Norris and facebook-github-bot
authored and committed
Test serialization to make sure it fails (#4708)
Summary: this should fail the serialization test. This will not be merged. Differential Revision: D88175191
1 parent 9f58c4f commit 902a4ac

18 files changed

+1330
-38
lines changed

benchs/bench_hnsw_flat_panorama.py

Lines changed: 153 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,153 @@
1+
# Copyright (c) Meta Platforms, Inc. and affiliates.
2+
#
3+
# This source code is licensed under the MIT license found in the
4+
# LICENSE file in the root directory of this source tree.
5+
6+
import multiprocessing as mp
7+
import time
8+
9+
import faiss
10+
import matplotlib.pyplot as plt
11+
import numpy as np
12+
13+
try:
14+
from faiss.contrib.datasets_fb import (
15+
DatasetSIFT1M,
16+
DatasetGIST1M,
17+
SyntheticDataset,
18+
)
19+
except ImportError:
20+
from faiss.contrib.datasets import (
21+
DatasetSIFT1M,
22+
DatasetGIST1M,
23+
SyntheticDataset,
24+
)
25+
26+
27+
def eval_recall(index, efSearch_val, xq, gt, k):
    """Evaluate recall and QPS for a given efSearch value.

    Args:
        index: index to query; must expose ``search(xq, k=k)``.
        efSearch_val: efSearch value being evaluated (used for logging only;
            the caller is expected to have already set it on the index).
        xq: query vectors, shape ``(nq, d)``.
        gt: ground-truth neighbor ids, shape ``(nq, k)``.
        k: number of neighbors retrieved per query.

    Returns:
        ``(recall, qps)`` tuple.
    """
    # Use a monotonic, high-resolution clock: time.time() has coarse
    # granularity on some platforms and can return 0 elapsed time for
    # fast searches, which made the QPS computation divide by zero.
    t0 = time.perf_counter()
    _, I = index.search(xq, k=k)
    t = time.perf_counter() - t0

    nq = len(xq)
    # Guard against an empty query set and a zero elapsed time so the
    # function degrades gracefully instead of raising ZeroDivisionError.
    speed = t * 1000 / max(nq, 1)
    qps = 1000 / speed if speed > 0 else float("inf")

    # Positional match: a neighbor only counts if it appears at the same
    # rank as in the ground truth (stricter than set-intersection recall).
    corrects = (gt == I).sum()
    recall = corrects / max(nq * k, 1)
    print(
        f"\tefSearch {efSearch_val:3d}, Recall@{k}: "
        f"{recall:.6f}, speed: {speed:.6f} ms/query, QPS: {qps:.2f}"
    )

    return recall, qps
43+
44+
45+
def get_hnsw_index(index):
    """Return the HNSW index wrapped by ``index``.

    A ``PCA...,HNSW...`` factory string yields an ``IndexPreTransform``
    shell; unwrap and downcast its inner index so callers can reach the
    ``hnsw`` attribute. Anything else is returned unchanged.
    """
    is_wrapped = isinstance(index, faiss.IndexPreTransform)
    if not is_wrapped:
        return index
    return faiss.downcast_index(index.index)
50+
51+
52+
def eval_and_plot(name, ds, k=10, nlevels=8, plot_data=None):
    """Build the index described by factory string ``name``, sweep efSearch,
    and append ``(name, recall/qps array)`` to ``plot_data`` if given."""
    queries = ds.get_queries()
    database = ds.get_database()
    ground_truth = ds.get_groundtruth()

    # Fall back to the database itself when the dataset ships no train set.
    train_set = ds.get_train() if hasattr(ds, "get_train") else database

    nb, d = database.shape
    nq, d = queries.shape
    ground_truth = ground_truth[:, :k]

    print(f"\n======{name} on {ds.__class__.__name__}======")
    print(f"Database: {nb} vectors, {d} dimensions")
    print(f"Queries: {nq} vectors")

    # Build the index with all cores, then search single-threaded so QPS
    # numbers are comparable across configurations.
    index = faiss.index_factory(d, name)

    faiss.omp_set_num_threads(mp.cpu_count())
    index.train(train_set)
    index.add(database)

    faiss.omp_set_num_threads(1)

    # efSearch lives on the wrapped HNSW index, not on a PreTransform shell.
    hnsw_index = get_hnsw_index(index)

    measurements = []
    for efSearch in (16, 32, 64, 128, 256, 512):
        hnsw_index.hnsw.efSearch = efSearch
        measurements.append(
            eval_recall(index, efSearch, queries, ground_truth, k)
        )

    if plot_data is not None:
        plot_data.append((name, np.array(measurements)))
93+
94+
95+
def benchmark_dataset(ds, dataset_name, k=10, nlevels=8, M=32):
    """Run the HNSW-flat baseline and the PCA + Panorama variant on ``ds``
    and save a recall-vs-QPS plot named after ``dataset_name``."""
    d = ds.d
    results = []

    # Baseline first, then the Panorama variant. The PCA rotation
    # concentrates energy in the leading components, which the Panorama
    # level pruning exploits.
    factory_strings = [
        f"HNSW{M},Flat",
        f"PCA{d},HNSW{M},FlatPanorama{nlevels}",
    ]
    for factory in factory_strings:
        eval_and_plot(factory, ds, k=k, nlevels=nlevels, plot_data=results)

    # Render the recall/QPS tradeoff curves on a log-scaled QPS axis.
    plt.figure(figsize=(8, 6), dpi=80)
    for label, curve in results:
        plt.plot(curve[:, 0], curve[:, 1], marker="o", label=label)

    plt.title(f"HNSW Indexes on {dataset_name}")
    plt.xlabel(f"Recall@{k}")
    plt.ylabel("QPS")
    plt.yscale("log")
    plt.legend(bbox_to_anchor=(1.02, 0.1), loc="upper left", borderaxespad=0)
    plt.grid(True, alpha=0.3)

    output_file = f"bench_hnsw_flat_panorama_{dataset_name}.png"
    plt.savefig(output_file, bbox_inches="tight")
    print(f"Saved plot to {output_file}")
    plt.close()
129+
130+
131+
if __name__ == "__main__":
    K = 10
    NLEVELS = 8
    M = 32

    # Three datasets of increasing dimensionality: SIFT1M (128d),
    # GIST1M (960d), and a synthetic 2048d set
    # (100k train / 1M database / 10k queries).
    benchmarks = [
        (DatasetSIFT1M(), "SIFT1M"),
        (DatasetGIST1M(), "GIST1M"),
        (SyntheticDataset(2048, 100000, 1000000, 10000), "Synthetic2048D"),
    ]

    banner = "=" * 60
    for dataset, label in benchmarks:
        print("\n" + banner)
        print(f"Benchmarking on {label}")
        print(banner)
        benchmark_dataset(dataset, label, k=K, nlevels=NLEVELS, M=M)

    print("\n" + banner)
    print("All benchmarks completed!")
    print(banner)

faiss/IndexAdditiveQuantizer.cpp

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -86,6 +86,7 @@ struct AQDistanceComputerLUT : FlatCodesDistanceComputer {
8686

8787
float bias;
8888
void set_query(const float* x) final {
89+
q = x;
8990
// this is quite sub-optimal for multiple queries
9091
aq.compute_LUT(1, x, LUT.data());
9192
if (is_IP) {

faiss/IndexBinaryHNSW.cpp

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -227,7 +227,11 @@ void IndexBinaryHNSW::search(
227227
for (idx_t i = 0; i < n; i++) {
228228
res.begin(i);
229229
dis->set_query((float*)(x + i * code_size));
230-
hnsw.search(*dis, res, vt);
230+
// Given that IndexBinaryHNSW is not an IndexHNSW, we pass nullptr
231+
// as the index parameter. This state does not get used in the
232+
// search function, as it is merely there to enable Panorama
233+
// execution for IndexHNSWFlatPanorama.
234+
hnsw.search(*dis, nullptr, res, vt);
231235
res.end();
232236
}
233237
}

faiss/IndexFlat.cpp

Lines changed: 58 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -103,28 +103,38 @@ namespace {
103103
struct FlatL2Dis : FlatCodesDistanceComputer {
104104
size_t d;
105105
idx_t nb;
106-
const float* q;
107106
const float* b;
108107
size_t ndis;
108+
size_t npartial_dot_products;
109109

110110
float distance_to_code(const uint8_t* code) final {
111111
ndis++;
112112
return fvec_L2sqr(q, (float*)code, d);
113113
}
114114

115+
float partial_dot_product(
116+
const idx_t i,
117+
const uint32_t offset,
118+
const uint32_t num_components) final override {
119+
npartial_dot_products++;
120+
return fvec_inner_product(
121+
q + offset, b + i * d + offset, num_components);
122+
}
123+
115124
float symmetric_dis(idx_t i, idx_t j) override {
116125
return fvec_L2sqr(b + j * d, b + i * d, d);
117126
}
118127

119128
explicit FlatL2Dis(const IndexFlat& storage, const float* q = nullptr)
120129
: FlatCodesDistanceComputer(
121130
storage.codes.data(),
122-
storage.code_size),
131+
storage.code_size,
132+
q),
123133
d(storage.d),
124134
nb(storage.ntotal),
125-
q(q),
126135
b(storage.get_xb()),
127-
ndis(0) {}
136+
ndis(0),
137+
npartial_dot_products(0) {}
128138

129139
void set_query(const float* x) override {
130140
q = x;
@@ -162,6 +172,50 @@ struct FlatL2Dis : FlatCodesDistanceComputer {
162172
dis2 = dp2;
163173
dis3 = dp3;
164174
}
175+
176+
void partial_dot_product_batch_4(
177+
const idx_t idx0,
178+
const idx_t idx1,
179+
const idx_t idx2,
180+
const idx_t idx3,
181+
float& dp0,
182+
float& dp1,
183+
float& dp2,
184+
float& dp3,
185+
const uint32_t offset,
186+
const uint32_t num_components) final override {
187+
npartial_dot_products += 4;
188+
189+
// compute first, assign next
190+
const float* __restrict y0 =
191+
reinterpret_cast<const float*>(codes + idx0 * code_size);
192+
const float* __restrict y1 =
193+
reinterpret_cast<const float*>(codes + idx1 * code_size);
194+
const float* __restrict y2 =
195+
reinterpret_cast<const float*>(codes + idx2 * code_size);
196+
const float* __restrict y3 =
197+
reinterpret_cast<const float*>(codes + idx3 * code_size);
198+
199+
float dp0_ = 0;
200+
float dp1_ = 0;
201+
float dp2_ = 0;
202+
float dp3_ = 0;
203+
fvec_inner_product_batch_4(
204+
q + offset,
205+
y0 + offset,
206+
y1 + offset,
207+
y2 + offset,
208+
y3 + offset,
209+
num_components,
210+
dp0_,
211+
dp1_,
212+
dp2_,
213+
dp3_);
214+
dp0 = dp0_;
215+
dp1 = dp1_;
216+
dp2 = dp2_;
217+
dp3 = dp3_;
218+
}
165219
};
166220

167221
struct FlatIPDis : FlatCodesDistanceComputer {

faiss/IndexHNSW.cpp

Lines changed: 90 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -276,7 +276,7 @@ void hnsw_search(
276276
res.begin(i);
277277
dis->set_query(x + i * index->d);
278278

279-
HNSWStats stats = hnsw.search(*dis, res, vt, params);
279+
HNSWStats stats = hnsw.search(*dis, index, res, vt, params);
280280
n1 += stats.n1;
281281
n2 += stats.n2;
282282
ndis += stats.ndis;
@@ -649,6 +649,95 @@ IndexHNSWFlat::IndexHNSWFlat(int d, int M, MetricType metric)
649649
is_trained = true;
650650
}
651651

652+
/**************************************************************
653+
* IndexHNSWFlatPanorama implementation
654+
**************************************************************/
655+
656+
void IndexHNSWFlatPanorama::compute_cum_sums(
        const float* x,
        float* dst_cum_sums,
        int d,
        int num_panorama_levels,
        int panorama_level_width) {
    // dst_cum_sums[l] holds the L2 norm of the suffix of x that starts at
    // level l; the sentinel entry at index num_panorama_levels is 0.
    // Walking the levels backwards lets us keep the running sum of squares
    // in a single scalar instead of materializing a per-vector suffix-sum
    // array (saves memory).
    dst_cum_sums[num_panorama_levels] = 0.0f;

    float acc = 0.0f;
    for (int level = num_panorama_levels - 1; level >= 0; level--) {
        const int begin = level * panorama_level_width;
        // The last level may be narrower than panorama_level_width when
        // d is not a multiple of the level width.
        const int end = std::min(begin + panorama_level_width, d);
        for (int j = begin; j < end; j++) {
            acc += x[j] * x[j];
        }
        dst_cum_sums[level] = std::sqrt(acc);
    }
}
677+
678+
// Default constructor: empty index with no Panorama level geometry
// configured (width and level count are zeroed).
IndexHNSWFlatPanorama::IndexHNSWFlatPanorama()
        : IndexHNSWFlat(),
          cum_sums(),
          panorama_level_width(0),
          num_panorama_levels(0) {}
683+
684+
IndexHNSWFlatPanorama::IndexHNSWFlatPanorama(
        int d,
        int M,
        int num_panorama_levels,
        MetricType metric)
        : IndexHNSWFlat(d, M, metric),
          cum_sums(),
          // ceil(d / num_panorama_levels): the last level may be narrower.
          panorama_level_width(
                  (d + num_panorama_levels - 1) / num_panorama_levels),
          num_panorama_levels(num_panorama_levels) {
    // Only L2 is supported for now. Dot-product and cosine support is a
    // trivial addition left for future work.
    FAISS_THROW_IF_NOT(metric == METRIC_L2);

    // Flip the shared HNSW search path into Panorama mode. Not ideal, but
    // simpler than subclassing HNSW and overriding its search logic.
    hnsw.is_panorama = true;
}
704+
705+
void IndexHNSWFlatPanorama::add(idx_t n, const float* x) {
    // Compute the per-level cumulative (suffix) norms before delegating to
    // the base add — NOTE(review): the original code deliberately fills
    // cum_sums first, presumably so the entries are already visible to any
    // Panorama-mode search performed during graph construction; keep that
    // ordering.
    const idx_t n0 = ntotal;
    const size_t stride = num_panorama_levels + 1;
    cum_sums.resize((n0 + n) * stride);

    // Use idx_t for the loop variable: the original used size_t, which
    // triggers a signed/unsigned comparison against n (idx_t is signed).
    for (idx_t idx = 0; idx < n; idx++) {
        const float* vector = x + idx * d;
        compute_cum_sums(
                vector,
                &cum_sums[(n0 + idx) * stride],
                d,
                num_panorama_levels,
                panorama_level_width);
    }

    IndexHNSWFlat::add(n, x);
}
721+
722+
void IndexHNSWFlatPanorama::reset() {
    // Drop the cached cumulative norms along with the base index contents,
    // keeping cum_sums consistent with ntotal (== 0 after reset).
    cum_sums.clear();
    IndexHNSWFlat::reset();
}
726+
727+
void IndexHNSWFlatPanorama::permute_entries(const idx_t* perm) {
728+
std::vector<float> new_cum_sums(ntotal * (num_panorama_levels + 1));
729+
730+
for (idx_t i = 0; i < ntotal; i++) {
731+
idx_t src = perm[i];
732+
memcpy(&new_cum_sums[i * (num_panorama_levels + 1)],
733+
&cum_sums[src * (num_panorama_levels + 1)],
734+
(num_panorama_levels + 1) * sizeof(float));
735+
}
736+
737+
std::swap(cum_sums, new_cum_sums);
738+
IndexHNSWFlat::permute_entries(perm);
739+
}
740+
652741
/**************************************************************
653742
* IndexHNSWPQ implementation
654743
**************************************************************/

0 commit comments

Comments
 (0)