littleniuer
diff --git a/CMakeLists.txt b/CMakeLists.txt
Lines changed: 1 addition & 5 deletions
diff --git a/INSTALL.md b/INSTALL.md
Lines changed: 5 additions & 5 deletions
diff --git a/benchs/README.md b/benchs/README.md
Lines changed: 1 addition & 0 deletions
diff --git a/benchs/bench_hnsw_prune_headroom.py b/benchs/bench_hnsw_prune_headroom.py
Lines changed: 234 additions & 0 deletions
diff --git a/c_api/impl/AuxIndexStructures_c.cpp b/c_api/impl/AuxIndexStructures_c.cpp
Lines changed: 1 addition & 1 deletion
diff --git a/cmake/thirdparty/fetch_rapids.cmake b/cmake/thirdparty/fetch_rapids.cmake
Lines changed: 2 additions & 2 deletions
diff --git a/conda/faiss-gpu-cuvs/meta.yaml b/conda/faiss-gpu-cuvs/meta.yaml
Lines changed: 16 additions & 8 deletions
@@ -53,11 +53,7 @@ project(faiss
   LANGUAGES ${FAISS_LANGUAGES})
 include(GNUInstallDirs)
 
-if(FAISS_ENABLE_CUVS)
-  set(CMAKE_CXX_STANDARD 17)
-else()
-  set(CMAKE_CXX_STANDARD 20)
-endif()
+set(CMAKE_CXX_STANDARD 20)
 
 list(APPEND CMAKE_MODULE_PATH "${PROJECT_SOURCE_DIR}/cmake")
 
 
@@ -6,7 +6,7 @@ pre-release nightly builds.
 
 - The CPU-only faiss-cpu conda package is currently available on Linux (x86-64 and aarch64), OSX (arm64 only), and Windows (x86-64)
 - faiss-gpu, containing both CPU and GPU indices, is available on Linux (x86-64 only) for CUDA 11.4 and 12.1
-- faiss-gpu-cuvs package containing GPU indices provided by [NVIDIA cuVS](https://github.com/rapidsai/cuvs/) version 25.10, is available on Linux (x86-64 only) for CUDA 12.4.
+- faiss-gpu-cuvs package containing GPU indices provided by [NVIDIA cuVS](https://github.com/rapidsai/cuvs/) version 26.02, is available on Linux (x86-64 only) for CUDA 12.4.
 
 To install the latest stable release:
 
@@ -61,7 +61,7 @@ found to run on other platforms as well, see
 [other platforms](https://github.com/facebookresearch/faiss/wiki/Related-projects#bindings-to-other-languages-and-porting-to-other-platforms).
 
 The basic requirements are:
-- a C++17 compiler (with OpenMP support version 2 or higher),
+- a C++20 compiler (with OpenMP support version 2 or higher),
 - a BLAS implementation (on Intel machines we strongly recommend using Intel MKL for best
 performance).
 
@@ -72,7 +72,7 @@ The optional requirements are:
 - for AMD GPUs:
   - AMD ROCm,
 - for using NVIDIA cuVS implementations:
-  - libcuvs=25.10
+  - libcuvs=26.02
 - for the python bindings:
   - python 3,
   - numpy,
@@ -87,9 +87,9 @@ section of the wiki](https://github.com/facebookresearch/faiss/wiki/Troubleshoot
 
 The libcuvs dependency should be installed via conda:
 ```
-conda install -c rapidsai -c conda-forge -c nvidia libcuvs=25.10 'cuda-version=12.6'
+conda install -c rapidsai -c conda-forge -c nvidia libcuvs=26.02 'cuda-version=12.6'
 ```
-For more ways to install cuVS 25.10, refer to the [RAPIDS Installation Guide](https://docs.rapids.ai/install).
+For more ways to install cuVS 26.02, refer to the [RAPIDS Installation Guide](https://docs.rapids.ai/install).
 
 ### Building with Intel(R) SVS
 
 
@@ -348,6 +348,7 @@ Certain tests / benchmarks might be outdated.
 * bench_hamming_computer.cpp - specialized implementations for Hamming distance computations
 * bench_heap_replace.cpp - benchmarks different implementations of certain calls for a Heap data structure
 * bench_hnsw.py - benchmarks HNSW in combination with other ones for SIFT1M dataset
+* bench_hnsw_prune_headroom.py - benchmarks HNSW prune_headroom recall and build time impact
 * bench_index_flat.py - benchmarks IndexFlatL2 on a synthetic dataset
 * bench_index_pq.py - benchmarks PQ on SIFT1M dataset
 * bench_ivf_fastscan_single_query.py - benchmarks a single query for different nprobe levels for IVF{nlist},PQ{M}x4fs on BIGANN dataset
 
@@ -0,0 +1,234 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+#
+# This source code is licensed under the MIT license found in the
+# LICENSE file in the root directory of this source tree.
+
+"""
+Benchmark script for testing HNSW prune_headroom recall impact.
+
+Compares recall and build time between different prune_headroom values.
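+When run_benchmark() is called without headroom_values, it compares:
+- Baseline: prune_headroom = 0.0 (original behavior, no headroom)
+- With headroom: prune_headroom = 0.2 (proposed default)
+The command-line default sweeps 0.0, 0.04, 0.08, 0.12, 0.16 and 0.20.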
+
+Usage:
+    python bench_hnsw_prune_headroom.py
+    python bench_hnsw_prune_headroom.py --nb 100000 --d 256
+    python bench_hnsw_prune_headroom.py --headroom_values 0.0 0.1 0.2 0.3
+"""
+
+import argparse
+import time
+
+import faiss
+
+try:
+    from faiss.contrib.datasets_fb import DatasetSIFT1M
+except ImportError:
+    from faiss.contrib.datasets import DatasetSIFT1M
+
+from faiss.contrib.datasets import SyntheticDataset
+
+
+def compute_recall(I, gt, k):
+    """Return recall@k for search results I against ground truth gt.
+
+    Only the first k columns of both arrays are compared. The intersection
+    count reported by faiss.eval_intersection is divided by the number of
+    ground-truth rows times k.
+    """
+    num_queries = gt.shape[0]
+    hits = faiss.eval_intersection(I[:, :k], gt[:, :k])
+    return hits / (num_queries * k)
+
+
+def build_hnsw_index(d, m, xb, ef_construction, prune_headroom):
+    """Build an HNSW index with the specified configuration.
+
+    Args:
+        d: Dimension of vectors
+        m: Node degree (M) passed to faiss.IndexHNSWSQ
+        xb: Base vectors, used both for training and for adding
+        ef_construction: Value assigned to index.hnsw.efConstruction
+        prune_headroom: Value assigned to index.hnsw.prune_headroom
+
+    Returns:
+        (index, build_time) where build_time is the duration of
+        index.add(xb) in seconds; training is not included.
+    """
+    index = faiss.IndexHNSWSQ(d, faiss.ScalarQuantizer.QT_4bit, m)
+    index.hnsw.efConstruction = ef_construction
+    index.hnsw.prune_headroom = prune_headroom
+
+    # Training runs before the timer starts, so build_time measures add() only.
+    index.train(xb)
+    # perf_counter() is monotonic and high-resolution, so the measured
+    # interval cannot be distorted by system clock adjustments.
+    start_time = time.perf_counter()
+    index.add(xb)
+    build_time = time.perf_counter() - start_time
+
+    return index, build_time
+
+
+def run_benchmark(
+    d=384,
+    m=32,
+    nb=50000,
+    nq=1000,
+    reps=3,
+    ef_construction=40,
+    ef_search_values=None,
+    k_values=None,
+    headroom_values=None,
+    use_sift1m=False,
+):
+    """
+    Run the prune_headroom recall benchmark.
+
+    For every prune_headroom value the index is rebuilt `reps` times. Each
+    build is searched once per efSearch value, and recall@k is computed for
+    every requested k from a single search at max(k_values).
+
+    Args:
+        d: Dimension of vectors (replaced by the dataset's when use_sift1m)
+        m: HNSW node degree (M)
+        nb: Number of base vectors (replaced by the dataset's when use_sift1m)
+        nq: Number of query vectors (replaced by the dataset's when use_sift1m)
+        reps: Number of times each headroom value is built and searched
+        ef_construction: efConstruction parameter for HNSW
+        ef_search_values: List of efSearch values to test
+        k_values: List of k values for recall@k
+        headroom_values: List of prune_headroom values to compare
+        use_sift1m: Use SIFT1M dataset instead of synthetic
+
+    Returns:
+        Dictionary containing benchmark results:
+        - "recalls": {(headroom, rep): {ef_search: {k: recall}}}
+        - "build_times": {headroom: seconds}, value of the last repetition
+        - "ndis_search": {headroom: ndis / nq}, value of the last repetition;
+          ndis is accumulated over the whole efSearch sweep
+        - "build_times_per_rep": {(headroom, rep): seconds}
+        - "ndis_search_per_rep": {(headroom, rep): ndis / nq}
+    """
+    if ef_search_values is None:
+        ef_search_values = [16, 32, 64, 128, 256]
+    if k_values is None:
+        k_values = [1, 10]
+    if headroom_values is None:
+        headroom_values = [0.0, 0.2]
+
+    if use_sift1m:
+        print("Loading SIFT1M dataset")
+        ds = DatasetSIFT1M()
+        xb = ds.get_database()
+        xq = ds.get_queries()
+        # The dataset dictates the sizes; the d/nb/nq arguments are ignored.
+        d = xb.shape[1]
+        nb = xb.shape[0]
+        nq = xq.shape[0]
+    else:
+        print(f"Generating synthetic dataset: d={d}, nb={nb}, nq={nq}")
+        ds = SyntheticDataset(d=d, nt=0, nb=nb, nq=nq)
+        xb = ds.get_database()
+        xq = ds.get_queries()
+
+    max_k = max(k_values)
+    print(f"Computing ground truth for k={max_k}")
+    gt = ds.get_groundtruth(k=max_k)
+
+    results = {
+        "build_times": {},
+        "ndis_search": {},
+        "recalls": {},
+        # Per-repetition measurements, keyed like "recalls", so that earlier
+        # repetitions are not lost when the per-headroom entries are
+        # overwritten.
+        "build_times_per_rep": {},
+        "ndis_search_per_rep": {},
+    }
+
+    for headroom in headroom_values:
+        for rep in range(reps):
+            index, build_time = build_hnsw_index(
+                d, m, xb, ef_construction, headroom)
+            results["build_times"][headroom] = build_time
+            results["build_times_per_rep"][(headroom, rep)] = build_time
+
+            # Reset once per build: ndis below covers every efSearch value.
+            faiss.cvar.hnsw_stats.reset()
+            row = {}
+            results["recalls"][(headroom, rep)] = row
+            for ef_search in ef_search_values:
+                index.hnsw.efSearch = ef_search
+                # Search once at max_k; smaller k values reuse a prefix of I.
+                _, I = index.search(xq, max_k)
+
+                col = {}
+                row[ef_search] = col
+                for k in k_values:
+                    recall = compute_recall(I, gt, k)
+                    col[k] = recall
+            ndis_search = faiss.cvar.hnsw_stats.ndis / nq
+            results["ndis_search"][headroom] = ndis_search
+            results["ndis_search_per_rep"][(headroom, rep)] = ndis_search
+            print(
+                f"HNSW{m}(prune_headroom={headroom:4.2f}): "
+                f"{build_time=:4.2f}s, {ndis_search=:5.1f}"
+            )
+
+    print_results_table(results, ef_search_values, k_values, headroom_values)
+    return results
+
+
+def print_results_table(results, ef_search_values, k_values, headroom_values):
+    """Print one recall table per k value.
+
+    Each table has one column per efSearch value and one row per entry of
+    results["recalls"], whose keys are (headroom, rep) tuples. The
+    headroom_values argument is accepted but not read here.
+    """
+    for k in k_values:
+        header = " | ".join(
+            [f"{k=:2}  "] + [f"ef={ef:3}" for ef in ef_search_values]
+        )
+
+        print(f"\n{header}")
+        print("-" * len(header))
+        for (h, _), row in results["recalls"].items():
+            cells = [f"{row[ef][k]:6.4f}" for ef in ef_search_values]
+            print(" | ".join([f"h={h:4.2f}"] + cells))
+
+
+if __name__ == "__main__":
+    # Command-line entry point: every option maps onto one run_benchmark()
+    # argument. Note that the CLI defaults for --d, --nq and
+    # --headroom_values differ from run_benchmark()'s own defaults.
+    parser = argparse.ArgumentParser(
+        description="HNSW prune_headroom recall and build time benchmark"
+    )
+    parser.add_argument(
+        "--d",
+        type=int,
+        default=128,
+        help="Dimension of vectors (default: 128)",
+    )
+    parser.add_argument(
+        "--m",
+        type=int,
+        default=32,
+        help="Node degree (M, default: 32)",
+    )
+    parser.add_argument(
+        "--nb",
+        type=int,
+        default=50000,
+        help="Number of base vectors (default: 50000)",
+    )
+    parser.add_argument(
+        "--nq",
+        type=int,
+        default=10000,
+        help="Number of query vectors (default: 10000)",
+    )
+    parser.add_argument(
+        "--ef_construction",
+        type=int,
+        default=40,
+        help="efConstruction parameter (default: 40)",
+    )
+    parser.add_argument(
+        "--ef_search",
+        type=int,
+        nargs="+",
+        default=[16, 32, 64, 128, 256],
+        help="efSearch values to test (default: 16 32 64 128 256)",
+    )
+    parser.add_argument(
+        "--k",
+        type=int,
+        nargs="+",
+        default=[1, 10],
+        help="k values for recall@k (default: 1 10)",
+    )
+    parser.add_argument(
+        "--headroom_values",
+        type=float,
+        nargs="+",
+        default=[0.0, 0.04, 0.08, 0.12, 0.16, 0.20],
+        help=(
+            "prune_headroom values to compare "
+            "(default: 0.0 0.04 0.08 0.12 0.16 0.20)"
+        ),
+    )
+    parser.add_argument(
+        "--reps",
+        type=int,
+        default=3,
+        help="Number of repetitions (default: 3)",
+    )
+    parser.add_argument(
+        "--sift1m",
+        action="store_true",
+        help="Use SIFT1M dataset instead of synthetic",
+    )
+    args = parser.parse_args()
+
+    run_benchmark(
+        d=args.d,
+        m=args.m,
+        nb=args.nb,
+        nq=args.nq,
+        reps=args.reps,
+        ef_construction=args.ef_construction,
+        ef_search_values=args.ef_search,
+        k_values=args.k,
+        headroom_values=args.headroom_values,
+        use_sift1m=args.sift1m,
+    )
@@ -280,7 +280,7 @@ int faiss_RangeSearchPartialResult_new_result(
         idx_t qno,
         FaissRangeQueryResult** qr) {
     try {
-        auto q = &reinterpret_cast<RangeSearchPartialResult*>(res)->new_result(
+        auto& q = reinterpret_cast<RangeSearchPartialResult*>(res)->new_result(
                 qno);
         if (qr) {
             *qr = reinterpret_cast<FaissRangeQueryResult*>(&q);
 
@@ -15,11 +15,11 @@
 # or implied. See the License for the specific language governing permissions and limitations under
 # the License.
 # =============================================================================
-set(RAPIDS_VERSION "25.10")
+set(RAPIDS_VERSION "26.02")
 set(rapids-cmake-version ${RAPIDS_VERSION})
 
 if(NOT EXISTS ${CMAKE_CURRENT_BINARY_DIR}/FAISS_RAPIDS.cmake)
-    file(DOWNLOAD https://raw.githubusercontent.com/rapidsai/rapids-cmake/branch-${RAPIDS_VERSION}/RAPIDS.cmake
+    file(DOWNLOAD https://raw.githubusercontent.com/rapidsai/rapids-cmake/release/${RAPIDS_VERSION}/RAPIDS.cmake
             ${CMAKE_CURRENT_BINARY_DIR}/FAISS_RAPIDS.cmake)
 endif()
 include(${CMAKE_CURRENT_BINARY_DIR}/FAISS_RAPIDS.cmake)
@@ -6,9 +6,10 @@
 {% set version = environ.get('GIT_DESCRIBE_TAG').lstrip('v') %}
 {% set suffix = "_nightly" if environ.get('PACKAGE_TYPE') == 'nightly' else "" %}
 {% set number = GIT_DESCRIBE_NUMBER %}
-{% set cuda_constraints=">=12.6,<12.7" %}
-{% set libcublas_constraints=">=12.6,<12.7" %}
-{% set cudart_constraints=">=12.6,<12.7" %}
+{% set cuda_major = (cudatoolkit | default("12.0")).split('.')[0] | int %}
+{% set cuda_constraints=">=13.2,<13.3" %}
+{% set libcublas_constraints=">=13.3,<13.4" %}  # libcublas 13.3 is actually for cuda 13.2
+{% set cudart_constraints=">=13.2,<13.3" %}
 
 package:
   name: faiss-pkg
@@ -60,7 +61,7 @@ outputs:
         - _openmp_mutex =4.5=2_kmp_llvm  # [x86_64]
         - mkl >=2024.2.2  # [x86_64]
         - openblas =0.3.30 # [not x86_64]
-        - libcuvs =25.10
+        - libcuvs =26.02
         - cuda-version {{ cuda_constraints }}
         - libsvs-runtime =0.2.0  # [x86_64 and linux]
       run:
@@ -69,7 +70,7 @@ outputs:
         - openblas =0.3.30 # [not x86_64]
         - cuda-cudart {{ cuda_constraints }}
         - libcublas {{ libcublas_constraints }}
-        - libcuvs =25.10
+        - libcuvs =26.02
         - cuda-version {{ cuda_constraints }}
         - libnvjitlink
         - libsvs-runtime =0.2.0  # [x86_64 and linux]
@@ -91,10 +92,10 @@ outputs:
       string: "py{{ PY_VER }}_h{{ PKG_HASH }}_{{ number }}_cuda{{ cudatoolkit }}{{ suffix }}"
     requirements:
       build:
-        - {{ compiler('cxx') }} =12.4
-        - sysroot_linux-64 =2.17 # [linux64]
+        - {{ compiler('cxx') }} =14.2
+        - sysroot_linux-64 =2.34 # [linux64]
         - swig =4.0
-        - cmake >=3.26.4
+        - cmake >=3.30.4
         - make =4.2 # [not win]
         - _openmp_mutex =4.5=2_kmp_llvm  # [x86_64]
         - mkl >=2024.2.2  # [x86_64]
@@ -117,13 +118,20 @@ outputs:
       requires:
         - numpy >=2.0,<2.3
         - scipy
+# TODO: remove cuda_major guard when we move to PyPI (pytorch via PyPI works on CUDA 13)
+{% if cuda_major < 13 %}
         - pytorch-gpu >=2.7
+{% endif %}
       commands:
         - python -X faulthandler -m unittest discover -v -s tests/ -p "test_*"
+{% if cuda_major < 13 %}
         - python -X faulthandler -m unittest discover -v -s tests/ -p "torch_*"
+{% endif %}
         - cp tests/common_faiss_tests.py faiss/gpu/test
         - python -X faulthandler -m unittest discover -v -s faiss/gpu/test/ -p "test_*"
+{% if cuda_major < 13 %}
         - python -X faulthandler -m unittest discover -v -s faiss/gpu/test/ -p "torch_*"
+{% endif %}
         - sh test_cpu_dispatch.sh  # [linux64]
       files:
         - test_cpu_dispatch.sh  # [linux64]