From 889e9f502ae1ee690fa0af50782e0bd0b1141a4e Mon Sep 17 00:00:00 2001 From: Tamas Bela Feher Date: Wed, 18 Oct 2023 05:32:40 +0200 Subject: [PATCH 1/6] Fix python script location in ANN bench description (#1906) This PR adjusts the description of the low level ANN benchmarks. Authors: - Tamas Bela Feher (https://github.com/tfeher) Approvers: - Corey J. Nolet (https://github.com/cjnolet) URL: https://github.com/rapidsai/raft/pull/1906 --- docs/source/ann_benchmarks_low_level.md | 48 ++++++++++++------------- 1 file changed, 22 insertions(+), 26 deletions(-) diff --git a/docs/source/ann_benchmarks_low_level.md b/docs/source/ann_benchmarks_low_level.md index d08a3a1791..55238954ba 100644 --- a/docs/source/ann_benchmarks_low_level.md +++ b/docs/source/ann_benchmarks_low_level.md @@ -2,57 +2,53 @@ #### End-to-end Example An end-to-end example (run from the RAFT source code root directory): ```bash -# (1) prepare a dataset -pushd +# (0) get raft sources +git clone https://github.com/rapidsai/raft.git +cd raft -cd cpp/bench/ann -mkdir data && cd data -wget http://ann-benchmarks.com/glove-100-angular.hdf5 +# (1) prepare a dataset +export PYTHONPATH=python/raft-ann-bench/src:$PYTHONPATH +python -m raft-ann-bench.get_dataset --dataset glove-100-angular --normalize -# option -n is used here to normalize vectors so cosine distance is converted +# option --normalize is used here to normalize vectors so cosine distance is converted # to inner product; don't use -n for l2 distance -python scripts/hdf5_to_fbin.py -n glove-100-angular.hdf5 - -mkdir glove-100-inner -mv glove-100-angular.base.fbin glove-100-inner/base.fbin -mv glove-100-angular.query.fbin glove-100-inner/query.fbin -mv glove-100-angular.groundtruth.neighbors.ibin glove-100-inner/groundtruth.neighbors.ibin -mv glove-100-angular.groundtruth.distances.fbin glove-100-inner/groundtruth.distances.fbin -popd # (2) build index -./cpp/build/RAFT_IVF_FLAT_ANN_BENCH \ - --data_prefix=cpp/bench/ann/data \ +$CONDA_PREFIX/bin/ann/RAFT_IVF_FLAT_ANN_BENCH \ + --data_prefix=datasets \ --build \ --benchmark_filter="raft_ivf_flat\..*" \ - cpp/bench/ann/conf/glove-100-inner.json + python/raft-ann-bench/src/raft-ann-bench/run/conf/glove-100-inner.json # (3) search -./cpp/build/RAFT_IVF_FLAT_ANN_BENCH \ - --data_prefix=cpp/bench/ann/data \ +$CONDA_PREFIX/bin/ann/RAFT_IVF_FLAT_ANN_BENCH\ + --data_prefix=datasets \ --benchmark_min_time=2s \ --benchmark_out=ivf_flat_search.csv \ --benchmark_out_format=csv \ --benchmark_counters_tabular \ --search \ - --benchmark_filter="raft_ivf_flat\..*" - cpp/bench/ann/conf/glove-100-inner.json + --benchmark_filter="raft_ivf_flat\..*" \ + python/raft-ann-bench/src/raft-ann-bench/run/conf/glove-100-inner.json + # optional step: plot QPS-Recall figure using data in ivf_flat_search.csv with your favorite tool ``` ##### Step 1: Prepare Dataset +Note: the preferred way to download and process smaller (million scale) datasets is to use the `get_dataset` script as demonstrated in the example above. + A dataset usually has 4 binary files containing database vectors, query vectors, ground truth neighbors and their corresponding distances. For example, Glove-100 dataset has files `base.fbin` (database vectors), `query.fbin` (query vectors), `groundtruth.neighbors.ibin` (ground truth neighbors), and `groundtruth.distances.fbin` (ground truth distances). The first two files are for index building and searching, while the other two are associated with a particular distance and are used for evaluation. The file suffixes `.fbin`, `.f16bin`, `.ibin`, `.u8bin`, and `.i8bin` denote that the data type of vectors stored in the file are `float32`, `float16`(a.k.a `half`), `int`, `uint8`, and `int8`, respectively. These binary files are little-endian and the format is: the first 8 bytes are `num_vectors` (`uint32_t`) and `num_dimensions` (`uint32_t`), and the following `num_vectors * num_dimensions * sizeof(type)` bytes are vectors stored in row-major order. -Some implementation can take `float16` database and query vectors as inputs and will have better performance. Use `script/fbin_to_f16bin.py` to transform dataset from `float32` to `float16` type. +Some implementation can take `float16` database and query vectors as inputs and will have better performance. Use `python/raft-ann-bench/src/raft-ann-bench/get_dataset/fbin_to_f16bin.py` to transform dataset from `float32` to `float16` type. Commonly used datasets can be downloaded from two websites: 1. Million-scale datasets can be found at the [Data sets](https://github.com/erikbern/ann-benchmarks#data-sets) section of [`ann-benchmarks`](https://github.com/erikbern/ann-benchmarks). - However, these datasets are in HDF5 format. Use `cpp/bench/ann/scripts/hdf5_to_fbin.py` to transform the format. A few Python packages are required to run it: + However, these datasets are in HDF5 format. Use `python/raft-ann-bench/src/raft-ann-bench/get_dataset/fbin_to_f16bin.py/hdf5_to_fbin.py` to transform the format. A few Python packages are required to run it: ```bash pip3 install numpy h5py ``` @@ -72,8 +68,8 @@ Commonly used datasets can be downloaded from two websites: 2. Billion-scale datasets can be found at [`big-ann-benchmarks`](http://big-ann-benchmarks.com). The ground truth file contains both neighbors and distances, thus should be split. A script is provided for this: ```bash - $ cpp/bench/ann/scripts/split_groundtruth.pl - usage: script/split_groundtruth.pl input output_prefix + $ python/raft-ann-bench/src/raft-ann-bench/split_groundtruth/split_groundtruth.pl + usage: split_groundtruth.pl input output_prefix ``` Take Deep-1B dataset as an example: ```bash @@ -82,7 +78,7 @@ Commonly used datasets can be downloaded from two websites: mkdir -p data/deep-1B && cd data/deep-1B # download manually "Ground Truth" file of "Yandex DEEP" # suppose the file name is deep_new_groundtruth.public.10K.bin - ../../scripts/split_groundtruth.pl deep_new_groundtruth.public.10K.bin groundtruth + /path/to/raft/python/raft-ann-bench/src/raft-ann-bench/split_groundtruth/split_groundtruth.pl deep_new_groundtruth.public.10K.bin groundtruth # two files 'groundtruth.neighbors.ibin' and 'groundtruth.distances.fbin' should be produced popd ``` From 50a9081254829177af34b70dc79178aeb16be37b Mon Sep 17 00:00:00 2001 From: Jake Awe <50372925+AyodeAwe@users.noreply.github.com> Date: Wed, 18 Oct 2023 08:37:02 -0500 Subject: [PATCH 2/6] update workflow links (#1907) --- .github/workflows/build.yaml | 16 ++++++++-------- .github/workflows/pr.yaml | 24 ++++++++++++------------ .github/workflows/test.yaml | 8 ++++---- ci/release/update-version.sh | 2 +- 4 files changed, 25 insertions(+), 25 deletions(-) diff --git a/.github/workflows/build.yaml b/.github/workflows/build.yaml index c2d564dfda..5a883b64ed 100644 --- a/.github/workflows/build.yaml +++ b/.github/workflows/build.yaml @@ -28,7 +28,7 @@ concurrency: jobs: cpp-build: secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/conda-cpp-build.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/conda-cpp-build.yaml@branch-23.12 with: build_type: ${{ inputs.build_type || 'branch' }} branch: ${{ inputs.branch }} @@ -37,7 +37,7 @@ jobs: python-build: needs: [cpp-build] secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/conda-python-build.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/conda-python-build.yaml@branch-23.12 with: build_type: ${{ inputs.build_type || 'branch' }} branch: ${{ inputs.branch }} @@ -46,7 +46,7 @@ jobs: upload-conda: needs: [cpp-build, python-build] secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/conda-upload-packages.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/conda-upload-packages.yaml@branch-23.12 with: build_type: ${{ inputs.build_type || 'branch' }} branch: ${{ inputs.branch }} @@ -57,7 +57,7 @@ jobs: if: github.ref_type == 'branch' needs: python-build secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/custom-job.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/custom-job.yaml@branch-23.12 with: arch: "amd64" branch: ${{ inputs.branch }} @@ -69,7 +69,7 @@ jobs: sha: ${{ inputs.sha }} wheel-build-pylibraft: secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/wheels-build.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/wheels-build.yaml@branch-23.12 with: build_type: ${{ inputs.build_type || 'branch' }} branch: ${{ inputs.branch }} @@ -79,7 +79,7 @@ jobs: wheel-publish-pylibraft: needs: wheel-build-pylibraft secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/wheels-publish.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/wheels-publish.yaml@branch-23.12 with: build_type: ${{ inputs.build_type || 'branch' }} branch: ${{ inputs.branch }} @@ -89,7 +89,7 @@ jobs: wheel-build-raft-dask: needs: wheel-publish-pylibraft secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/wheels-build.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/wheels-build.yaml@branch-23.12 with: build_type: ${{ inputs.build_type || 'branch' }} branch: ${{ inputs.branch }} @@ -99,7 +99,7 @@ jobs: wheel-publish-raft-dask: needs: wheel-build-raft-dask secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/wheels-publish.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/wheels-publish.yaml@branch-23.12 with: build_type: ${{ inputs.build_type || 'branch' }} branch: ${{ inputs.branch }} diff --git a/.github/workflows/pr.yaml b/.github/workflows/pr.yaml index 8c99e3de6a..c8bd28d4bb 100644 --- a/.github/workflows/pr.yaml +++ b/.github/workflows/pr.yaml @@ -24,41 +24,41 @@ jobs: - wheel-tests-raft-dask - devcontainer secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/pr-builder.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/pr-builder.yaml@branch-23.12 checks: secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/checks.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/checks.yaml@branch-23.12 with: enable_check_generated_files: false conda-cpp-build: needs: checks secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/conda-cpp-build.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/conda-cpp-build.yaml@branch-23.12 with: build_type: pull-request node_type: cpu16 conda-cpp-tests: needs: conda-cpp-build secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/conda-cpp-tests.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/conda-cpp-tests.yaml@branch-23.12 with: build_type: pull-request conda-python-build: needs: conda-cpp-build secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/conda-python-build.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/conda-python-build.yaml@branch-23.12 with: build_type: pull-request conda-python-tests: needs: conda-python-build secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/conda-python-tests.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/conda-python-tests.yaml@branch-23.12 with: build_type: pull-request docs-build: needs: conda-python-build secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/custom-job.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/custom-job.yaml@branch-23.12 with: build_type: pull-request node_type: "gpu-v100-latest-1" @@ -68,34 +68,34 @@ jobs: wheel-build-pylibraft: needs: checks secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/wheels-build.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/wheels-build.yaml@branch-23.12 with: build_type: pull-request script: ci/build_wheel_pylibraft.sh wheel-tests-pylibraft: needs: wheel-build-pylibraft secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/wheels-test.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/wheels-test.yaml@branch-23.12 with: build_type: pull-request script: ci/test_wheel_pylibraft.sh wheel-build-raft-dask: needs: wheel-tests-pylibraft secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/wheels-build.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/wheels-build.yaml@branch-23.12 with: build_type: pull-request script: "ci/build_wheel_raft_dask.sh" wheel-tests-raft-dask: needs: wheel-build-raft-dask secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/wheels-test.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/wheels-test.yaml@branch-23.12 with: build_type: pull-request script: ci/test_wheel_raft_dask.sh devcontainer: secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/build-in-devcontainer.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/build-in-devcontainer.yaml@branch-23.12 with: build_command: | sccache -z; diff --git a/.github/workflows/test.yaml b/.github/workflows/test.yaml index 4e45ae29f6..1c2395cb68 100644 --- a/.github/workflows/test.yaml +++ b/.github/workflows/test.yaml @@ -16,7 +16,7 @@ on: jobs: conda-cpp-tests: secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/conda-cpp-tests.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/conda-cpp-tests.yaml@branch-23.12 with: build_type: nightly branch: ${{ inputs.branch }} @@ -24,7 +24,7 @@ jobs: sha: ${{ inputs.sha }} conda-python-tests: secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/conda-python-tests.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/conda-python-tests.yaml@branch-23.12 with: build_type: nightly branch: ${{ inputs.branch }} @@ -32,7 +32,7 @@ jobs: sha: ${{ inputs.sha }} wheel-tests-pylibraft: secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/wheels-test.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/wheels-test.yaml@branch-23.12 with: build_type: nightly branch: ${{ inputs.branch }} @@ -41,7 +41,7 @@ jobs: script: ci/test_wheel_pylibraft.sh wheel-tests-raft-dask: secrets: inherit - uses: rapidsai/shared-action-workflows/.github/workflows/wheels-test.yaml@branch-23.12 + uses: rapidsai/shared-workflows/.github/workflows/wheels-test.yaml@branch-23.12 with: build_type: nightly branch: ${{ inputs.branch }} diff --git a/ci/release/update-version.sh b/ci/release/update-version.sh index a867a71f68..63e0fd5ba9 100755 --- a/ci/release/update-version.sh +++ b/ci/release/update-version.sh @@ -82,7 +82,7 @@ for FILE in .github/workflows/*.yaml; do done for FILE in .github/workflows/*.yaml; do - sed_runner "/shared-action-workflows/ s/@.*/@branch-${NEXT_SHORT_TAG}/g" "${FILE}" + sed_runner "/shared-workflows/ s/@.*/@branch-${NEXT_SHORT_TAG}/g" "${FILE}" done sed_runner "s/RAPIDS_VERSION_NUMBER=\".*/RAPIDS_VERSION_NUMBER=\"${NEXT_SHORT_TAG}\"/g" ci/build_docs.sh From eb96fc6321f0b939171853fefbf5fe87cc6482d3 Mon Sep 17 00:00:00 2001 From: Tamas Bela Feher Date: Wed, 18 Oct 2023 21:17:33 +0200 Subject: [PATCH 3/6] Remove unnecessary dataset path check in ANN bench (#1908) This PR removes a superfluous path check. This check is not necessary, since the actual dataset path is computed differently (see `legacy_result_folder`), using the path field in the config file. The existing test ties the dataset file name to the config file name, therefore imposes an unnecessary restriction. In practice I often have multiple json configs using the same dataset dir. Authors: - Tamas Bela Feher (https://github.com/tfeher) Approvers: - Ben Frederickson (https://github.com/benfred) URL: https://github.com/rapidsai/raft/pull/1908 --- python/raft-ann-bench/src/raft-ann-bench/run/__main__.py | 2 -- 1 file changed, 2 deletions(-) diff --git a/python/raft-ann-bench/src/raft-ann-bench/run/__main__.py b/python/raft-ann-bench/src/raft-ann-bench/run/__main__.py index 9e2da7328d..3b670dc464 100644 --- a/python/raft-ann-bench/src/raft-ann-bench/run/__main__.py +++ b/python/raft-ann-bench/src/raft-ann-bench/run/__main__.py @@ -243,8 +243,6 @@ def main(): dataset_path = args.dataset_path if not os.path.exists(conf_filepath): raise FileNotFoundError(conf_filename) - if not os.path.exists(os.path.join(args.dataset_path, dataset_name)): - raise FileNotFoundError(os.path.join(args.dataset_path, dataset_name)) with open(conf_filepath, "r") as f: conf_file = json.load(f) From 6fdb886818876e416aa0cbac392dc26f0507b275 Mon Sep 17 00:00:00 2001 From: Ben Frederickson Date: Wed, 18 Oct 2023 19:05:44 -0700 Subject: [PATCH 4/6] Remove dynamic entry-points from raft-ann-bench (#1910) Building raft-ann-bench can throw a ``` distutils.errors.DistutilsOptionError: No configuration found for dynamic 'entry-points'. Some dynamic fields need to be specified via `tool.setuptools.dynamic` others must be specified via the equivalent attribute in `setup.py`. ``` error sometimes depending on distutils version. This is becase we were specifying dynamic=entry-points, but not including the relevant `tool.setuptools.dynamic` section in pyproject.toml. Remove this to allow building Authors: - Ben Frederickson (https://github.com/benfred) Approvers: - Corey J. Nolet (https://github.com/cjnolet) URL: https://github.com/rapidsai/raft/pull/1910 --- python/raft-ann-bench/pyproject.toml | 1 - 1 file changed, 1 deletion(-) diff --git a/python/raft-ann-bench/pyproject.toml b/python/raft-ann-bench/pyproject.toml index 6562937548..0cb36deaa7 100644 --- a/python/raft-ann-bench/pyproject.toml +++ b/python/raft-ann-bench/pyproject.toml @@ -27,7 +27,6 @@ classifiers = [ "Programming Language :: Python :: 3.9", "Programming Language :: Python :: 3.10", ] -dynamic = ["entry-points"] [project.urls] Homepage = "https://github.com/rapidsai/raft" From b5e14e1623fd157259d4345a209732a10b4fd95d Mon Sep 17 00:00:00 2001 From: "Corey J. Nolet" Date: Thu, 19 Oct 2023 04:07:07 +0200 Subject: [PATCH 5/6] Fixing Googletests and re-enabling in CI (#1904) Recently, the CI script to run the C++ gtests was changed to call `ctest` but it looks like this command has been failing in CI for quite some time. It's a little scary as most of RAFT's C++ APIs are not exposed through Python and so we cannot rely on those Python tests to guarantee quality of the C++ APIs. I'm reverting the change back to invoking the C++ binaries directly so that we can get the tests running again. Once we figure out why `ctest` isn't running the tests then we can make the change to use that again. Authors: - Corey J. Nolet (https://github.com/cjnolet) Approvers: - William Hicks (https://github.com/wphicks) - Robert Maynard (https://github.com/robertmaynard) - Ray Douglass (https://github.com/raydouglass) - Ben Frederickson (https://github.com/benfred) URL: https://github.com/rapidsai/raft/pull/1904 --- ci/test_cpp.sh | 1 + .../distance/detail/distance_ops/l2_exp.cuh | 42 +++++++++++++++---- .../raft/neighbors/detail/knn_brute_force.cuh | 14 +++---- cpp/test/distance/fused_l2_nn.cu | 3 +- cpp/test/neighbors/ann_cagra.cuh | 6 +-- cpp/test/neighbors/ann_ivf_pq.cuh | 2 +- docs/source/raft_ann_benchmarks.md | 33 ++++++--------- .../pylibraft/pylibraft/test/test_distance.py | 8 +--- 8 files changed, 59 insertions(+), 50 deletions(-) diff --git a/ci/test_cpp.sh b/ci/test_cpp.sh index 9c487be156..0f8efb171e 100755 --- a/ci/test_cpp.sh +++ b/ci/test_cpp.sh @@ -36,6 +36,7 @@ trap "EXITCODE=1" ERR set +e # Run libraft gtests from libraft-tests package +cd "$CONDA_PREFIX"/bin/gtests/libraft ctest -j8 --output-on-failure rapids-logger "Test script exiting with value: $EXITCODE" diff --git a/cpp/include/raft/distance/detail/distance_ops/l2_exp.cuh b/cpp/include/raft/distance/detail/distance_ops/l2_exp.cuh index 5e93d9e33b..5b4048c1c3 100644 --- a/cpp/include/raft/distance/detail/distance_ops/l2_exp.cuh +++ b/cpp/include/raft/distance/detail/distance_ops/l2_exp.cuh @@ -21,6 +21,22 @@ namespace raft::distance::detail::ops { +/** + * Reserve 1 digit of precision from each floating-point type + * for round-off error tolerance. + * @tparam DataT + */ +template +__device__ constexpr DataT get_clamp_precision() +{ + switch (sizeof(DataT)) { + case 2: return 1e-3; + case 4: return 1e-6; + case 8: return 1e-15; + default: return 0; + } +} + // Epilogue operator for CUTLASS based kernel template struct l2_exp_cutlass_op { @@ -31,11 +47,13 @@ struct l2_exp_cutlass_op { __device__ AccT operator()(DataT& aNorm, const DataT& bNorm, DataT& accVal) const noexcept { AccT outVal = aNorm + bNorm - DataT(2.0) * accVal; - // outVal could be negative due to numerical instability, especially when - // calculating self distance. - // clamp to 0 to avoid potential NaN in sqrt - outVal = outVal * (raft::abs(outVal) >= DataT(0.0001)); - return sqrt ? raft::sqrt(outVal) : outVal; + + /** + * Self-neighboring points should have (aNorm == bNorm) == accVal and the dot product (accVal) + * can sometimes have round-off errors, which will cause (aNorm == bNorm) ~ accVal instead. + */ + outVal = outVal * !((outVal * outVal < get_clamp_precision()) * (aNorm == bNorm)); + return sqrt ? raft::sqrt(outVal * (outVal > 0)) : outVal; } __device__ AccT operator()(DataT aData) const noexcept { return aData; } @@ -86,10 +104,16 @@ struct l2_exp_distance_op { for (int i = 0; i < Policy::AccRowsPerTh; ++i) { #pragma unroll for (int j = 0; j < Policy::AccColsPerTh; ++j) { - DataT val = regxn[i] + regyn[j] - (DataT)2.0 * acc[i][j]; - // val could be negative due to numerical instability, especially when - // calculating self distance. Clamp to 0 to avoid potential NaN in sqrt - acc[i][j] = val * (raft::abs(val) >= DataT(0.0001)); + DataT accVal = acc[i][j]; + DataT val = regxn[i] + regyn[j] - (DataT)2.0 * accVal; + + /** + * Self-neighboring points should have (aNorm == bNorm) == accVal and the dot product + * (accVal) can sometimes have round-off errors, which will cause (aNorm == bNorm) ~ accVal + * instead. + */ + acc[i][j] = + val * (val > 0) * !((val * val < get_clamp_precision()) * (regxn[i] == regyn[j])); } } if (sqrt) { diff --git a/cpp/include/raft/neighbors/detail/knn_brute_force.cuh b/cpp/include/raft/neighbors/detail/knn_brute_force.cuh index be05d5545f..5da4e77874 100644 --- a/cpp/include/raft/neighbors/detail/knn_brute_force.cuh +++ b/cpp/include/raft/neighbors/detail/knn_brute_force.cuh @@ -29,6 +29,7 @@ #include #include #include +#include #include #include #include @@ -186,6 +187,7 @@ void tiled_brute_force_knn(const raft::resources& handle, auto row_norms = search_norms.data(); auto col_norms = precomputed_index_norms ? precomputed_index_norms : index_norms.data(); auto dist = temp_distances.data(); + bool sqrt = metric == raft::distance::DistanceType::L2SqrtExpanded; raft::linalg::map_offset( handle, @@ -194,15 +196,9 @@ void tiled_brute_force_knn(const raft::resources& handle, IndexType row = i + (idx / current_centroid_size); IndexType col = j + (idx % current_centroid_size); - auto val = row_norms[row] + col_norms[col] - 2.0 * dist[idx]; - - // due to numerical instability (especially around self-distance) - // the distances here could be slightly negative, which will - // cause NaN values in the subsequent sqrt. Clamp to 0 - val = val * (val >= 0.0001); - if (metric == raft::distance::DistanceType::L2SqrtExpanded) { val = sqrt(val); } - val = distance_epilogue(val, row, col); - return val; + raft::distance::detail::ops::l2_exp_cutlass_op l2_op(sqrt); + auto val = l2_op(row_norms[row], col_norms[col], dist[idx]); + return distance_epilogue(val, row, col); }); } else if (metric == raft::distance::DistanceType::CosineExpanded) { auto row_norms = search_norms.data(); diff --git a/cpp/test/distance/fused_l2_nn.cu b/cpp/test/distance/fused_l2_nn.cu index 27c923b11d..565895565f 100644 --- a/cpp/test/distance/fused_l2_nn.cu +++ b/cpp/test/distance/fused_l2_nn.cu @@ -57,6 +57,7 @@ RAFT_KERNEL naiveKernel(raft::KeyValuePair* min, auto diff = midx >= m || nidx >= n ? DataT(0) : x[xidx] - y[yidx]; acc += diff * diff; } + if (Sqrt) { acc = raft::sqrt(acc); } ReduceOpT redOp; typedef cub::WarpReduce> WarpReduce; @@ -343,7 +344,7 @@ const std::vector> inputsd = { {0.00001, 128, 32, 33, 1234ULL}, {0.00001, 128, 64, 33, 1234ULL}, {0.00001, 128, 128, 65, 1234ULL}, {0.00001, 64, 128, 129, 1234ULL}, - {0.00001, 1805, 134, 2, 1234ULL}, {0.00001, 8192, 1024, 25, 1234ULL}, + {0.00001, 1805, 134, 2, 1234ULL}, //{0.00001, 8192, 1024, 25, 1234ULL}, }; typedef FusedL2NNTest FusedL2NNTestD_Sq; TEST_P(FusedL2NNTestD_Sq, Result) diff --git a/cpp/test/neighbors/ann_cagra.cuh b/cpp/test/neighbors/ann_cagra.cuh index c9336c16cd..1f4531071f 100644 --- a/cpp/test/neighbors/ann_cagra.cuh +++ b/cpp/test/neighbors/ann_cagra.cuh @@ -274,7 +274,7 @@ class AnnCagraTest : public ::testing::TestWithParam { distances_Cagra, ps.n_queries, ps.k, - 0.001, + 0.003, min_recall)); EXPECT_TRUE(eval_distances(handle_, database.data(), @@ -515,7 +515,7 @@ class AnnCagraFilterTest : public ::testing::TestWithParam { distances_Cagra, ps.n_queries, ps.k, - 0.001, + 0.003, min_recall)); EXPECT_TRUE(eval_distances(handle_, database.data(), @@ -628,7 +628,7 @@ class AnnCagraFilterTest : public ::testing::TestWithParam { distances_Cagra, ps.n_queries, ps.k, - 0.001, + 0.003, min_recall)); EXPECT_TRUE(eval_distances(handle_, database.data(), diff --git a/cpp/test/neighbors/ann_ivf_pq.cuh b/cpp/test/neighbors/ann_ivf_pq.cuh index d1f5ee5b03..87baf31c2b 100644 --- a/cpp/test/neighbors/ann_ivf_pq.cuh +++ b/cpp/test/neighbors/ann_ivf_pq.cuh @@ -312,7 +312,7 @@ class ivf_pq_test : public ::testing::TestWithParam { // Hence, encoding-decoding chain often leads to altering both the PQ codes and the // reconstructed data. compare_vectors_l2( - handle_, vectors_1.view(), vectors_2.view(), label, compression_ratio, 0.025); + handle_, vectors_1.view(), vectors_2.view(), label, compression_ratio, 0.04); // 0.025); } void check_packing(index* index, uint32_t label) diff --git a/docs/source/raft_ann_benchmarks.md b/docs/source/raft_ann_benchmarks.md index 315e2245d8..25fdf3f0f6 100644 --- a/docs/source/raft_ann_benchmarks.md +++ b/docs/source/raft_ann_benchmarks.md @@ -84,8 +84,6 @@ You can see the exact versions as well in the dockerhub site: [//]: # (```) - - ## How to run the benchmarks We provide a collection of lightweight Python scripts to run the benchmarks. There are 4 general steps to running the benchmarks and visualizing the results. @@ -118,17 +116,6 @@ will be written at location `datasets/glove-100-inner/`. ### Step 2: Build and Search Index The script `raft-ann-bench.run` will build and search indices for a given dataset and its specified configuration. -To confirgure which algorithms are available, we use `algos.yaml`. -To configure building/searching indices for a dataset, look at [index configuration](#json-index-config). -An entry in `algos.yaml` looks like: -```yaml -raft_ivf_pq: - executable: RAFT_IVF_PQ_ANN_BENCH - requires_gpu: true -``` -`executable` : specifies the name of the binary that will build/search the index. It is assumed to be -available in `raft/cpp/build/`. -`requires_gpu` : denotes whether an algorithm requires GPU to run. The usage of the script `raft-ann-bench.run` is: ```bash @@ -294,8 +281,6 @@ options: Path to billion-scale dataset groundtruth file (default: None) ``` - - ### Running with Docker containers Two methods are provided for running the benchmarks with the Docker containers. @@ -410,14 +395,8 @@ The table below contains the possible settings for the `algo` field. Each unique | HNSWlib | `hnswlib` | | RAFT | `raft_brute_force`, `raft_cagra`, `raft_ivf_flat`, `raft_ivf_pq` | - - - By default, the index will be placed in `bench/ann/data//index/`. Using `sift-128-euclidean` for the dataset with the `algo` example above, the indexes would be placed in `bench/ann/data/sift-128-euclidean/index/algo_name/param1_val1-param2_val2`. - - - ## Adding a new ANN algorithm ### Implementation and Configuration @@ -490,6 +469,7 @@ How to interpret these JSON objects is totally left to the implementation and sh } ``` + ### Adding a CMake Target In `raft/cpp/bench/ann/CMakeLists.txt`, we provide a `CMake` function to configure a new Benchmark target with the following signature: ``` @@ -511,3 +491,14 @@ ConfigureAnnBench( ``` This will create an executable called `HNSWLIB_ANN_BENCH`, which can then be used to run `HNSWLIB` benchmarks. + +Add a new entry to `algos.yaml` to map the name of the algorithm to its binary executable and specify whether the algorithm requires GPU support. +```yaml +raft_ivf_pq: + executable: RAFT_IVF_PQ_ANN_BENCH + requires_gpu: true +``` + +`executable` : specifies the name of the binary that will build/search the index. It is assumed to be +available in `raft/cpp/build/`. +`requires_gpu` : denotes whether an algorithm requires GPU to run. diff --git a/python/pylibraft/pylibraft/test/test_distance.py b/python/pylibraft/pylibraft/test/test_distance.py index f9d3890ff7..34ed86db01 100644 --- a/python/pylibraft/pylibraft/test/test_distance.py +++ b/python/pylibraft/pylibraft/test/test_distance.py @@ -21,8 +21,8 @@ from pylibraft.distance import pairwise_distance -@pytest.mark.parametrize("n_rows", [32, 100]) -@pytest.mark.parametrize("n_cols", [40, 100]) +@pytest.mark.parametrize("n_rows", [50, 100]) +@pytest.mark.parametrize("n_cols", [10, 50]) @pytest.mark.parametrize( "metric", [ @@ -63,8 +63,6 @@ def test_distance(n_rows, n_cols, inplace, metric, order, dtype): else: expected = cdist(input1, input1, metric) - expected[expected <= 1e-5] = 0.0 - input1_device = device_ndarray(input1) output_device = device_ndarray(output) if inplace else None @@ -79,6 +77,4 @@ def test_distance(n_rows, n_cols, inplace, metric, order, dtype): actual = output_device.copy_to_host() - actual[actual <= 1e-5] = 0.0 - assert np.allclose(expected, actual, atol=1e-3, rtol=1e-3) From 747f6a65b4a479926d7064e31532f964d54456e1 Mon Sep 17 00:00:00 2001 From: Divye Gala Date: Wed, 18 Oct 2023 22:08:59 -0400 Subject: [PATCH 6/6] Fix filepath in `raft-ann-bench/split_groundtruth` module (#1911) Authors: - Divye Gala (https://github.com/divyegala) Approvers: - Corey J. Nolet (https://github.com/cjnolet) - Dante Gama Dessavre (https://github.com/dantegd) URL: https://github.com/rapidsai/raft/pull/1911 --- .../raft-ann-bench/src/raft-ann-bench/run/__main__.py | 3 ++- .../src/raft-ann-bench/split_groundtruth/__main__.py | 10 +++++++--- 2 files changed, 9 insertions(+), 4 deletions(-) diff --git a/python/raft-ann-bench/src/raft-ann-bench/run/__main__.py b/python/raft-ann-bench/src/raft-ann-bench/run/__main__.py index 3b670dc464..a0d4fabb77 100644 --- a/python/raft-ann-bench/src/raft-ann-bench/run/__main__.py +++ b/python/raft-ann-bench/src/raft-ann-bench/run/__main__.py @@ -239,7 +239,6 @@ def main(): ) conf_filename = conf_filepath.split("/")[-1] conf_filedir = "/".join(conf_filepath.split("/")[:-1]) - dataset_name = conf_filename.replace(".json", "") dataset_path = args.dataset_path if not os.path.exists(conf_filepath): raise FileNotFoundError(conf_filename) @@ -247,6 +246,8 @@ def main(): with open(conf_filepath, "r") as f: conf_file = json.load(f) + dataset_name = conf_file["dataset"]["name"] + executables_to_run = dict() # At least one named index should exist in config file if args.indices: diff --git a/python/raft-ann-bench/src/raft-ann-bench/split_groundtruth/__main__.py b/python/raft-ann-bench/src/raft-ann-bench/split_groundtruth/__main__.py index e8625ce7d7..b886d40ea7 100644 --- a/python/raft-ann-bench/src/raft-ann-bench/split_groundtruth/__main__.py +++ b/python/raft-ann-bench/src/raft-ann-bench/split_groundtruth/__main__.py @@ -19,10 +19,14 @@ def split_groundtruth(groundtruth_filepath): - ann_bench_scripts_path = "split_groundtruth.pl" + ann_bench_scripts_path = os.path.join( + os.path.dirname(os.path.realpath(__file__)), "split_groundtruth.pl" + ) pwd = os.getcwd() - os.chdir("/".join(groundtruth_filepath.split("/")[:-1])) - groundtruth_filename = groundtruth_filepath.split("/")[-1] + path_to_groundtruth = os.path.normpath(groundtruth_filepath).split(os.sep) + if len(path_to_groundtruth) > 1: + os.chdir(os.path.join(*path_to_groundtruth[:-1])) + groundtruth_filename = path_to_groundtruth[-1] subprocess.run( [ann_bench_scripts_path, groundtruth_filename, "groundtruth"], check=True,