From b882590a6525e7aa2fcc521bbb42316aaa5a3b5e Mon Sep 17 00:00:00 2001 From: Tarang Jain <40517122+tarang-jain@users.noreply.github.com> Date: Sat, 27 Jul 2024 15:26:36 -0400 Subject: [PATCH 1/2] Enable building FAISS main statically (#241) Port https://github.com/rapidsai/raft/pull/2323 PR from RAFT [Cleans up a collection of anti-patterns in the cuvs CMake code while also enabling building faiss from latest main] Authors: - Tarang Jain (https://github.com/tarang-jain) Approvers: - Robert Maynard (https://github.com/robertmaynard) - Corey J. Nolet (https://github.com/cjnolet) - Paul Taylor (https://github.com/trxcllnt) - Ray Douglass (https://github.com/raydouglass) URL: https://github.com/rapidsai/cuvs/pull/241 --- .devcontainer/Dockerfile | 7 + cpp/CMakeLists.txt | 6 +- cpp/bench/ann/CMakeLists.txt | 109 ++++++-------- cpp/cmake/patches/faiss_override.json | 9 ++ cpp/cmake/patches/ggnn_override.json | 16 ++ cpp/cmake/patches/hnswlib_override.json | 16 ++ cpp/cmake/thirdparty/get_faiss.cmake | 187 +++++++++++++----------- cpp/cmake/thirdparty/get_ggnn.cmake | 43 +++--- cpp/cmake/thirdparty/get_hnswlib.cmake | 76 +++++----- cpp/test/CMakeLists.txt | 84 +++++------ 10 files changed, 286 insertions(+), 267 deletions(-) create mode 100644 cpp/cmake/patches/faiss_override.json create mode 100644 cpp/cmake/patches/ggnn_override.json create mode 100644 cpp/cmake/patches/hnswlib_override.json diff --git a/.devcontainer/Dockerfile b/.devcontainer/Dockerfile index 9d35e3f97..594ba8c3c 100644 --- a/.devcontainer/Dockerfile +++ b/.devcontainer/Dockerfile @@ -5,6 +5,13 @@ ARG PYTHON_PACKAGE_MANAGER=conda FROM ${BASE} as pip-base +RUN apt update -y \ + && DEBIAN_FRONTEND=noninteractive apt install -y --no-install-recommends \ + # faiss dependencies + libblas-dev \ + liblapack-dev \ + && rm -rf /tmp/* /var/tmp/* /var/cache/apt/* /var/lib/apt/lists/*; + ENV DEFAULT_VIRTUAL_ENV=rapids FROM ${BASE} as conda-base diff --git a/cpp/CMakeLists.txt b/cpp/CMakeLists.txt index 5060f4591..d204a9a23 100644 --- a/cpp/CMakeLists.txt +++ b/cpp/CMakeLists.txt @@ -682,13 +682,13 @@ rapids_export( # * build test executable ---------------------------------------------------- if(BUILD_TESTS OR BUILD_C_TESTS) - include(internal/CMakeLists.txt) - include(test/CMakeLists.txt) + add_subdirectory(internal) + add_subdirectory(test) endif() # ################################################################################################## # * build ann benchmark executable ----------------------------------------------- if(BUILD_ANN_BENCH) - include(bench/ann/CMakeLists.txt) + add_subdirectory(bench/ann/) endif() diff --git a/cpp/bench/ann/CMakeLists.txt b/cpp/bench/ann/CMakeLists.txt index 6e9e66fad..80c1f3530 100644 --- a/cpp/bench/ann/CMakeLists.txt +++ b/cpp/bench/ann/CMakeLists.txt @@ -12,6 +12,8 @@ # the License. # ============================================================================= +list(APPEND CMAKE_MODULE_PATH "${CUVS_SOURCE_DIR}") + # ################################################################################################## # * benchmark options ------------------------------------------------------------------------------ @@ -39,31 +41,18 @@ option(CUVS_ANN_BENCH_SINGLE_EXE find_package(Threads REQUIRED) +set(CUVS_ANN_BENCH_USE_FAISS ON) +set(CUVS_FAISS_ENABLE_GPU ON) +set(CUVS_USE_FAISS_STATIC ON) + if(BUILD_CPU_ONLY) set(CUVS_FAISS_ENABLE_GPU OFF) - set(CUVS_ANN_BENCH_USE_FAISS_GPU_FLAT OFF) - set(CUVS_ANN_BENCH_USE_FAISS_GPU_IVF_FLAT OFF) - set(CUVS_ANN_BENCH_USE_FAISS_GPU_IVF_PQ OFF) set(CUVS_ANN_BENCH_USE_CUVS_IVF_FLAT OFF) set(CUVS_ANN_BENCH_USE_CUVS_IVF_PQ OFF) set(CUVS_ANN_BENCH_USE_CUVS_CAGRA OFF) set(CUVS_ANN_BENCH_USE_CUVS_BRUTE_FORCE OFF) set(CUVS_ANN_BENCH_USE_CUVS_CAGRA_HNSWLIB OFF) set(CUVS_ANN_BENCH_USE_GGNN OFF) -else() - set(CUVS_FAISS_ENABLE_GPU ON) -endif() - -set(CUVS_ANN_BENCH_USE_FAISS OFF) -if(CUVS_ANN_BENCH_USE_FAISS_GPU_FLAT - OR CUVS_ANN_BENCH_USE_FAISS_GPU_IVF_PQ - OR CUVS_ANN_BENCH_USE_FAISS_GPU_IVF_FLAT - OR CUVS_ANN_BENCH_USE_FAISS_CPU_FLAT - OR CUVS_ANN_BENCH_USE_FAISS_CPU_IVF_PQ - OR CUVS_ANN_BENCH_USE_FAISS_CPU_IVF_FLAT -) - set(CUVS_ANN_BENCH_USE_FAISS ON) - set(CUVS_USE_FAISS_STATIC ON) endif() set(CUVS_ANN_BENCH_USE_CUVS OFF) @@ -80,21 +69,17 @@ endif() # * Fetch requirements ------------------------------------------------------------- if(CUVS_ANN_BENCH_USE_HNSWLIB OR CUVS_ANN_BENCH_USE_CUVS_CAGRA_HNSWLIB) - include(cmake/thirdparty/get_hnswlib.cmake) + include(cmake/thirdparty/get_hnswlib) endif() -include(cmake/thirdparty/get_nlohmann_json.cmake) +include(cmake/thirdparty/get_nlohmann_json) if(CUVS_ANN_BENCH_USE_GGNN) - include(cmake/thirdparty/get_ggnn.cmake) + include(cmake/thirdparty/get_ggnn) endif() if(CUVS_ANN_BENCH_USE_FAISS) - # We need to ensure that faiss has all the conda information. So we currently use the very ugly - # hammer of `link_libraries` to ensure that all targets in this directory and the faiss directory - # will have the conda includes/link dirs - link_libraries($) - include(cmake/thirdparty/get_faiss.cmake) + include(cmake/thirdparty/get_faiss) endif() # ################################################################################################## @@ -154,8 +139,6 @@ function(ConfigureAnnBench) $<$:CUDA::cudart_static> $ $ - -static-libgcc - -static-libstdc++ ) set_target_properties( @@ -210,27 +193,34 @@ endif() if(CUVS_ANN_BENCH_USE_HNSWLIB) ConfigureAnnBench( - NAME HNSWLIB PATH bench/ann/src/hnswlib/hnswlib_benchmark.cpp LINKS hnswlib::hnswlib + NAME HNSWLIB PATH src/hnswlib/hnswlib_benchmark.cpp LINKS hnswlib::hnswlib ) endif() if(CUVS_ANN_BENCH_USE_CUVS_IVF_PQ) ConfigureAnnBench( - NAME CUVS_IVF_PQ PATH bench/ann/src/cuvs/cuvs_benchmark.cu - $<$:bench/ann/src/cuvs/cuvs_ivf_pq.cu> LINKS cuvs + NAME CUVS_IVF_PQ + PATH + src/cuvs/cuvs_benchmark.cu + src/cuvs/cuvs_ivf_pq.cu + LINKS cuvs ) endif() if(CUVS_ANN_BENCH_USE_CUVS_IVF_FLAT) ConfigureAnnBench( - NAME CUVS_IVF_FLAT PATH bench/ann/src/cuvs/cuvs_benchmark.cu - $<$:bench/ann/src/cuvs/cuvs_ivf_flat.cu> LINKS cuvs + NAME CUVS_IVF_FLAT + PATH + src/cuvs/cuvs_benchmark.cu + src/cuvs/cuvs_ivf_flat.cu + LINKS + cuvs ) endif() if(CUVS_ANN_BENCH_USE_CUVS_BRUTE_FORCE) - ConfigureAnnBench(NAME CUVS_BRUTE_FORCE PATH bench/ann/src/cuvs/cuvs_benchmark.cu LINKS cuvs) + ConfigureAnnBench(NAME CUVS_BRUTE_FORCE PATH src/cuvs/cuvs_benchmark.cu LINKS cuvs) endif() if(CUVS_ANN_BENCH_USE_CUVS_CAGRA) @@ -238,11 +228,11 @@ if(CUVS_ANN_BENCH_USE_CUVS_CAGRA) NAME CUVS_CAGRA PATH - bench/ann/src/cuvs/cuvs_benchmark.cu - $<$:bench/ann/src/cuvs/cuvs_cagra_float.cu> - $<$:bench/ann/src/cuvs/cuvs_cagra_half.cu> - $<$:bench/ann/src/cuvs/cuvs_cagra_int8_t.cu> - $<$:bench/ann/src/cuvs/cuvs_cagra_uint8_t.cu> + src/cuvs/cuvs_benchmark.cu + src/cuvs/cuvs_cagra_float.cu + src/cuvs/cuvs_cagra_half.cu + src/cuvs/cuvs_cagra_int8_t.cu + src/cuvs/cuvs_cagra_uint8_t.cu LINKS cuvs ) @@ -250,78 +240,65 @@ endif() if(CUVS_ANN_BENCH_USE_CUVS_CAGRA_HNSWLIB) ConfigureAnnBench( - NAME CUVS_CAGRA_HNSWLIB PATH bench/ann/src/cuvs/cuvs_cagra_hnswlib.cu LINKS cuvs + NAME CUVS_CAGRA_HNSWLIB PATH src/cuvs/cuvs_cagra_hnswlib.cu LINKS cuvs hnswlib::hnswlib ) endif() -set(CUVS_FAISS_TARGETS faiss::faiss) -if(TARGET faiss::faiss_avx2) - set(CUVS_FAISS_TARGETS faiss::faiss_avx2) -endif() - message("CUVS_FAISS_TARGETS: ${CUVS_FAISS_TARGETS}") message("CUDAToolkit_LIBRARY_DIR: ${CUDAToolkit_LIBRARY_DIR}") if(CUVS_ANN_BENCH_USE_FAISS_CPU_FLAT) ConfigureAnnBench( - NAME FAISS_CPU_FLAT PATH bench/ann/src/faiss/faiss_cpu_benchmark.cpp LINKS + NAME FAISS_CPU_FLAT PATH src/faiss/faiss_cpu_benchmark.cpp LINKS ${CUVS_FAISS_TARGETS} ) endif() if(CUVS_ANN_BENCH_USE_FAISS_CPU_IVF_FLAT) ConfigureAnnBench( - NAME FAISS_CPU_IVF_FLAT PATH bench/ann/src/faiss/faiss_cpu_benchmark.cpp LINKS + NAME FAISS_CPU_IVF_FLAT PATH src/faiss/faiss_cpu_benchmark.cpp LINKS ${CUVS_FAISS_TARGETS} ) endif() if(CUVS_ANN_BENCH_USE_FAISS_CPU_IVF_PQ) ConfigureAnnBench( - NAME FAISS_CPU_IVF_PQ PATH bench/ann/src/faiss/faiss_cpu_benchmark.cpp LINKS + NAME FAISS_CPU_IVF_PQ PATH src/faiss/faiss_cpu_benchmark.cpp LINKS ${CUVS_FAISS_TARGETS} ) endif() -if(CUVS_ANN_BENCH_USE_FAISS_GPU_IVF_FLAT) +if(CUVS_ANN_BENCH_USE_FAISS_GPU_IVF_FLAT AND CUVS_FAISS_ENABLE_GPU) ConfigureAnnBench( - NAME FAISS_GPU_IVF_FLAT PATH bench/ann/src/faiss/faiss_gpu_benchmark.cu LINKS + NAME FAISS_GPU_IVF_FLAT PATH src/faiss/faiss_gpu_benchmark.cu LINKS ${CUVS_FAISS_TARGETS} ) endif() -if(CUVS_ANN_BENCH_USE_FAISS_GPU_IVF_PQ) +if(CUVS_ANN_BENCH_USE_FAISS_GPU_IVF_PQ AND CUVS_FAISS_ENABLE_GPU) ConfigureAnnBench( - NAME FAISS_GPU_IVF_PQ PATH bench/ann/src/faiss/faiss_gpu_benchmark.cu LINKS + NAME FAISS_GPU_IVF_PQ PATH src/faiss/faiss_gpu_benchmark.cu LINKS ${CUVS_FAISS_TARGETS} ) endif() -if(CUVS_ANN_BENCH_USE_FAISS_GPU_FLAT) +if(CUVS_ANN_BENCH_USE_FAISS_GPU_FLAT AND CUVS_FAISS_ENABLE_GPU) ConfigureAnnBench( - NAME FAISS_GPU_FLAT PATH bench/ann/src/faiss/faiss_gpu_benchmark.cu LINKS ${CUVS_FAISS_TARGETS} + NAME FAISS_GPU_FLAT PATH src/faiss/faiss_gpu_benchmark.cu LINKS ${CUVS_FAISS_TARGETS} ) endif() if(CUVS_ANN_BENCH_USE_GGNN) - include(cmake/thirdparty/get_glog.cmake) + include(cmake/thirdparty/get_glog) ConfigureAnnBench( - NAME GGNN PATH bench/ann/src/ggnn/ggnn_benchmark.cu LINKS glog::glog ggnn::ggnn CUDA::curand + NAME GGNN PATH src/ggnn/ggnn_benchmark.cu LINKS glog::glog ggnn::ggnn CUDA::curand ) endif() # ################################################################################################## # * Dynamically-loading ANN_BENCH executable ------------------------------------------------------- if(CUVS_ANN_BENCH_SINGLE_EXE) - add_executable(ANN_BENCH bench/ann/src/common/benchmark.cpp) - - # Build and link static version of the GBench to keep ANN_BENCH self-contained. - get_target_property(TMP_PROP benchmark::benchmark SOURCES) - add_library(benchmark_static STATIC ${TMP_PROP}) - get_target_property(TMP_PROP benchmark::benchmark INCLUDE_DIRECTORIES) - target_include_directories(benchmark_static PUBLIC ${TMP_PROP}) - get_target_property(TMP_PROP benchmark::benchmark LINK_LIBRARIES) - target_link_libraries(benchmark_static PUBLIC ${TMP_PROP}) + add_executable(ANN_BENCH src/common/benchmark.cpp) target_include_directories(ANN_BENCH PRIVATE ${CMAKE_CUDA_TOOLKIT_INCLUDE_DIRECTORIES}) @@ -329,12 +306,10 @@ if(CUVS_ANN_BENCH_SINGLE_EXE) ANN_BENCH PRIVATE raft::raft nlohmann_json::nlohmann_json - benchmark_static + benchmark::benchmark dl - -static-libgcc fmt::fmt-header-only spdlog::spdlog_header_only - -static-libstdc++ $<$:CUDA::nvtx3> ) set_target_properties( diff --git a/cpp/cmake/patches/faiss_override.json b/cpp/cmake/patches/faiss_override.json new file mode 100644 index 000000000..c39abdc2b --- /dev/null +++ b/cpp/cmake/patches/faiss_override.json @@ -0,0 +1,9 @@ +{ + "packages" : { + "faiss" : { + "version": "1.7.4", + "git_url": "https://github.com/facebookresearch/faiss.git", + "git_tag": "main" + } + } + } \ No newline at end of file diff --git a/cpp/cmake/patches/ggnn_override.json b/cpp/cmake/patches/ggnn_override.json new file mode 100644 index 000000000..c9a1b6978 --- /dev/null +++ b/cpp/cmake/patches/ggnn_override.json @@ -0,0 +1,16 @@ +{ + "packages" : { + "ggnn" : { + "version": "0.5", + "git_url": "https://github.com/cgtuebingen/ggnn.git", + "git_tag": "release_${version}", + "patches" : [ + { + "file" : "${current_json_dir}/ggnn.diff", + "issue" : "Correct compilation issues", + "fixed_in" : "" + } + ] + } + } + } \ No newline at end of file diff --git a/cpp/cmake/patches/hnswlib_override.json b/cpp/cmake/patches/hnswlib_override.json new file mode 100644 index 000000000..aef2da772 --- /dev/null +++ b/cpp/cmake/patches/hnswlib_override.json @@ -0,0 +1,16 @@ +{ + "packages" : { + "hnswlib" : { + "version": "0.6.2", + "git_url": "https://github.com/nmslib/hnswlib.git", + "git_tag": "v${version}", + "patches" : [ + { + "file" : "${current_json_dir}/hnswlib.diff", + "issue" : "Correct compilation issues", + "fixed_in" : "" + } + ] + } + } + } \ No newline at end of file diff --git a/cpp/cmake/thirdparty/get_faiss.cmake b/cpp/cmake/thirdparty/get_faiss.cmake index 89446332d..d6261d248 100644 --- a/cpp/cmake/thirdparty/get_faiss.cmake +++ b/cpp/cmake/thirdparty/get_faiss.cmake @@ -15,95 +15,104 @@ #============================================================================= function(find_and_configure_faiss) - set(oneValueArgs VERSION REPOSITORY PINNED_TAG BUILD_STATIC_LIBS EXCLUDE_FROM_ALL ENABLE_GPU) - cmake_parse_arguments(PKG "${options}" "${oneValueArgs}" - "${multiValueArgs}" ${ARGN} ) + set(oneValueArgs VERSION REPOSITORY PINNED_TAG BUILD_STATIC_LIBS EXCLUDE_FROM_ALL ENABLE_GPU) + cmake_parse_arguments(PKG "${options}" "${oneValueArgs}" + "${multiValueArgs}" ${ARGN} ) + + rapids_find_generate_module(faiss + HEADER_NAMES faiss/IndexFlat.h + LIBRARY_NAMES faiss + ) + + set(patch_dir "${CMAKE_CURRENT_FUNCTION_LIST_DIR}/../patches") + rapids_cpm_package_override("${patch_dir}/faiss_override.json") + + include("${rapids-cmake-dir}/cpm/detail/package_details.cmake") + rapids_cpm_package_details(faiss version repository tag shallow exclude) + + include("${rapids-cmake-dir}/cpm/detail/generate_patch_command.cmake") + rapids_cpm_generate_patch_command(faiss ${version} patch_command) + + set(BUILD_SHARED_LIBS ON) + if (PKG_BUILD_STATIC_LIBS) + set(BUILD_SHARED_LIBS OFF) + set(CPM_DOWNLOAD_faiss ON) + endif() + + include(cmake/modules/FindAVX) + # Link against AVX CPU lib if it exists + set(CUVS_FAISS_OPT_LEVEL "generic") + if(CXX_AVX2_FOUND) + set(CUVS_FAISS_OPT_LEVEL "avx2") + endif() + + rapids_cpm_find(faiss ${version} + GLOBAL_TARGETS faiss faiss_avx2 faiss_gpu faiss::faiss faiss::faiss_avx2 + CPM_ARGS + GIT_REPOSITORY ${repository} + GIT_TAG ${tag} + GIT_SHALLOW ${shallow} ${patch_command} + EXCLUDE_FROM_ALL ${exclude} + OPTIONS + "FAISS_ENABLE_GPU ${PKG_ENABLE_GPU}" + "FAISS_ENABLE_PYTHON OFF" + "FAISS_OPT_LEVEL ${CUVS_FAISS_OPT_LEVEL}" + "FAISS_USE_CUDA_TOOLKIT_STATIC ${CUDA_STATIC_RUNTIME}" + "BUILD_TESTING OFF" + "CMAKE_MESSAGE_LOG_LEVEL VERBOSE" + ) + + + include("${rapids-cmake-dir}/cpm/detail/display_patch_status.cmake") + rapids_cpm_display_patch_status(faiss) + + if(TARGET faiss AND NOT TARGET faiss::faiss) + add_library(faiss::faiss ALIAS faiss) + # We need to ensure that faiss has all the conda information. So we use this approach so that + # faiss will have the conda includes/link dirs + target_link_libraries(faiss PRIVATE $) + endif() + if(TARGET faiss_avx2 AND NOT TARGET faiss::faiss_avx2) + add_library(faiss::faiss_avx2 ALIAS faiss_avx2) + # We need to ensure that faiss has all the conda information. So we use this approach so that + # faiss will have the conda includes/link dirs + target_link_libraries(faiss_avx2 PRIVATE $) + endif() + if(TARGET faiss_gpu AND NOT TARGET faiss::faiss_gpu) + add_library(faiss::faiss_gpu ALIAS faiss_gpu) + # We need to ensure that faiss has all the conda information. So we use this approach so that + # faiss will have the conda includes/link dirs + target_link_libraries(faiss_gpu PRIVATE $) + endif() + + if(faiss_ADDED) + rapids_export(BUILD faiss + EXPORT_SET faiss-targets + GLOBAL_TARGETS ${CUVS_FAISS_EXPORT_GLOBAL_TARGETS} + NAMESPACE faiss::) + endif() + + # Need to tell CMake to rescan the link group of faiss::faiss_gpu and faiss + # so that we get proper link order when they are static + # + # We don't look at the existence of `faiss_avx2` as it will always exist + # even when CXX_AVX2_FOUND is false. In addition for arm builds the + # faiss_avx2 is marked as `EXCLUDE_FROM_ALL` so we don't want to add + # a dependency to it. Adding a dependency will cause it to compile, + # and fail due to invalid compiler flags. + if(PKG_ENABLE_GPU AND PKG_BUILD_STATIC_LIBS AND CXX_AVX2_FOUND) + set(CUVS_FAISS_TARGETS "$,faiss::faiss_avx2>" PARENT_SCOPE) + elseif(PKG_ENABLE_GPU AND PKG_BUILD_STATIC_LIBS) + set(CUVS_FAISS_TARGETS "$,faiss::faiss>" PARENT_SCOPE) + elseif(CXX_AVX2_FOUND) + set(CUVS_FAISS_TARGETS faiss::faiss_avx2 PARENT_SCOPE) + else() + set(CUVS_FAISS_TARGETS faiss::faiss PARENT_SCOPE) + endif() - rapids_find_generate_module(faiss - HEADER_NAMES faiss/IndexFlat.h - LIBRARY_NAMES faiss - ) - - set(BUILD_SHARED_LIBS ON) - if (PKG_BUILD_STATIC_LIBS) - set(BUILD_SHARED_LIBS OFF) - set(CPM_DOWNLOAD_faiss ON) - endif() - - include(cmake/modules/FindAVX.cmake) - - # Link against AVX CPU lib if it exists - set(CUVS_FAISS_GLOBAL_TARGETS faiss::faiss) - set(CUVS_FAISS_EXPORT_GLOBAL_TARGETS faiss) - set(CUVS_FAISS_OPT_LEVEL "generic") - if(CXX_AVX_FOUND) - set(CUVS_FAISS_OPT_LEVEL "avx2") - list(APPEND CUVS_FAISS_GLOBAL_TARGETS faiss::faiss_avx2) - list(APPEND CUVS_FAISS_EXPORT_GLOBAL_TARGETS faiss_avx2) - endif() - - rapids_cpm_find(faiss ${PKG_VERSION} - GLOBAL_TARGETS ${CUVS_FAISS_GLOBAL_TARGETS} - CPM_ARGS - GIT_REPOSITORY ${PKG_REPOSITORY} - GIT_TAG ${PKG_PINNED_TAG} - EXCLUDE_FROM_ALL ${PKG_EXCLUDE_FROM_ALL} - OPTIONS - "FAISS_ENABLE_GPU ${PKG_ENABLE_GPU}" - "FAISS_ENABLE_PYTHON OFF" - "FAISS_OPT_LEVEL ${CUVS_FAISS_OPT_LEVEL}" - "FAISS_USE_CUDA_TOOLKIT_STATIC ${CUDA_STATIC_RUNTIME}" - "BUILD_TESTING OFF" - "CMAKE_MESSAGE_LOG_LEVEL VERBOSE" - ) - - if(TARGET faiss AND NOT TARGET faiss::faiss) - add_library(faiss::faiss ALIAS faiss) - endif() - - if(CXX_AVX_FOUND) - - if(TARGET faiss_avx2 AND NOT TARGET faiss::faiss_avx2) - add_library(faiss::faiss_avx2 ALIAS faiss_avx2) - endif() - endif() - - - if(faiss_ADDED) - rapids_export(BUILD faiss - EXPORT_SET faiss-targets - GLOBAL_TARGETS ${CUVS_FAISS_EXPORT_GLOBAL_TARGETS} - NAMESPACE faiss::) - endif() - - # We generate the faiss-config files when we built faiss locally, so always do `find_dependency` - rapids_export_package(BUILD OpenMP cuvs-ann-bench-exports) # faiss uses openMP but doesn't export a need for it - rapids_export_package(BUILD faiss cuvs-ann-bench-exports GLOBAL_TARGETS ${CUVS_FAISS_GLOBAL_TARGETS} ${CUVS_FAISS_EXPORT_GLOBAL_TARGETS}) - rapids_export_package(INSTALL faiss cuvs-ann-bench-exports GLOBAL_TARGETS ${CUVS_FAISS_GLOBAL_TARGETS} ${CUVS_FAISS_EXPORT_GLOBAL_TARGETS}) - - # Tell cmake where it can find the generated faiss-config.cmake we wrote. - include("${rapids-cmake-dir}/export/find_package_root.cmake") - rapids_export_find_package_root(BUILD faiss [=[${CMAKE_CURRENT_LIST_DIR}]=] - EXPORT_SET cuvs-ann-bench-exports) endfunction() -if(NOT CUVS_FAISS_GIT_TAG) - # TODO: Remove this once faiss supports FAISS_USE_CUDA_TOOLKIT_STATIC - # (https://github.com/facebookresearch/faiss/pull/2446) - set(CUVS_FAISS_GIT_TAG fea/statically-link-ctk) - # set(CUVS_FAISS_GIT_TAG bde7c0027191f29c9dadafe4f6e68ca0ee31fb30) -endif() - -if(NOT CUVS_FAISS_GIT_REPOSITORY) - # TODO: Remove this once faiss supports FAISS_USE_CUDA_TOOLKIT_STATIC - # (https://github.com/facebookresearch/faiss/pull/2446) - set(CUVS_FAISS_GIT_REPOSITORY https://github.com/cjnolet/faiss.git) - # set(CUVS_FAISS_GIT_REPOSITORY https://github.com/facebookresearch/faiss.git) -endif() - -find_and_configure_faiss(VERSION 1.7.4 - REPOSITORY ${CUVS_FAISS_GIT_REPOSITORY} - PINNED_TAG ${CUVS_FAISS_GIT_TAG} - BUILD_STATIC_LIBS ${CUVS_USE_FAISS_STATIC} - EXCLUDE_FROM_ALL ${CUVS_EXCLUDE_FAISS_FROM_ALL} - ENABLE_GPU ${CUVS_FAISS_ENABLE_GPU}) +find_and_configure_faiss( + BUILD_STATIC_LIBS ${CUVS_USE_FAISS_STATIC} + ENABLE_GPU ${CUVS_FAISS_ENABLE_GPU} +) diff --git a/cpp/cmake/thirdparty/get_ggnn.cmake b/cpp/cmake/thirdparty/get_ggnn.cmake index 8137ef84e..2ccfbc64d 100644 --- a/cpp/cmake/thirdparty/get_ggnn.cmake +++ b/cpp/cmake/thirdparty/get_ggnn.cmake @@ -15,29 +15,30 @@ #============================================================================= function(find_and_configure_ggnn) - set(oneValueArgs VERSION REPOSITORY PINNED_TAG) - cmake_parse_arguments(PKG "${options}" "${oneValueArgs}" - "${multiValueArgs}" ${ARGN} ) + include(${rapids-cmake-dir}/cpm/package_override.cmake) + set(patch_dir "${CMAKE_CURRENT_FUNCTION_LIST_DIR}/../patches") + rapids_cpm_package_override("${patch_dir}/ggnn_override.json") - set(patch_files_to_run "${CMAKE_CURRENT_SOURCE_DIR}/cmake/patches/ggnn.diff") - set(patch_issues_to_ref "fix compile issues") - set(patch_script "${CMAKE_BINARY_DIR}/rapids-cmake/patches/ggnn/patch.cmake") - set(log_file "${CMAKE_BINARY_DIR}/rapids-cmake/patches/ggnn/log") - string(TIMESTAMP current_year "%Y" UTC) - configure_file(${rapids-cmake-dir}/cpm/patches/command_template.cmake.in "${patch_script}" - @ONLY) + include("${rapids-cmake-dir}/cpm/detail/package_details.cmake") + rapids_cpm_package_details(ggnn version repository tag shallow exclude) + + include("${rapids-cmake-dir}/cpm/detail/generate_patch_command.cmake") + rapids_cpm_generate_patch_command(ggnn ${version} patch_command) rapids_cpm_find( - ggnn ${PKG_VERSION} + ggnn ${version} GLOBAL_TARGETS ggnn::ggnn CPM_ARGS - GIT_REPOSITORY ${PKG_REPOSITORY} - GIT_TAG ${PKG_PINNED_TAG} - GIT_SHALLOW TRUE + GIT_REPOSITORY ${repository} + GIT_TAG ${tag} + GIT_SHALLOW ${shallow} ${patch_command} DOWNLOAD_ONLY ON - PATCH_COMMAND ${CMAKE_COMMAND} -P ${patch_script} ) + + include("${rapids-cmake-dir}/cpm/detail/display_patch_status.cmake") + rapids_cpm_display_patch_status(ggnn) + if(NOT TARGET ggnn::ggnn) add_library(ggnn INTERFACE) target_include_directories(ggnn INTERFACE "$") @@ -45,14 +46,4 @@ function(find_and_configure_ggnn) endif() endfunction() -if(NOT RAFT_GGNN_GIT_TAG) - set(RAFT_GGNN_GIT_TAG release_0.5) -endif() - -if(NOT RAFT_GGNN_GIT_REPOSITORY) - set(RAFT_GGNN_GIT_REPOSITORY https://github.com/cgtuebingen/ggnn.git) -endif() -find_and_configure_ggnn(VERSION 0.5 - REPOSITORY ${RAFT_GGNN_GIT_REPOSITORY} - PINNED_TAG ${RAFT_GGNN_GIT_TAG} - ) +find_and_configure_ggnn() diff --git a/cpp/cmake/thirdparty/get_hnswlib.cmake b/cpp/cmake/thirdparty/get_hnswlib.cmake index 054a12f1e..2e6c895e5 100644 --- a/cpp/cmake/thirdparty/get_hnswlib.cmake +++ b/cpp/cmake/thirdparty/get_hnswlib.cmake @@ -15,78 +15,74 @@ #============================================================================= function(find_and_configure_hnswlib) - set(oneValueArgs VERSION REPOSITORY PINNED_TAG EXCLUDE_FROM_ALL) - cmake_parse_arguments(PKG "${options}" "${oneValueArgs}" - "${multiValueArgs}" ${ARGN} ) + set(oneValueArgs) - set(patch_files_to_run "${CMAKE_CURRENT_SOURCE_DIR}/cmake/patches/hnswlib.diff") - set(patch_issues_to_ref "fix compile issues") - set(patch_script "${CMAKE_BINARY_DIR}/rapids-cmake/patches/hnswlib/patch.cmake") - set(log_file "${CMAKE_BINARY_DIR}/rapids-cmake/patches/hnswlib/log") - string(TIMESTAMP current_year "%Y" UTC) - configure_file(${rapids-cmake-dir}/cpm/patches/command_template.cmake.in "${patch_script}" - @ONLY) + include(${rapids-cmake-dir}/cpm/package_override.cmake) + set(patch_dir "${CMAKE_CURRENT_FUNCTION_LIST_DIR}/../patches") + rapids_cpm_package_override("${patch_dir}/hnswlib_override.json") + + include("${rapids-cmake-dir}/cpm/detail/package_details.cmake") + rapids_cpm_package_details(hnswlib version repository tag shallow exclude) + + include("${rapids-cmake-dir}/cpm/detail/generate_patch_command.cmake") + rapids_cpm_generate_patch_command(hnswlib ${version} patch_command) rapids_cpm_find( - hnswlib ${PKG_VERSION} - GLOBAL_TARGETS hnswlib::hnswlib - BUILD_EXPORT_SET raft-exports - INSTALL_EXPORT_SET raft-exports + hnswlib ${version} + GLOBAL_TARGETS hnswlib hnswlib::hnswlib CPM_ARGS - GIT_REPOSITORY ${PKG_REPOSITORY} - GIT_TAG ${PKG_PINNED_TAG} - GIT_SHALLOW TRUE + GIT_REPOSITORY ${repository} + GIT_TAG ${tag} + GIT_SHALLOW ${shallow} ${patch_command} + EXCLUDE_FROM_ALL ${exclude} DOWNLOAD_ONLY ON - PATCH_COMMAND ${CMAKE_COMMAND} -P ${patch_script} ) + + include("${rapids-cmake-dir}/cpm/detail/display_patch_status.cmake") + rapids_cpm_display_patch_status(hnswlib) + if(NOT TARGET hnswlib::hnswlib) add_library(hnswlib INTERFACE ) add_library(hnswlib::hnswlib ALIAS hnswlib) target_include_directories(hnswlib INTERFACE "$" "$") + endif() - if(NOT PKG_EXCLUDE_FROM_ALL) - install(TARGETS hnswlib EXPORT hnswlib-exports) + if(hnswlib_ADDED) + # write build export rules + install(TARGETS hnswlib EXPORT hnswlib-exports) + if(NOT exclude) install(DIRECTORY "${hnswlib_SOURCE_DIR}/hnswlib/" DESTINATION include/hnswlib) # write install export rules rapids_export( INSTALL hnswlib - VERSION ${PKG_VERSION} + VERSION ${version} EXPORT_SET hnswlib-exports GLOBAL_TARGETS hnswlib NAMESPACE hnswlib::) endif() - # write build export rules rapids_export( BUILD hnswlib - VERSION ${PKG_VERSION} + VERSION ${version} EXPORT_SET hnswlib-exports GLOBAL_TARGETS hnswlib NAMESPACE hnswlib::) - include("${rapids-cmake-dir}/export/find_package_root.cmake") + include("${rapids-cmake-dir}/export/package.cmake") + rapids_export_package(INSTALL hnswlib cuvs-exports VERSION ${version} GLOBAL_TARGETS hnswlib hnswlib::hnswlib) + rapids_export_package(BUILD hnswlib cuvs-exports VERSION ${version} GLOBAL_TARGETS hnswlib hnswlib::hnswlib) + - # When using RAFT from the build dir, ensure hnswlib is also found in RAFT's build dir. This - # line adds `set(hnswlib_ROOT "${CMAKE_CURRENT_LIST_DIR}")` to build/raft-dependencies.cmake + # When using cuVS from the build dir, ensure hnswlib is also found in cuVS' build dir. This + # line adds `set(hnswlib_ROOT "${CMAKE_CURRENT_LIST_DIR}")` to build/cuvs-dependencies.cmake + include("${rapids-cmake-dir}/export/find_package_root.cmake") rapids_export_find_package_root( - BUILD hnswlib [=[${CMAKE_CURRENT_LIST_DIR}]=] EXPORT_SET raft-exports + BUILD hnswlib [=[${CMAKE_CURRENT_LIST_DIR}]=] EXPORT_SET cuvs-exports ) endif() endfunction() - -if(NOT CUVS_HNSWLIB_GIT_TAG) - set(CUVS_HNSWLIB_GIT_TAG v0.6.2) -endif() - -if(NOT CUVS_HNSWLIB_GIT_REPOSITORY) - set(CUVS_HNSWLIB_GIT_REPOSITORY https://github.com/nmslib/hnswlib.git) -endif() -find_and_configure_hnswlib(VERSION 0.6.2 - REPOSITORY ${CUVS_HNSWLIB_GIT_REPOSITORY} - PINNED_TAG ${CUVS_HNSWLIB_GIT_TAG} - EXCLUDE_FROM_ALL OFF - ) +find_and_configure_hnswlib() diff --git a/cpp/test/CMakeLists.txt b/cpp/test/CMakeLists.txt index 7921fffd3..3495b2344 100644 --- a/cpp/test/CMakeLists.txt +++ b/cpp/test/CMakeLists.txt @@ -91,22 +91,22 @@ endfunction() if(BUILD_TESTS) ConfigureTest( - NAME NEIGHBORS_TEST PATH test/neighbors/brute_force.cu - test/neighbors/brute_force_prefiltered.cu test/neighbors/refine.cu GPUS 1 PERCENT 100 + NAME NEIGHBORS_TEST PATH neighbors/brute_force.cu + neighbors/brute_force_prefiltered.cu neighbors/refine.cu GPUS 1 PERCENT 100 ) ConfigureTest( - NAME CLUSTER_TEST PATH test/cluster/kmeans.cu test/cluster/kmeans_balanced.cu - test/cluster/kmeans_find_k.cu test/cluster/linkage.cu GPUS 1 PERCENT 100 + NAME CLUSTER_TEST PATH cluster/kmeans.cu cluster/kmeans_balanced.cu + cluster/kmeans_find_k.cu cluster/linkage.cu GPUS 1 PERCENT 100 ) ConfigureTest( NAME NEIGHBORS_ANN_IVF_FLAT_TEST PATH - test/neighbors/ann_ivf_flat/test_float_int64_t.cu - test/neighbors/ann_ivf_flat/test_int8_t_int64_t.cu - test/neighbors/ann_ivf_flat/test_uint8_t_int64_t.cu + neighbors/ann_ivf_flat/test_float_int64_t.cu + neighbors/ann_ivf_flat/test_int8_t_int64_t.cu + neighbors/ann_ivf_flat/test_uint8_t_int64_t.cu GPUS 1 PERCENT @@ -117,9 +117,9 @@ if(BUILD_TESTS) NAME NEIGHBORS_ANN_IVF_PQ_TEST PATH - test/neighbors/ann_ivf_pq/test_float_int64_t.cu - test/neighbors/ann_ivf_pq/test_int8_t_int64_t.cu - test/neighbors/ann_ivf_pq/test_uint8_t_int64_t.cu + neighbors/ann_ivf_pq/test_float_int64_t.cu + neighbors/ann_ivf_pq/test_int8_t_int64_t.cu + neighbors/ann_ivf_pq/test_uint8_t_int64_t.cu GPUS 1 PERCENT @@ -130,9 +130,9 @@ if(BUILD_TESTS) NAME NEIGHBORS_ANN_CAGRA_TEST PATH - test/neighbors/ann_cagra/test_float_uint32_t.cu - test/neighbors/ann_cagra/test_int8_t_uint32_t.cu - test/neighbors/ann_cagra/test_uint8_t_uint32_t.cu + neighbors/ann_cagra/test_float_uint32_t.cu + neighbors/ann_cagra/test_int8_t_uint32_t.cu + neighbors/ann_cagra/test_uint8_t_uint32_t.cu GPUS 1 PERCENT @@ -143,9 +143,9 @@ if(BUILD_TESTS) NAME NEIGHBORS_ANN_NN_DESCENT_TEST PATH - test/neighbors/ann_nn_descent/test_float_uint32_t.cu - test/neighbors/ann_nn_descent/test_int8_t_uint32_t.cu - test/neighbors/ann_nn_descent/test_uint8_t_uint32_t.cu + neighbors/ann_nn_descent/test_float_uint32_t.cu + neighbors/ann_nn_descent/test_int8_t_uint32_t.cu + neighbors/ann_nn_descent/test_uint8_t_uint32_t.cu GPUS 1 PERCENT @@ -153,29 +153,29 @@ if(BUILD_TESTS) ) if(BUILD_CAGRA_HNSWLIB) - ConfigureTest(NAME NEIGHBORS_HNSW_TEST PATH test/neighbors/hnsw.cu GPUS 1 PERCENT 100) + ConfigureTest(NAME NEIGHBORS_HNSW_TEST PATH neighbors/hnsw.cu GPUS 1 PERCENT 100) endif() ConfigureTest( NAME DISTANCE_TEST PATH - test/distance/dist_canberra.cu - test/distance/dist_correlation.cu - test/distance/dist_cos.cu - test/distance/dist_hamming.cu - test/distance/dist_hellinger.cu - test/distance/dist_inner_product.cu - test/distance/dist_jensen_shannon.cu - test/distance/dist_kl_divergence.cu - test/distance/dist_l1.cu - test/distance/dist_l2_exp.cu - test/distance/dist_l2_sqrt_exp.cu - test/distance/dist_l_inf.cu - test/distance/dist_lp_unexp.cu - test/distance/dist_russell_rao.cu - test/distance/masked_nn.cu - test/sparse/neighbors/cross_component_nn.cu + distance/dist_canberra.cu + distance/dist_correlation.cu + distance/dist_cos.cu + distance/dist_hamming.cu + distance/dist_hellinger.cu + distance/dist_inner_product.cu + distance/dist_jensen_shannon.cu + distance/dist_kl_divergence.cu + distance/dist_l1.cu + distance/dist_l2_exp.cu + distance/dist_l2_sqrt_exp.cu + distance/dist_l_inf.cu + distance/dist_lp_unexp.cu + distance/dist_russell_rao.cu + distance/masked_nn.cu + sparse/neighbors/cross_component_nn.cu GPUS 1 PERCENT @@ -184,27 +184,27 @@ if(BUILD_TESTS) endif() if(BUILD_C_TESTS) - ConfigureTest(NAME INTEROP_TEST PATH test/core/interop.cu C_LIB) + ConfigureTest(NAME INTEROP_TEST PATH core/interop.cu C_LIB) ConfigureTest( - NAME DISTANCE_C_TEST PATH test/distance/run_pairwise_distance_c.c - test/distance/pairwise_distance_c.cu C_LIB + NAME DISTANCE_C_TEST PATH distance/run_pairwise_distance_c.c + distance/pairwise_distance_c.cu C_LIB ) ConfigureTest( - NAME BRUTEFORCE_C_TEST PATH test/neighbors/run_brute_force_c.c test/neighbors/brute_force_c.cu + NAME BRUTEFORCE_C_TEST PATH neighbors/run_brute_force_c.c neighbors/brute_force_c.cu C_LIB ) ConfigureTest( - NAME IVF_FLAT_C_TEST PATH test/neighbors/run_ivf_flat_c.c test/neighbors/ann_ivf_flat_c.cu + NAME IVF_FLAT_C_TEST PATH neighbors/run_ivf_flat_c.c neighbors/ann_ivf_flat_c.cu C_LIB ) ConfigureTest( - NAME IVF_PQ_C_TEST PATH test/neighbors/run_ivf_pq_c.c test/neighbors/ann_ivf_pq_c.cu C_LIB + NAME IVF_PQ_C_TEST PATH neighbors/run_ivf_pq_c.c neighbors/ann_ivf_pq_c.cu C_LIB ) - ConfigureTest(NAME CAGRA_C_TEST PATH test/neighbors/ann_cagra_c.cu C_LIB) + ConfigureTest(NAME CAGRA_C_TEST PATH neighbors/ann_cagra_c.cu C_LIB) endif() # ################################################################################################## @@ -215,9 +215,9 @@ rapids_test_install_relocatable(INSTALL_COMPONENT_SET testing DESTINATION bin/gt if(BUILD_C_TESTS) enable_language(C) - add_executable(cuvs_c_test test/core/c_api.c) + add_executable(cuvs_c_test core/c_api.c) target_link_libraries(cuvs_c_test PUBLIC cuvs::c_api) - add_executable(cuvs_c_neighbors_test test/neighbors/c_api.c) + add_executable(cuvs_c_neighbors_test neighbors/c_api.c) target_link_libraries(cuvs_c_neighbors_test PUBLIC cuvs::c_api) endif() From 98c07f90a30c04b8bd6a90e7a6535a19c9ab9731 Mon Sep 17 00:00:00 2001 From: "Artem M. Chirkin" <9253178+achirkin@users.noreply.github.com> Date: Mon, 29 Jul 2024 12:58:39 +0200 Subject: [PATCH 2/2] Add more info to ANN_BENCH context (#248) Add extra information to benchmark context for better reproducibility and performance analysis: 1. Full command line used to call the executable (so you can copy-paste and run again). 2. More CUDA device information: whether HMM, AST, or host atomics are available (how GPU can efficiently communicate with CPU). 3. Host information: min/max frequences, used virtual processors and cores, available physical memory and swap (does the benchmark segfault due to not enough host memory? is SMT enabled? etc). Addresses parts of https://github.com/rapidsai/cuvs/issues/160 Authors: - Artem M. Chirkin (https://github.com/achirkin) Approvers: - Tamas Bela Feher (https://github.com/tfeher) URL: https://github.com/rapidsai/cuvs/pull/248 --- cpp/bench/ann/src/common/benchmark.hpp | 24 +++++++-- cpp/bench/ann/src/common/util.hpp | 72 ++++++++++++++++++++++++++ 2 files changed, 91 insertions(+), 5 deletions(-) diff --git a/cpp/bench/ann/src/common/benchmark.hpp b/cpp/bench/ann/src/common/benchmark.hpp index e6462c157..5d7b8934f 100644 --- a/cpp/bench/ann/src/common/benchmark.hpp +++ b/cpp/bench/ann/src/common/benchmark.hpp @@ -461,7 +461,8 @@ void register_search(std::shared_ptr> dataset, } template -void dispatch_benchmark(const configuration& conf, +void dispatch_benchmark(std::string cmdline, + const configuration& conf, bool force_overwrite, bool build_mode, bool search_mode, @@ -471,6 +472,10 @@ void dispatch_benchmark(const configuration& conf, Mode metric_objective, const std::vector& threads) { + ::benchmark::AddCustomContext("command_line", cmdline); + for (auto [key, value] : host_info()) { + ::benchmark::AddCustomContext(key, value); + } if (cudart.found()) { for (auto [key, value] : cuda_info()) { ::benchmark::AddCustomContext(key, value); @@ -586,6 +591,11 @@ inline auto run_main(int argc, char** argv) -> int printf_usage(); return -1; } + // Save command line for reproducibility. + std::string cmdline(argv[0]); + for (int i = 1; i < argc; i++) { + cmdline += " " + std::string(argv[i]); + } char* conf_path = argv[--argc]; std::ifstream conf_stream(conf_path); @@ -667,7 +677,8 @@ inline auto run_main(int argc, char** argv) -> int std::string dtype = conf.get_dataset_conf().dtype; if (dtype == "float") { - dispatch_benchmark(conf, + dispatch_benchmark(cmdline, + conf, force_overwrite, build_mode, search_mode, @@ -677,7 +688,8 @@ inline auto run_main(int argc, char** argv) -> int metric_objective, threads); // } else if (dtype == "half") { - // dispatch_benchmark(conf, + // dispatch_benchmark(cmdline + // conf, // force_overwrite, // build_mode, // search_mode, @@ -687,7 +699,8 @@ inline auto run_main(int argc, char** argv) -> int // metric_objective, // threads); } else if (dtype == "uint8") { - dispatch_benchmark(conf, + dispatch_benchmark(cmdline, + conf, force_overwrite, build_mode, search_mode, @@ -697,7 +710,8 @@ inline auto run_main(int argc, char** argv) -> int metric_objective, threads); } else if (dtype == "int8") { - dispatch_benchmark(conf, + dispatch_benchmark(cmdline, + conf, force_overwrite, build_mode, search_mode, diff --git a/cpp/bench/ann/src/common/util.hpp b/cpp/bench/ann/src/common/util.hpp index 490b0326e..e01e3847b 100644 --- a/cpp/bench/ann/src/common/util.hpp +++ b/cpp/bench/ann/src/common/util.hpp @@ -22,8 +22,11 @@ #include #endif +#include // sched_getaffinity #include +#include #include +#include #include #include @@ -32,9 +35,11 @@ #include #include #include +#include #include #include #include +#include #include #include #include @@ -293,6 +298,64 @@ inline void reset_global_device_resources() #endif } +inline auto host_info() +{ + std::vector> props; + + // Memory info + auto page_size = sysconf(_SC_PAGE_SIZE); + props.emplace_back("host_pagesize", std::to_string(page_size)); + + struct sysinfo sys_info; + if (sysinfo(&sys_info) != -1) { + props.emplace_back("host_total_ram_size", + std::to_string(size_t(sys_info.totalram) * size_t(sys_info.mem_unit))); + props.emplace_back("host_total_swap_size", + std::to_string(size_t(sys_info.totalswap) * size_t(sys_info.mem_unit))); + } + + // CPU info + int host_processors_configured = sysconf(_SC_NPROCESSORS_CONF); + props.emplace_back("host_processors_sysconf", std::to_string(host_processors_configured)); + std::vector affinity_mask_buf(CPU_ALLOC_SIZE(host_processors_configured)); + cpu_set_t* affinity_mask = reinterpret_cast(affinity_mask_buf.data()); + sched_getaffinity(0, affinity_mask_buf.size(), affinity_mask); + uint64_t cpu_freq_min = 0; + uint64_t cpu_freq_max = 0; + int host_processors_used = 0; + int host_cores_used = 0; + std::set host_cores_selected{}; + for (int cpu_id = 0; cpu_id < host_processors_configured; cpu_id++) { + if (CPU_ISSET_S(cpu_id, affinity_mask_buf.size(), affinity_mask) == 0) { continue; } + host_processors_used++; + std::string cpu_fpath = "/sys/devices/system/cpu/cpu" + std::to_string(cpu_id); + if (!std::filesystem::exists(cpu_fpath)) { continue; } + + int this_cpu_core = 0; + uint64_t this_cpu_freq_min = 0; + uint64_t this_cpu_freq_max = 0; + std::ifstream(cpu_fpath + "/topology/core_id") >> this_cpu_core; + std::ifstream(cpu_fpath + "/cpufreq/scaling_min_freq") >> this_cpu_freq_min; + std::ifstream(cpu_fpath + "/cpufreq/scaling_max_freq") >> this_cpu_freq_max; + host_cores_selected.insert(this_cpu_core); + cpu_freq_min = cpu_freq_min == 0 + ? (this_cpu_freq_min * 1000ull) + : std::min(this_cpu_freq_min * 1000ull, cpu_freq_min); + cpu_freq_max = std::max(this_cpu_freq_max * 1000ull, cpu_freq_max); + } + host_cores_used = host_cores_selected.size(); + if (host_processors_used != 0) { + props.emplace_back("host_processors_used", std::to_string(host_processors_used)); + } + if (host_cores_used != 0) { + props.emplace_back("host_cores_used", std::to_string(host_cores_used)); + } + if (cpu_freq_min != 0) { props.emplace_back("host_cpu_freq_min", std::to_string(cpu_freq_min)); } + if (cpu_freq_max != 0) { props.emplace_back("host_cpu_freq_max", std::to_string(cpu_freq_max)); } + + return props; +} + inline auto cuda_info() { std::vector> props; @@ -315,6 +378,15 @@ inline auto cuda_info() std::to_string(driver / 1000) + "." + std::to_string((driver % 100) / 10)); props.emplace_back("gpu_runtime_version", std::to_string(runtime / 1000) + "." + std::to_string((runtime % 100) / 10)); + props.emplace_back("gpu_hostNativeAtomicSupported", + std::to_string(device_prop.hostNativeAtomicSupported)); + props.emplace_back("gpu_pageableMemoryAccess", std::to_string(device_prop.pageableMemoryAccess)); + props.emplace_back("gpu_pageableMemoryAccessUsesHostPageTables", + std::to_string(device_prop.pageableMemoryAccessUsesHostPageTables)); +#if defined(CUDART_VERSION) && CUDART_VERSION >= 12000 + props.emplace_back("gpu_gpuDirectRDMASupported", + std::to_string(device_prop.gpuDirectRDMASupported)); +#endif #endif return props; }