From 49970f4e81fe5703329245080dbda76da4da4887 Mon Sep 17 00:00:00 2001 From: Ben Frederickson Date: Wed, 13 Dec 2023 12:47:25 -0800 Subject: [PATCH 1/8] Benchmark brute force knn Add our bfknn code to the raft-ann-bench project --- cpp/bench/ann/CMakeLists.txt | 5 +- .../src/raft/raft_ann_bench_param_parser.h | 2 +- cpp/bench/ann/src/raft/raft_benchmark.cu | 9 ++- cpp/bench/ann/src/raft/raft_wrapper.h | 71 +++++++++---------- 4 files changed, 42 insertions(+), 45 deletions(-) diff --git a/cpp/bench/ann/CMakeLists.txt b/cpp/bench/ann/CMakeLists.txt index 5919de07e7..1f6d8e3e3a 100644 --- a/cpp/bench/ann/CMakeLists.txt +++ b/cpp/bench/ann/CMakeLists.txt @@ -18,9 +18,6 @@ option(RAFT_ANN_BENCH_USE_FAISS_GPU_FLAT "Include faiss' brute-force knn algorithm in benchmark" ON) option(RAFT_ANN_BENCH_USE_FAISS_GPU_IVF_FLAT "Include faiss' ivf flat algorithm in benchmark" ON) option(RAFT_ANN_BENCH_USE_FAISS_GPU_IVF_PQ "Include faiss' ivf pq algorithm in benchmark" ON) -option(RAFT_ANN_BENCH_USE_FAISS_CPU_FLAT - "Include faiss' cpu brute-force knn algorithm in benchmark" ON -) option(RAFT_ANN_BENCH_USE_FAISS_CPU_FLAT "Include faiss' cpu brute-force algorithm in benchmark" ON) option(RAFT_ANN_BENCH_USE_FAISS_CPU_IVF_FLAT "Include faiss' cpu ivf flat algorithm in benchmark" @@ -30,6 +27,7 @@ option(RAFT_ANN_BENCH_USE_FAISS_CPU_IVF_PQ "Include faiss' cpu ivf pq algorithm option(RAFT_ANN_BENCH_USE_RAFT_IVF_FLAT "Include raft's ivf flat algorithm in benchmark" ON) option(RAFT_ANN_BENCH_USE_RAFT_IVF_PQ "Include raft's ivf pq algorithm in benchmark" ON) option(RAFT_ANN_BENCH_USE_RAFT_CAGRA "Include raft's CAGRA in benchmark" ON) +option(RAFT_ANN_BENCH_USE_RAFT_BRUTE_FORCE "Include raft's brute force knn in benchmark" ON) option(RAFT_ANN_BENCH_USE_RAFT_CAGRA_HNSWLIB "Include raft's CAGRA in benchmark" ON) option(RAFT_ANN_BENCH_USE_HNSWLIB "Include hnsw algorithm in benchmark" ON) option(RAFT_ANN_BENCH_USE_GGNN "Include ggnn algorithm in benchmark" ON) @@ -55,6 +53,7 @@ if(BUILD_CPU_ONLY) set(RAFT_ANN_BENCH_USE_RAFT_IVF_FLAT OFF) set(RAFT_ANN_BENCH_USE_RAFT_IVF_PQ OFF) set(RAFT_ANN_BENCH_USE_RAFT_CAGRA OFF) + set(RAFT_ANN_BENCH_USE_RAFT_CAGRA OFF) set(RAFT_ANN_BENCH_USE_RAFT_CAGRA_HNSWLIB OFF) set(RAFT_ANN_BENCH_USE_GGNN OFF) else() diff --git a/cpp/bench/ann/src/raft/raft_ann_bench_param_parser.h b/cpp/bench/ann/src/raft/raft_ann_bench_param_parser.h index 1eb0e53cc5..2a021a8a12 100644 --- a/cpp/bench/ann/src/raft/raft_ann_bench_param_parser.h +++ b/cpp/bench/ann/src/raft/raft_ann_bench_param_parser.h @@ -20,7 +20,7 @@ #include #undef WARP_SIZE -#ifdef RAFT_ANN_BENCH_USE_RAFT_BFKNN +#ifdef RAFT_ANN_BENCH_USE_RAFT_BRUTE_FORCE #include "raft_wrapper.h" #endif #ifdef RAFT_ANN_BENCH_USE_RAFT_IVF_FLAT diff --git a/cpp/bench/ann/src/raft/raft_benchmark.cu b/cpp/bench/ann/src/raft/raft_benchmark.cu index f8c65a2d6e..625451d17e 100644 --- a/cpp/bench/ann/src/raft/raft_benchmark.cu +++ b/cpp/bench/ann/src/raft/raft_benchmark.cu @@ -22,6 +22,7 @@ #include #include #include +#include #include #include #include @@ -47,8 +48,10 @@ std::unique_ptr> create_algo(const std::string& algo, std::unique_ptr> ann; if constexpr (std::is_same_v) { -#ifdef RAFT_ANN_BENCH_USE_RAFT_BFKNN - if (algo == "raft_bfknn") { ann = std::make_unique>(metric, dim); } +#ifdef RAFT_ANN_BENCH_USE_RAFT_BRUTE_FORCE + if (algo == "raft_brute_force") { + ann = std::make_unique>(metric, dim); + } #endif } @@ -85,7 +88,7 @@ template std::unique_ptr::AnnSearchParam> create_search_param( const std::string& algo, const nlohmann::json& conf) { -#ifdef RAFT_ANN_BENCH_USE_RAFT_BFKNN +#ifdef RAFT_ANN_BENCH_USE_RAFT_BRUTE_FORCE if (algo == "raft_brute_force") { auto param = std::make_unique::AnnSearchParam>(); return param; diff --git a/cpp/bench/ann/src/raft/raft_wrapper.h b/cpp/bench/ann/src/raft/raft_wrapper.h index 499bdf29a1..a408d979e5 100644 --- a/cpp/bench/ann/src/raft/raft_wrapper.h +++ b/cpp/bench/ann/src/raft/raft_wrapper.h @@ -17,9 +17,11 @@ #include #include +#include #include #include -#include +#include +#include #include #include #include @@ -30,20 +32,16 @@ namespace raft_temp { inline raft::distance::DistanceType parse_metric_type(raft::bench::ann::Metric metric) { - if (metric == raft::bench::ann::Metric::kInnerProduct) { - return raft::distance::DistanceType::InnerProduct; - } else if (metric == raft::bench::ann::Metric::kEuclidean) { - return raft::distance::DistanceType::L2Expanded; - } else { - throw std::runtime_error("raft supports only metric type of inner product and L2"); + switch (metric) { + case raft::bench::ann::Metric::kInnerProduct: return raft::distance::DistanceType::InnerProduct; + case raft::bench::ann::Metric::kEuclidean: return raft::distance::DistanceType::L2Expanded; } } - } // namespace raft_temp namespace raft::bench::ann { -// brute force fused L2 KNN - RAFT +// brute force KNN - RAFT template class RaftGpu : public ANN { public: @@ -74,9 +72,11 @@ class RaftGpu : public ANN { } void set_search_dataset(const T* dataset, size_t nrow) override; void save(const std::string& file) const override; - void load(const std::string&) override { return; }; + void load(const std::string&) override; protected: + raft::device_resources handle_; + std::optional> index_; raft::distance::DistanceType metric_type_; int device_; const T* dataset_; @@ -85,17 +85,18 @@ class RaftGpu : public ANN { template RaftGpu::RaftGpu(Metric metric, int dim) - : ANN(metric, dim), metric_type_(raft_temp::parse_metric_type(metric)) + : ANN(metric, dim), + metric_type_(raft_temp::parse_metric_type(metric)), + handle_(cudaStreamPerThread) { - static_assert(std::is_same_v, "raft support only float type"); - assert(metric_type_ == raft::distance::DistanceType::L2Expanded); RAFT_CUDA_TRY(cudaGetDevice(&device_)); } template -void RaftGpu::build(const T*, size_t, cudaStream_t) +void RaftGpu::build(const T* dataset, size_t nrow, cudaStream_t) { - // as this is brute force algo so no index building required + auto dataset_view = raft::make_host_matrix_view(dataset, nrow, this->dim_); + index_.emplace(raft::neighbors::brute_force::build(handle_, dataset_view)); return; } @@ -115,15 +116,13 @@ void RaftGpu::set_search_dataset(const T* dataset, size_t nrow) template void RaftGpu::save(const std::string& file) const { - // create a empty index file as no index to store. - std::fstream fp; - fp.open(file.c_str(), std::ios::out); - if (!fp) { - printf("Error in creating file!!!\n"); - ; - return; - } - fp.close(); + raft::neighbors::brute_force::serialize(handle_, file, *index_); +} + +template +void RaftGpu::load(const std::string& file) +{ + index_ = raft::neighbors::brute_force::deserialize(handle_, file); } template @@ -134,20 +133,16 @@ void RaftGpu::search(const T* queries, float* distances, cudaStream_t stream) const { - // TODO: Integrate new `raft::brute_force::index` (from - // https://github.com/rapidsai/raft/pull/1817) - raft::spatial::knn::detail::fusedL2Knn(this->dim_, - reinterpret_cast(neighbors), - distances, - dataset_, - queries, - nrow_, - static_cast(batch_size), - k, - true, - true, - stream, - metric_type_); + auto queries_view = + raft::make_device_matrix_view(queries, batch_size, this->dim_); + + auto neighbors_view = raft::make_device_matrix_view(neighbors, batch_size, k); + auto distances_view = raft::make_device_matrix_view(distances, batch_size, k); + + raft::neighbors::brute_force::search( + handle_, *index_, queries_view, neighbors_view, distances_view); + + handle_.sync_stream(); } } // namespace raft::bench::ann From 1fa690ba91f0c64c2da54ded083dd4c18d0d1874 Mon Sep 17 00:00:00 2001 From: Ben Frederickson Date: Wed, 13 Dec 2023 12:48:44 -0800 Subject: [PATCH 2/8] . --- cpp/bench/ann/CMakeLists.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cpp/bench/ann/CMakeLists.txt b/cpp/bench/ann/CMakeLists.txt index 1f6d8e3e3a..f70339374b 100644 --- a/cpp/bench/ann/CMakeLists.txt +++ b/cpp/bench/ann/CMakeLists.txt @@ -53,7 +53,7 @@ if(BUILD_CPU_ONLY) set(RAFT_ANN_BENCH_USE_RAFT_IVF_FLAT OFF) set(RAFT_ANN_BENCH_USE_RAFT_IVF_PQ OFF) set(RAFT_ANN_BENCH_USE_RAFT_CAGRA OFF) - set(RAFT_ANN_BENCH_USE_RAFT_CAGRA OFF) + set(RAFT_ANN_BENCH_USE_RAFT_BRUTE_FORCE OFF) set(RAFT_ANN_BENCH_USE_RAFT_CAGRA_HNSWLIB OFF) set(RAFT_ANN_BENCH_USE_GGNN OFF) else() From aa98240bb3afacec32843fc74e8acc82a2eae0a3 Mon Sep 17 00:00:00 2001 From: Ben Frederickson Date: Wed, 13 Dec 2023 12:49:49 -0800 Subject: [PATCH 3/8] . --- cpp/bench/ann/src/raft/raft_wrapper.h | 1 + 1 file changed, 1 insertion(+) diff --git a/cpp/bench/ann/src/raft/raft_wrapper.h b/cpp/bench/ann/src/raft/raft_wrapper.h index a408d979e5..ceca673662 100644 --- a/cpp/bench/ann/src/raft/raft_wrapper.h +++ b/cpp/bench/ann/src/raft/raft_wrapper.h @@ -35,6 +35,7 @@ inline raft::distance::DistanceType parse_metric_type(raft::bench::ann::Metric m switch (metric) { case raft::bench::ann::Metric::kInnerProduct: return raft::distance::DistanceType::InnerProduct; case raft::bench::ann::Metric::kEuclidean: return raft::distance::DistanceType::L2Expanded; + default: throw std::runtime_error("raft supports only metric type of inner product and L2"); } } } // namespace raft_temp From e1fada6d87160032e4ca8bf0a0535b5de8f335bb Mon Sep 17 00:00:00 2001 From: "Corey J. Nolet" Date: Wed, 13 Dec 2023 16:34:36 -0500 Subject: [PATCH 4/8] Adding yaml config files for brute force --- .../src/raft-ann-bench/run/conf/algos/faiss_cpu_flat.yaml | 5 +++++ .../src/raft-ann-bench/run/conf/algos/faiss_gpu_flat.yaml | 5 +++++ .../src/raft-ann-bench/run/conf/algos/raft_brute_force.yaml | 5 +++++ 3 files changed, 15 insertions(+) create mode 100644 python/raft-ann-bench/src/raft-ann-bench/run/conf/algos/faiss_cpu_flat.yaml create mode 100644 python/raft-ann-bench/src/raft-ann-bench/run/conf/algos/faiss_gpu_flat.yaml create mode 100644 python/raft-ann-bench/src/raft-ann-bench/run/conf/algos/raft_brute_force.yaml diff --git a/python/raft-ann-bench/src/raft-ann-bench/run/conf/algos/faiss_cpu_flat.yaml b/python/raft-ann-bench/src/raft-ann-bench/run/conf/algos/faiss_cpu_flat.yaml new file mode 100644 index 0000000000..25eaf03d40 --- /dev/null +++ b/python/raft-ann-bench/src/raft-ann-bench/run/conf/algos/faiss_cpu_flat.yaml @@ -0,0 +1,5 @@ +name: faiss_cpu_flat +groups: + base: + build: + search: diff --git a/python/raft-ann-bench/src/raft-ann-bench/run/conf/algos/faiss_gpu_flat.yaml b/python/raft-ann-bench/src/raft-ann-bench/run/conf/algos/faiss_gpu_flat.yaml new file mode 100644 index 0000000000..a722e1b91c --- /dev/null +++ b/python/raft-ann-bench/src/raft-ann-bench/run/conf/algos/faiss_gpu_flat.yaml @@ -0,0 +1,5 @@ +name: faiss_gpu_flat +groups: + base: + build: + search: diff --git a/python/raft-ann-bench/src/raft-ann-bench/run/conf/algos/raft_brute_force.yaml b/python/raft-ann-bench/src/raft-ann-bench/run/conf/algos/raft_brute_force.yaml new file mode 100644 index 0000000000..da99841f9b --- /dev/null +++ b/python/raft-ann-bench/src/raft-ann-bench/run/conf/algos/raft_brute_force.yaml @@ -0,0 +1,5 @@ +name: raft_brute_force +groups: + base: + build: + search: From 850d45bf808f3a7d620f3cc9062e74e3ef59c481 Mon Sep 17 00:00:00 2001 From: Ben Frederickson Date: Wed, 13 Dec 2023 14:06:28 -0800 Subject: [PATCH 5/8] fix build --- cpp/bench/ann/src/raft/raft_wrapper.h | 30 ++++++++++++++++++--------- 1 file changed, 20 insertions(+), 10 deletions(-) diff --git a/cpp/bench/ann/src/raft/raft_wrapper.h b/cpp/bench/ann/src/raft/raft_wrapper.h index ceca673662..adca790b1c 100644 --- a/cpp/bench/ann/src/raft/raft_wrapper.h +++ b/cpp/bench/ann/src/raft/raft_wrapper.h @@ -27,6 +27,7 @@ #include #include "../common/ann_types.hpp" +#include "raft_ann_bench_utils.h" namespace raft_temp { @@ -74,10 +75,12 @@ class RaftGpu : public ANN { void set_search_dataset(const T* dataset, size_t nrow) override; void save(const std::string& file) const override; void load(const std::string&) override; + std::unique_ptr> copy() override; protected: - raft::device_resources handle_; - std::optional> index_; + // handle_ must go first to make sure it dies last and all memory allocated in pool + configured_raft_resources handle_{}; + std::shared_ptr> index_; raft::distance::DistanceType metric_type_; int device_; const T* dataset_; @@ -86,19 +89,19 @@ class RaftGpu : public ANN { template RaftGpu::RaftGpu(Metric metric, int dim) - : ANN(metric, dim), - metric_type_(raft_temp::parse_metric_type(metric)), - handle_(cudaStreamPerThread) + : ANN(metric, dim), metric_type_(raft_temp::parse_metric_type(metric)) { RAFT_CUDA_TRY(cudaGetDevice(&device_)); } template -void RaftGpu::build(const T* dataset, size_t nrow, cudaStream_t) +void RaftGpu::build(const T* dataset, size_t nrow, cudaStream_t stream) { auto dataset_view = raft::make_host_matrix_view(dataset, nrow, this->dim_); - index_.emplace(raft::neighbors::brute_force::build(handle_, dataset_view)); - return; + index_ = std::make_shared>( + std::move(raft::neighbors::brute_force::build(handle_, dataset_view))); + + handle_.stream_wait(stream); } template @@ -123,7 +126,8 @@ void RaftGpu::save(const std::string& file) const template void RaftGpu::load(const std::string& file) { - index_ = raft::neighbors::brute_force::deserialize(handle_, file); + index_ = std::make_shared>( + std::move(raft::neighbors::brute_force::deserialize(handle_, file))); } template @@ -143,7 +147,13 @@ void RaftGpu::search(const T* queries, raft::neighbors::brute_force::search( handle_, *index_, queries_view, neighbors_view, distances_view); - handle_.sync_stream(); + handle_.stream_wait(stream); +} + +template +std::unique_ptr> RaftGpu::copy() +{ + return std::make_unique>(*this); // use copy constructor } } // namespace raft::bench::ann From 49a3ac029d1b1856960e60627a9e57436be7e503 Mon Sep 17 00:00:00 2001 From: Ben Frederickson Date: Wed, 13 Dec 2023 14:18:18 -0800 Subject: [PATCH 6/8] fix for no build/search params --- python/raft-ann-bench/src/raft-ann-bench/run/__main__.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/python/raft-ann-bench/src/raft-ann-bench/run/__main__.py b/python/raft-ann-bench/src/raft-ann-bench/run/__main__.py index 9841b47b98..a1f97d67d5 100644 --- a/python/raft-ann-bench/src/raft-ann-bench/run/__main__.py +++ b/python/raft-ann-bench/src/raft-ann-bench/run/__main__.py @@ -498,8 +498,8 @@ def add_algo_group(group_list): ) if executable not in executables_to_run: executables_to_run[executable] = {"index": []} - build_params = algos_conf[algo]["groups"][group]["build"] - search_params = algos_conf[algo]["groups"][group]["search"] + build_params = algos_conf[algo]["groups"][group]["build"] or {} + search_params = algos_conf[algo]["groups"][group]["search"] or {} param_names = [] param_lists = [] From 6a7cbb7986bca59011d0171f870ec5aea2e95fe4 Mon Sep 17 00:00:00 2001 From: Ben Frederickson Date: Wed, 13 Dec 2023 15:28:56 -0800 Subject: [PATCH 7/8] fix faiss_gpu_flat/faiss_cpu_flat --- cpp/bench/ann/src/faiss/faiss_cpu_benchmark.cpp | 2 +- cpp/bench/ann/src/faiss/faiss_gpu_benchmark.cu | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/cpp/bench/ann/src/faiss/faiss_cpu_benchmark.cpp b/cpp/bench/ann/src/faiss/faiss_cpu_benchmark.cpp index 97d1bbf307..e3e25a99a2 100644 --- a/cpp/bench/ann/src/faiss/faiss_cpu_benchmark.cpp +++ b/cpp/bench/ann/src/faiss/faiss_cpu_benchmark.cpp @@ -143,7 +143,7 @@ std::unique_ptr::AnnSearchParam> create_search parse_search_param(conf, *param); return param; } else if (algo == "faiss_cpu_flat") { - auto param = std::make_unique::AnnSearchParam>(); + auto param = std::make_unique::SearchParam>(); return param; } // else diff --git a/cpp/bench/ann/src/faiss/faiss_gpu_benchmark.cu b/cpp/bench/ann/src/faiss/faiss_gpu_benchmark.cu index 8b04ba1980..a9388531cc 100644 --- a/cpp/bench/ann/src/faiss/faiss_gpu_benchmark.cu +++ b/cpp/bench/ann/src/faiss/faiss_gpu_benchmark.cu @@ -143,7 +143,7 @@ std::unique_ptr::AnnSearchParam> create_search parse_search_param(conf, *param); return param; } else if (algo == "faiss_gpu_flat") { - auto param = std::make_unique::AnnSearchParam>(); + auto param = std::make_unique::SearchParam>(); return param; } // else From f71f6578dd39a1e9885177bd186832aa8f54cdf7 Mon Sep 17 00:00:00 2001 From: Ben Frederickson Date: Thu, 14 Dec 2023 21:12:58 -0800 Subject: [PATCH 8/8] add static assert --- cpp/bench/ann/src/raft/raft_wrapper.h | 2 ++ 1 file changed, 2 insertions(+) diff --git a/cpp/bench/ann/src/raft/raft_wrapper.h b/cpp/bench/ann/src/raft/raft_wrapper.h index adca790b1c..eae615cba1 100644 --- a/cpp/bench/ann/src/raft/raft_wrapper.h +++ b/cpp/bench/ann/src/raft/raft_wrapper.h @@ -91,6 +91,8 @@ template RaftGpu::RaftGpu(Metric metric, int dim) : ANN(metric, dim), metric_type_(raft_temp::parse_metric_type(metric)) { + static_assert(std::is_same_v || std::is_same_v, + "raft bfknn only supports float/double"); RAFT_CUDA_TRY(cudaGetDevice(&device_)); }