From 191235517c23e4ce4b8e69f2ff08a95c75456d69 Mon Sep 17 00:00:00 2001 From: Tamas Bela Feher Date: Tue, 28 May 2024 20:21:56 +0200 Subject: [PATCH] Accept host_mdspan for IVF-PQ build and extend (#148) This PR enables host input arrays for `ivf_pq::build` and `ivf_pq::extend`. closes #120 closes #143 Authors: - Tamas Bela Feher (https://github.com/tfeher) - Corey J. Nolet (https://github.com/cjnolet) Approvers: - Corey J. Nolet (https://github.com/cjnolet) URL: https://github.com/rapidsai/cuvs/pull/148 --- cpp/include/cuvs/neighbors/ivf_pq.hpp | 380 +++++++++++++++++- .../neighbors/detail/cagra/cagra_build.cuh | 3 +- .../ivf_pq/detail/generate_ivf_pq.py | 39 +- .../ivf_pq_build_extend_float_int64_t.cu | 35 +- .../detail/ivf_pq_build_extend_inst.cuh | 93 +++++ .../ivf_pq_build_extend_int8_t_int64_t.cu | 35 +- .../ivf_pq_build_extend_uint8_t_int64_t.cu | 35 +- cpp/src/neighbors/ivf_pq/ivf_pq_build.cuh | 59 ++- .../neighbors/ivf_pq/ivf_pq_deserialize.cu | 15 +- cpp/src/neighbors/ivf_pq/ivf_pq_serialize.cu | 15 +- cpp/test/neighbors/ann_ivf_pq.cuh | 18 +- 11 files changed, 527 insertions(+), 200 deletions(-) create mode 100644 cpp/src/neighbors/ivf_pq/detail/ivf_pq_build_extend_inst.cuh diff --git a/cpp/include/cuvs/neighbors/ivf_pq.hpp b/cpp/include/cuvs/neighbors/ivf_pq.hpp index d1e6b37c2f..8493882b43 100644 --- a/cpp/include/cuvs/neighbors/ivf_pq.hpp +++ b/cpp/include/cuvs/neighbors/ivf_pq.hpp @@ -593,6 +593,146 @@ void build(raft::resources const& handle, const cuvs::neighbors::ivf_pq::index_params& index_params, raft::device_matrix_view dataset, cuvs::neighbors::ivf_pq::index* idx); +/** + * @brief Build the index from the dataset for efficient search. + * + * Usage example: + * @code{.cpp} + * using namespace cuvs::neighbors; + * // use default index parameters + * ivf_pq::index_params index_params; + * // create and fill the index from a [N, D] dataset + * auto index = ivf_pq::build(handle, index_params, dataset); + * @endcode + * + * @param[in] handle + * @param[in] index_params configure the index building + * @param[in] dataset a host_matrix_view to a row-major matrix [n_rows, dim] + * + * @return the constructed ivf-pq index + */ +auto build(raft::resources const& handle, + const cuvs::neighbors::ivf_pq::index_params& index_params, + raft::host_matrix_view dataset) + -> cuvs::neighbors::ivf_pq::index; + +/** + * @brief Build the index from the dataset for efficient search. + * + * Usage example: + * @code{.cpp} + * using namespace cuvs::neighbors; + * // use default index parameters + * ivf_pq::index_params index_params; + * // create and fill the index from a [N, D] dataset + * ivf_pq::index index; + * ivf_pq::build(handle, index_params, dataset, index); + * @endcode + * + * @param[in] handle + * @param[in] index_params configure the index building + * @param[in] dataset raft::host_matrix_view to a row-major matrix [n_rows, dim] + * @param[out] idx reference to ivf_pq::index + * + */ +void build(raft::resources const& handle, + const cuvs::neighbors::ivf_pq::index_params& index_params, + raft::host_matrix_view dataset, + cuvs::neighbors::ivf_pq::index* idx); + +/** + * @brief Build the index from the dataset for efficient search. + * + * Usage example: + * @code{.cpp} + * using namespace cuvs::neighbors; + * // use default index parameters + * ivf_pq::index_params index_params; + * // create and fill the index from a [N, D] dataset + * auto index = ivf_pq::build(handle, index_params, dataset); + * @endcode + * + * @param[in] handle + * @param[in] index_params configure the index building + * @param[in] dataset a host_matrix_view to a row-major matrix [n_rows, dim] + * + * @return the constructed ivf-pq index + */ +auto build(raft::resources const& handle, + const cuvs::neighbors::ivf_pq::index_params& index_params, + raft::host_matrix_view dataset) + -> cuvs::neighbors::ivf_pq::index; + +/** + * @brief Build the index from the dataset for efficient search. + * + * Usage example: + * @code{.cpp} + * using namespace cuvs::neighbors; + * // use default index parameters + * ivf_pq::index_params index_params; + * // create and fill the index from a [N, D] dataset + * ivf_pq::index index; + * ivf_pq::build(handle, index_params, dataset, index); + * @endcode + * + * @param[in] handle + * @param[in] index_params configure the index building + * @param[in] dataset raft::host_matrix_view to a row-major matrix [n_rows, dim] + * @param[out] idx reference to ivf_pq::index + * + */ +void build(raft::resources const& handle, + const cuvs::neighbors::ivf_pq::index_params& index_params, + raft::host_matrix_view dataset, + cuvs::neighbors::ivf_pq::index* idx); + +/** + * @brief Build the index from the dataset for efficient search. + * + * Usage example: + * @code{.cpp} + * using namespace cuvs::neighbors; + * // use default index parameters + * ivf_pq::index_params index_params; + * // create and fill the index from a [N, D] dataset + * auto index = ivf_pq::build(handle, index_params, dataset); + * @endcode + * + * @param[in] handle + * @param[in] index_params configure the index building + * @param[in] dataset a host_matrix_view to a row-major matrix [n_rows, dim] + * + * @return the constructed ivf-pq index + */ +auto build(raft::resources const& handle, + const cuvs::neighbors::ivf_pq::index_params& index_params, + raft::host_matrix_view dataset) + -> cuvs::neighbors::ivf_pq::index; + +/** + * @brief Build the index from the dataset for efficient search. + * + * Usage example: + * @code{.cpp} + * using namespace cuvs::neighbors; + * // use default index parameters + * ivf_pq::index_params index_params; + * // create and fill the index from a [N, D] dataset + * ivf_pq::index index; + * ivf_pq::build(handle, index_params, dataset, index); + * @endcode + * + * @param[in] handle + * @param[in] index_params configure the index building + * @param[in] dataset raft::host_matrix_view to a row-major matrix [n_rows, dim] + * @param[out] idx reference to ivf_pq::index + * + */ +void build(raft::resources const& handle, + const cuvs::neighbors::ivf_pq::index_params& index_params, + raft::host_matrix_view dataset, + cuvs::neighbors::ivf_pq::index* idx); /** * @} */ @@ -771,6 +911,177 @@ void extend(raft::resources const& handle, raft::device_matrix_view new_vectors, std::optional> new_indices, cuvs::neighbors::ivf_pq::index* idx); + +/** + * @brief Extend the index with the new data. + * + * Usage example: + * @code{.cpp} + * using namespace cuvs::neighbors; + * ivf_pq::index_params index_params; + * index_params.add_data_on_build = false; // don't populate index on build + * index_params.kmeans_trainset_fraction = 1.0; // use whole dataset for kmeans training + * // train the index from a [N, D] dataset + * auto index_empty = ivf_pq::build(handle, index_params, dataset); + * // fill the index with the data + * std::optional> no_op = std::nullopt; + * auto index = ivf_pq::extend(handle, new_vectors, no_op, index_empty); + * @endcode + * + * @param[in] handle + * @param[in] new_vectors a device matrix view to a row-major matrix [n_rows, idx.dim()] + * @param[in] new_indices a device vector view to a vector of indices [n_rows]. + * If the original index is empty (`idx.size() == 0`), you can pass `std::nullopt` + * here to imply a continuous range `[0...n_rows)`. + * @param[inout] idx + */ +auto extend(raft::resources const& handle, + raft::host_matrix_view new_vectors, + std::optional> new_indices, + const cuvs::neighbors::ivf_pq::index& idx) + -> cuvs::neighbors::ivf_pq::index; + +/** + * @brief Extend the index with the new data. + * + * Usage example: + * @code{.cpp} + * using namespace cuvs::neighbors; + * ivf_pq::index_params index_params; + * index_params.add_data_on_build = false; // don't populate index on build + * index_params.kmeans_trainset_fraction = 1.0; // use whole dataset for kmeans training + * // train the index from a [N, D] dataset + * auto index_empty = ivf_pq::build(handle, index_params, dataset); + * // fill the index with the data + * std::optional> no_op = std::nullopt; + * ivf_pq::extend(handle, new_vectors, no_op, &index_empty); + * @endcode + * + * @param[in] handle + * @param[in] new_vectors a device matrix view to a row-major matrix [n_rows, idx.dim()] + * @param[in] new_indices a device vector view to a vector of indices [n_rows]. + * If the original index is empty (`idx.size() == 0`), you can pass `std::nullopt` + * here to imply a continuous range `[0...n_rows)`. + * @param[inout] idx + */ +void extend(raft::resources const& handle, + raft::host_matrix_view new_vectors, + std::optional> new_indices, + cuvs::neighbors::ivf_pq::index* idx); + +/** + * @brief Extend the index with the new data. + * + * Usage example: + * @code{.cpp} + * using namespace cuvs::neighbors; + * ivf_pq::index_params index_params; + * index_params.add_data_on_build = false; // don't populate index on build + * index_params.kmeans_trainset_fraction = 1.0; // use whole dataset for kmeans training + * // train the index from a [N, D] dataset + * auto index_empty = ivf_pq::build(handle, index_params, dataset); + * // fill the index with the data + * std::optional> no_op = std::nullopt; + * auto index = ivf_pq::extend(handle, new_vectors, no_op, index_empty); + * @endcode + * + * @param[in] handle + * @param[in] new_vectors a device matrix view to a row-major matrix [n_rows, idx.dim()] + * @param[in] new_indices a device vector view to a vector of indices [n_rows]. + * If the original index is empty (`idx.size() == 0`), you can pass `std::nullopt` + * here to imply a continuous range `[0...n_rows)`. + * @param[inout] idx + */ +auto extend(raft::resources const& handle, + raft::host_matrix_view new_vectors, + std::optional> new_indices, + const cuvs::neighbors::ivf_pq::index& idx) + -> cuvs::neighbors::ivf_pq::index; + +/** + * @brief Extend the index with the new data. + * + * Usage example: + * @code{.cpp} + * using namespace cuvs::neighbors; + * ivf_pq::index_params index_params; + * index_params.add_data_on_build = false; // don't populate index on build + * index_params.kmeans_trainset_fraction = 1.0; // use whole dataset for kmeans training + * // train the index from a [N, D] dataset + * auto index_empty = ivf_pq::build(handle, index_params, dataset); + * // fill the index with the data + * std::optional> no_op = std::nullopt; + * ivf_pq::extend(handle, new_vectors, no_op, &index_empty); + * @endcode + * + * @param[in] handle + * @param[in] new_vectors a device matrix view to a row-major matrix [n_rows, idx.dim()] + * @param[in] new_indices a device vector view to a vector of indices [n_rows]. + * If the original index is empty (`idx.size() == 0`), you can pass `std::nullopt` + * here to imply a continuous range `[0...n_rows)`. + * @param[inout] idx + */ +void extend(raft::resources const& handle, + raft::host_matrix_view new_vectors, + std::optional> new_indices, + cuvs::neighbors::ivf_pq::index* idx); + +/** + * @brief Extend the index with the new data. + * + * Usage example: + * @code{.cpp} + * using namespace cuvs::neighbors; + * ivf_pq::index_params index_params; + * index_params.add_data_on_build = false; // don't populate index on build + * index_params.kmeans_trainset_fraction = 1.0; // use whole dataset for kmeans training + * // train the index from a [N, D] dataset + * auto index_empty = ivf_pq::build(handle, index_params, dataset); + * // fill the index with the data + * std::optional> no_op = std::nullopt; + * auto index = ivf_pq::extend(handle, new_vectors, no_op, index_empty); + * @endcode + * + * @param[in] handle + * @param[in] new_vectors a device matrix view to a row-major matrix [n_rows, idx.dim()] + * @param[in] new_indices a device vector view to a vector of indices [n_rows]. + * If the original index is empty (`idx.size() == 0`), you can pass `std::nullopt` + * here to imply a continuous range `[0...n_rows)`. + * @param[inout] idx + */ +auto extend(raft::resources const& handle, + raft::host_matrix_view new_vectors, + std::optional> new_indices, + const cuvs::neighbors::ivf_pq::index& idx) + -> cuvs::neighbors::ivf_pq::index; + +/** + * @brief Extend the index with the new data. + * + * Usage example: + * @code{.cpp} + * using namespace cuvs::neighbors; + * ivf_pq::index_params index_params; + * index_params.add_data_on_build = false; // don't populate index on build + * index_params.kmeans_trainset_fraction = 1.0; // use whole dataset for kmeans training + * // train the index from a [N, D] dataset + * auto index_empty = ivf_pq::build(handle, index_params, dataset); + * // fill the index with the data + * std::optional> no_op = std::nullopt; + * ivf_pq::extend(handle, new_vectors, no_op, &index_empty); + * @endcode + * + * @param[in] handle + * @param[in] new_vectors a device matrix view to a row-major matrix [n_rows, idx.dim()] + * @param[in] new_indices a device vector view to a vector of indices [n_rows]. + * If the original index is empty (`idx.size() == 0`), you can pass `std::nullopt` + * here to imply a continuous range `[0...n_rows)`. + * @param[inout] idx + */ +void extend(raft::resources const& handle, + raft::host_matrix_view new_vectors, + std::optional> new_indices, + cuvs::neighbors::ivf_pq::index* idx); /** * @} */ @@ -1009,9 +1320,30 @@ void search_with_filtering( * @{ */ /** - * Save the index to file. + * Serialize the index to an output string. * - * Experimental, both the API and the serialization format are subject to change. + * @code{.cpp} + * #include + * + * raft::resources handle; + * + * // create an input string + * std::string str + * // create an index with `auto index = ivf_pq::build(...);` + * cuvs::serialize(handle, str, index); + * @endcode + * + * @param[in] handle the raft handle + * @param[out] str output string + * @param[in] index IVF-PQ index + * + */ +void serialize(raft::resources const& handle, + std::string& str, + const cuvs::neighbors::ivf_pq::index& index); + +/** + * Save the index to file. * * @code{.cpp} * #include @@ -1029,14 +1361,38 @@ void search_with_filtering( * @param[in] index IVF-PQ index * */ -void serialize(raft::resources const& handle, - std::string& filename, - const cuvs::neighbors::ivf_pq::index& index); +void serialize_file(raft::resources const& handle, + const std::string& filename, + const cuvs::neighbors::ivf_pq::index& index); /** - * Load index from file. + * Load index from input string. + * + * @code{.cpp} + * #include * - * Experimental, both the API and the serialization format are subject to change. + * raft::resources handle; + * + * std::string str = ... + * + * using IdxT = int64_t; // type of the index + * // create an empty index + * cuvs::neighbors::ivf_pq::index index(handl, index_params, dim); + * + * cuvs::deserialize(handle, filename, &index); + * @endcode + * + * @param[in] handle the raft handle + * @param[in] str the name of the file that stores the index + * @param[out] index IVF-PQ index + * + */ + +void deserialize(raft::resources const& handle, + const std::string& str, + cuvs::neighbors::ivf_pq::index* index); +/** + * Load index from file. * * @code{.cpp} * #include @@ -1046,7 +1402,9 @@ void serialize(raft::resources const& handle, * // create a string with a filepath * std::string filename("/path/to/index"); * using IdxT = int64_t; // type of the index - * // create an empty index with `ivf_pq::index index(handle, index_params, dim);` + * // create an empty index with + * ivf_pq::index index(handle, index_params, dim); + * * cuvs::deserialize(handle, filename, &index); * @endcode * @@ -1055,9 +1413,9 @@ void serialize(raft::resources const& handle, * @param[out] index IVF-PQ index * */ -void deserialize(raft::resources const& handle, - const std::string& filename, - cuvs::neighbors::ivf_pq::index* index); +void deserialize_file(raft::resources const& handle, + const std::string& filename, + cuvs::neighbors::ivf_pq::index* index); /** * @} */ diff --git a/cpp/src/neighbors/detail/cagra/cagra_build.cuh b/cpp/src/neighbors/detail/cagra/cagra_build.cuh index 2f6cb17e36..0ca97b9ca9 100644 --- a/cpp/src/neighbors/detail/cagra/cagra_build.cuh +++ b/cpp/src/neighbors/detail/cagra/cagra_build.cuh @@ -91,8 +91,7 @@ void build_knn_graph( }(); RAFT_LOG_DEBUG("# Building IVF-PQ index %s", model_name.c_str()); - auto index = cuvs::neighbors::ivf_pq::detail::build( - res, *build_params, dataset.data_handle(), dataset.extent(0), dataset.extent(1)); + auto index = cuvs::neighbors::ivf_pq::detail::build(res, *build_params, dataset); // // search top (k + 1) neighbors diff --git a/cpp/src/neighbors/ivf_pq/detail/generate_ivf_pq.py b/cpp/src/neighbors/ivf_pq/detail/generate_ivf_pq.py index 2ba513579c..878c7ee214 100644 --- a/cpp/src/neighbors/ivf_pq/detail/generate_ivf_pq.py +++ b/cpp/src/neighbors/ivf_pq/detail/generate_ivf_pq.py @@ -41,7 +41,7 @@ """ build_include_macro = """ -#include "../ivf_pq_build.cuh" +#include "ivf_pq_build_extend_inst.cuh" """ search_include_macro = """ #include "../ivf_pq_search.cuh" @@ -61,42 +61,7 @@ uint8_t_int64_t=("uint8_t", "int64_t"), ) -build_extend_macro = """ -#define CUVS_INST_IVF_PQ_BUILD_EXTEND(T, IdxT) \\ - auto build(raft::resources const& handle, \\ - const cuvs::neighbors::ivf_pq::index_params& params, \\ - raft::device_matrix_view dataset) \\ - ->cuvs::neighbors::ivf_pq::index \\ - { \\ - return cuvs::neighbors::ivf_pq::detail::build(handle, params, dataset); \\ - } \\ - \\ - void build(raft::resources const& handle, \\ - const cuvs::neighbors::ivf_pq::index_params& params, \\ - raft::device_matrix_view dataset, \\ - cuvs::neighbors::ivf_pq::index* idx) \\ - { \\ - cuvs::neighbors::ivf_pq::detail::build(handle, params, dataset, idx); \\ - } \\ - auto extend(raft::resources const& handle, \\ - raft::device_matrix_view new_vectors, \\ - std::optional> new_indices, \\ - const cuvs::neighbors::ivf_pq::index& orig_index) \\ - ->cuvs::neighbors::ivf_pq::index \\ - { \\ - return cuvs::neighbors::ivf_pq::detail::extend( \\ - handle, new_vectors, new_indices, orig_index); \\ - } \\ - \\ - void extend(raft::resources const& handle, \\ - raft::device_matrix_view new_vectors, \\ - std::optional> new_indices, \\ - cuvs::neighbors::ivf_pq::index* idx) \\ - { \\ - cuvs::neighbors::ivf_pq::detail::extend( \\ - handle, new_vectors, new_indices, idx); \\ - } -""" +build_extend_macro = "" # moved to header ivf_pq_build_extend_inst.cuh search_macro = """ #define CUVS_INST_IVF_PQ_SEARCH(T, IdxT) \\ diff --git a/cpp/src/neighbors/ivf_pq/detail/ivf_pq_build_extend_float_int64_t.cu b/cpp/src/neighbors/ivf_pq/detail/ivf_pq_build_extend_float_int64_t.cu index ee7f26381f..65c443d883 100644 --- a/cpp/src/neighbors/ivf_pq/detail/ivf_pq_build_extend_float_int64_t.cu +++ b/cpp/src/neighbors/ivf_pq/detail/ivf_pq_build_extend_float_int64_t.cu @@ -25,42 +25,9 @@ #include -#include "../ivf_pq_build.cuh" +#include "ivf_pq_build_extend_inst.cuh" namespace cuvs::neighbors::ivf_pq { - -#define CUVS_INST_IVF_PQ_BUILD_EXTEND(T, IdxT) \ - auto build(raft::resources const& handle, \ - const cuvs::neighbors::ivf_pq::index_params& params, \ - raft::device_matrix_view dataset) \ - ->cuvs::neighbors::ivf_pq::index \ - { \ - return cuvs::neighbors::ivf_pq::detail::build(handle, params, dataset); \ - } \ - \ - void build(raft::resources const& handle, \ - const cuvs::neighbors::ivf_pq::index_params& params, \ - raft::device_matrix_view dataset, \ - cuvs::neighbors::ivf_pq::index* idx) \ - { \ - cuvs::neighbors::ivf_pq::detail::build(handle, params, dataset, idx); \ - } \ - auto extend(raft::resources const& handle, \ - raft::device_matrix_view new_vectors, \ - std::optional> new_indices, \ - const cuvs::neighbors::ivf_pq::index& orig_index) \ - ->cuvs::neighbors::ivf_pq::index \ - { \ - return cuvs::neighbors::ivf_pq::detail::extend(handle, new_vectors, new_indices, orig_index); \ - } \ - \ - void extend(raft::resources const& handle, \ - raft::device_matrix_view new_vectors, \ - std::optional> new_indices, \ - cuvs::neighbors::ivf_pq::index* idx) \ - { \ - cuvs::neighbors::ivf_pq::detail::extend(handle, new_vectors, new_indices, idx); \ - } CUVS_INST_IVF_PQ_BUILD_EXTEND(float, int64_t); #undef CUVS_INST_IVF_PQ_BUILD_EXTEND diff --git a/cpp/src/neighbors/ivf_pq/detail/ivf_pq_build_extend_inst.cuh b/cpp/src/neighbors/ivf_pq/detail/ivf_pq_build_extend_inst.cuh new file mode 100644 index 0000000000..4b963b0b37 --- /dev/null +++ b/cpp/src/neighbors/ivf_pq/detail/ivf_pq_build_extend_inst.cuh @@ -0,0 +1,93 @@ +/* + * Copyright (c) 2024, NVIDIA CORPORATION. + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +/* + * NOTE: this file is used by generate_ivf_pq.py + * + */ + +#include + +#include "../ivf_pq_build.cuh" + +namespace cuvs::neighbors::ivf_pq { + +#define CUVS_INST_IVF_PQ_BUILD_EXTEND(T, IdxT) \ + auto build(raft::resources const& handle, \ + const cuvs::neighbors::ivf_pq::index_params& params, \ + raft::device_matrix_view dataset) \ + ->cuvs::neighbors::ivf_pq::index \ + { \ + return cuvs::neighbors::ivf_pq::detail::build(handle, params, dataset); \ + } \ + \ + void build(raft::resources const& handle, \ + const cuvs::neighbors::ivf_pq::index_params& params, \ + raft::device_matrix_view dataset, \ + cuvs::neighbors::ivf_pq::index* idx) \ + { \ + cuvs::neighbors::ivf_pq::detail::build(handle, params, dataset, idx); \ + } \ + \ + auto build(raft::resources const& handle, \ + const cuvs::neighbors::ivf_pq::index_params& params, \ + raft::host_matrix_view dataset) \ + ->cuvs::neighbors::ivf_pq::index \ + { \ + return cuvs::neighbors::ivf_pq::detail::build(handle, params, dataset); \ + } \ + \ + void build(raft::resources const& handle, \ + const cuvs::neighbors::ivf_pq::index_params& params, \ + raft::host_matrix_view dataset, \ + cuvs::neighbors::ivf_pq::index* idx) \ + { \ + cuvs::neighbors::ivf_pq::detail::build(handle, params, dataset, idx); \ + } \ + auto extend( \ + raft::resources const& handle, \ + raft::device_matrix_view new_vectors, \ + std::optional> new_indices, \ + const cuvs::neighbors::ivf_pq::index& orig_index) \ + ->cuvs::neighbors::ivf_pq::index \ + { \ + return cuvs::neighbors::ivf_pq::detail::extend(handle, new_vectors, new_indices, orig_index); \ + } \ + void extend(raft::resources const& handle, \ + raft::device_matrix_view new_vectors, \ + std::optional> new_indices, \ + cuvs::neighbors::ivf_pq::index* idx) \ + { \ + cuvs::neighbors::ivf_pq::detail::extend(handle, new_vectors, new_indices, idx); \ + } \ + auto extend(raft::resources const& handle, \ + raft::host_matrix_view new_vectors, \ + std::optional> new_indices, \ + const cuvs::neighbors::ivf_pq::index& orig_index) \ + ->cuvs::neighbors::ivf_pq::index \ + { \ + return cuvs::neighbors::ivf_pq::detail::extend(handle, new_vectors, new_indices, orig_index); \ + } \ + \ + void extend(raft::resources const& handle, \ + raft::host_matrix_view new_vectors, \ + std::optional> new_indices, \ + cuvs::neighbors::ivf_pq::index* idx) \ + { \ + cuvs::neighbors::ivf_pq::detail::extend(handle, new_vectors, new_indices, idx); \ + } + +} // namespace cuvs::neighbors::ivf_pq diff --git a/cpp/src/neighbors/ivf_pq/detail/ivf_pq_build_extend_int8_t_int64_t.cu b/cpp/src/neighbors/ivf_pq/detail/ivf_pq_build_extend_int8_t_int64_t.cu index 8b612439d6..048560b5a4 100644 --- a/cpp/src/neighbors/ivf_pq/detail/ivf_pq_build_extend_int8_t_int64_t.cu +++ b/cpp/src/neighbors/ivf_pq/detail/ivf_pq_build_extend_int8_t_int64_t.cu @@ -25,42 +25,9 @@ #include -#include "../ivf_pq_build.cuh" +#include "ivf_pq_build_extend_inst.cuh" namespace cuvs::neighbors::ivf_pq { - -#define CUVS_INST_IVF_PQ_BUILD_EXTEND(T, IdxT) \ - auto build(raft::resources const& handle, \ - const cuvs::neighbors::ivf_pq::index_params& params, \ - raft::device_matrix_view dataset) \ - ->cuvs::neighbors::ivf_pq::index \ - { \ - return cuvs::neighbors::ivf_pq::detail::build(handle, params, dataset); \ - } \ - \ - void build(raft::resources const& handle, \ - const cuvs::neighbors::ivf_pq::index_params& params, \ - raft::device_matrix_view dataset, \ - cuvs::neighbors::ivf_pq::index* idx) \ - { \ - cuvs::neighbors::ivf_pq::detail::build(handle, params, dataset, idx); \ - } \ - auto extend(raft::resources const& handle, \ - raft::device_matrix_view new_vectors, \ - std::optional> new_indices, \ - const cuvs::neighbors::ivf_pq::index& orig_index) \ - ->cuvs::neighbors::ivf_pq::index \ - { \ - return cuvs::neighbors::ivf_pq::detail::extend(handle, new_vectors, new_indices, orig_index); \ - } \ - \ - void extend(raft::resources const& handle, \ - raft::device_matrix_view new_vectors, \ - std::optional> new_indices, \ - cuvs::neighbors::ivf_pq::index* idx) \ - { \ - cuvs::neighbors::ivf_pq::detail::extend(handle, new_vectors, new_indices, idx); \ - } CUVS_INST_IVF_PQ_BUILD_EXTEND(int8_t, int64_t); #undef CUVS_INST_IVF_PQ_BUILD_EXTEND diff --git a/cpp/src/neighbors/ivf_pq/detail/ivf_pq_build_extend_uint8_t_int64_t.cu b/cpp/src/neighbors/ivf_pq/detail/ivf_pq_build_extend_uint8_t_int64_t.cu index df6e12b7e3..755fb9f8d7 100644 --- a/cpp/src/neighbors/ivf_pq/detail/ivf_pq_build_extend_uint8_t_int64_t.cu +++ b/cpp/src/neighbors/ivf_pq/detail/ivf_pq_build_extend_uint8_t_int64_t.cu @@ -25,42 +25,9 @@ #include -#include "../ivf_pq_build.cuh" +#include "ivf_pq_build_extend_inst.cuh" namespace cuvs::neighbors::ivf_pq { - -#define CUVS_INST_IVF_PQ_BUILD_EXTEND(T, IdxT) \ - auto build(raft::resources const& handle, \ - const cuvs::neighbors::ivf_pq::index_params& params, \ - raft::device_matrix_view dataset) \ - ->cuvs::neighbors::ivf_pq::index \ - { \ - return cuvs::neighbors::ivf_pq::detail::build(handle, params, dataset); \ - } \ - \ - void build(raft::resources const& handle, \ - const cuvs::neighbors::ivf_pq::index_params& params, \ - raft::device_matrix_view dataset, \ - cuvs::neighbors::ivf_pq::index* idx) \ - { \ - cuvs::neighbors::ivf_pq::detail::build(handle, params, dataset, idx); \ - } \ - auto extend(raft::resources const& handle, \ - raft::device_matrix_view new_vectors, \ - std::optional> new_indices, \ - const cuvs::neighbors::ivf_pq::index& orig_index) \ - ->cuvs::neighbors::ivf_pq::index \ - { \ - return cuvs::neighbors::ivf_pq::detail::extend(handle, new_vectors, new_indices, orig_index); \ - } \ - \ - void extend(raft::resources const& handle, \ - raft::device_matrix_view new_vectors, \ - std::optional> new_indices, \ - cuvs::neighbors::ivf_pq::index* idx) \ - { \ - cuvs::neighbors::ivf_pq::detail::extend(handle, new_vectors, new_indices, idx); \ - } CUVS_INST_IVF_PQ_BUILD_EXTEND(uint8_t, int64_t); #undef CUVS_INST_IVF_PQ_BUILD_EXTEND diff --git a/cpp/src/neighbors/ivf_pq/ivf_pq_build.cuh b/cpp/src/neighbors/ivf_pq/ivf_pq_build.cuh index 5536d6edb1..3b0e475f4b 100644 --- a/cpp/src/neighbors/ivf_pq/ivf_pq_build.cuh +++ b/cpp/src/neighbors/ivf_pq/ivf_pq_build.cuh @@ -1659,13 +1659,14 @@ auto extend(raft::resources const& handle, return ext_index; } -template +template auto build(raft::resources const& handle, const index_params& params, - const T* dataset, - IdxT n_rows, - uint32_t dim) -> index + raft::mdspan, raft::row_major, accessor> dataset) + -> index { + IdxT n_rows = dataset.extent(0); + IdxT dim = dataset.extent(1); raft::common::nvtx::range fun_scope( "ivf_pq::build(%zu, %u)", size_t(n_rows), dim); static_assert(std::is_same_v || std::is_same_v || std::is_same_v || @@ -1700,7 +1701,7 @@ auto build(raft::resources const& handle, if constexpr (std::is_same_v) { RAFT_CUDA_TRY(cudaMemcpy2DAsync(trainset.data(), sizeof(T) * index.dim(), - dataset, + dataset.data_handle(), sizeof(T) * index.dim() * trainset_ratio, sizeof(T) * index.dim(), n_rows_train, @@ -1709,7 +1710,7 @@ auto build(raft::resources const& handle, } else { size_t dim = index.dim(); cudaPointerAttributes dataset_attr; - RAFT_CUDA_TRY(cudaPointerGetAttributes(&dataset_attr, dataset)); + RAFT_CUDA_TRY(cudaPointerGetAttributes(&dataset_attr, dataset.data_handle())); if (dataset_attr.devicePointer != nullptr) { // data is available on device: just run the kernel to raft::copy and map the data auto p = reinterpret_cast(dataset_attr.devicePointer); @@ -1728,7 +1729,7 @@ auto build(raft::resources const& handle, // T at the end of float rows. RAFT_CUDA_TRY(cudaMemcpy2DAsync(trainset_tmp, sizeof(float) * index.dim(), - dataset, + dataset.data_handle(), sizeof(T) * index.dim() * trainset_ratio, sizeof(T) * index.dim(), n_rows_train, @@ -1809,37 +1810,27 @@ auto build(raft::resources const& handle, // add the data if necessary if (params.add_data_on_build) { - detail::extend(handle, &index, dataset, nullptr, n_rows); + detail::extend(handle, &index, dataset.data_handle(), nullptr, n_rows); } return index; } -template -auto build(raft::resources const& handle, - const index_params& params, - raft::device_matrix_view dataset) -> index -{ - IdxT n_rows = dataset.extent(0); - IdxT dim = dataset.extent(1); - return build(handle, params, dataset.data_handle(), n_rows, dim); -} - -template +template void build(raft::resources const& handle, const index_params& params, - raft::device_matrix_view dataset, + raft::mdspan, raft::row_major, accessor> dataset, index* index) { - IdxT n_rows = dataset.extent(0); - IdxT dim = dataset.extent(1); - *index = build(handle, params, dataset.data_handle(), n_rows, dim); + *index = build(handle, params, dataset); } -template -auto extend(raft::resources const& handle, - raft::device_matrix_view new_vectors, - std::optional> new_indices, - const cuvs::neighbors::ivf_pq::index& orig_index) -> index +template +auto extend( + raft::resources const& handle, + raft::mdspan, raft::row_major, accessor> new_vectors, + std::optional, raft::row_major, accessor2>> + new_indices, + const cuvs::neighbors::ivf_pq::index& orig_index) -> index { ASSERT(new_vectors.extent(1) == orig_index.dim(), "new_vectors should have the same dimension as the index"); @@ -1857,11 +1848,13 @@ auto extend(raft::resources const& handle, n_rows); } -template -void extend(raft::resources const& handle, - raft::device_matrix_view new_vectors, - std::optional> new_indices, - index* index) +template +void extend( + raft::resources const& handle, + raft::mdspan, raft::row_major, accessor> new_vectors, + std::optional, raft::row_major, accessor2>> + new_indices, + index* index) { ASSERT(new_vectors.extent(1) == index->dim(), "new_vectors should have the same dimension as the index"); diff --git a/cpp/src/neighbors/ivf_pq/ivf_pq_deserialize.cu b/cpp/src/neighbors/ivf_pq/ivf_pq_deserialize.cu index 9515cd2d58..7827e7892a 100644 --- a/cpp/src/neighbors/ivf_pq/ivf_pq_deserialize.cu +++ b/cpp/src/neighbors/ivf_pq/ivf_pq_deserialize.cu @@ -16,15 +16,24 @@ #include "ivf_pq_serialize.cuh" #include +#include namespace cuvs::neighbors::ivf_pq { -void deserialize(raft::resources const& handle, - const std::string& filename, - cuvs::neighbors::ivf_pq::index* index) +void deserialize_file(raft::resources const& handle, + const std::string& filename, + cuvs::neighbors::ivf_pq::index* index) { if (!index) { RAFT_FAIL("Invalid index pointer"); } *index = cuvs::neighbors::ivf_pq::detail::deserialize(handle, filename); } +void deserialize(raft::resources const& handle, + const std::string& str, + cuvs::neighbors::ivf_pq::index* index) +{ + if (!index) { RAFT_FAIL("Invalid index pointer"); } + std::istringstream is(str); + *index = cuvs::neighbors::ivf_pq::detail::deserialize(handle, is); +} } // namespace cuvs::neighbors::ivf_pq \ No newline at end of file diff --git a/cpp/src/neighbors/ivf_pq/ivf_pq_serialize.cu b/cpp/src/neighbors/ivf_pq/ivf_pq_serialize.cu index 0fb71d0317..f0214f4bb3 100644 --- a/cpp/src/neighbors/ivf_pq/ivf_pq_serialize.cu +++ b/cpp/src/neighbors/ivf_pq/ivf_pq_serialize.cu @@ -16,14 +16,23 @@ #include "ivf_pq_serialize.cuh" #include +#include namespace cuvs::neighbors::ivf_pq { -void serialize(raft::resources const& handle, - std::string& filename, - const cuvs::neighbors::ivf_pq::index& index) +void serialize_file(raft::resources const& handle, + const std::string& filename, + const cuvs::neighbors::ivf_pq::index& index) { cuvs::neighbors::ivf_pq::detail::serialize(handle, filename, index); } +void serialize(raft::resources const& handle, + std::string& str, + const cuvs::neighbors::ivf_pq::index& index) +{ + std::ostringstream os; + cuvs::neighbors::ivf_pq::detail::serialize(handle, os, index); + str = os.str(); +} } // namespace cuvs::neighbors::ivf_pq \ No newline at end of file diff --git a/cpp/test/neighbors/ann_ivf_pq.cuh b/cpp/test/neighbors/ann_ivf_pq.cuh index fda32c6df2..f716a8efed 100644 --- a/cpp/test/neighbors/ann_ivf_pq.cuh +++ b/cpp/test/neighbors/ann_ivf_pq.cuh @@ -204,7 +204,7 @@ class ivf_pq_test : public ::testing::TestWithParam { ipams.add_data_on_build = true; auto index_view = - raft::make_device_matrix_view(database.data(), ps.num_db_vecs, ps.dim); + raft::make_device_matrix_view(database.data(), ps.num_db_vecs, ps.dim); return cuvs::neighbors::ivf_pq::build(handle_, ipams, index_view); } @@ -224,16 +224,16 @@ class ivf_pq_test : public ::testing::TestWithParam { ipams.add_data_on_build = false; auto database_view = - raft::make_device_matrix_view(database.data(), ps.num_db_vecs, ps.dim); + raft::make_device_matrix_view(database.data(), ps.num_db_vecs, ps.dim); auto idx = cuvs::neighbors::ivf_pq::build(handle_, ipams, database_view); - auto vecs_2_view = raft::make_device_matrix_view(vecs_2, size_2, ps.dim); - auto inds_2_view = raft::make_device_vector_view(inds_2, size_2); + auto vecs_2_view = raft::make_device_matrix_view(vecs_2, size_2, ps.dim); + auto inds_2_view = raft::make_device_vector_view(inds_2, size_2); cuvs::neighbors::ivf_pq::extend(handle_, vecs_2_view, inds_2_view, &idx); auto vecs_1_view = - raft::make_device_matrix_view(vecs_1, size_1, ps.dim); - auto inds_1_view = raft::make_device_vector_view(inds_1, size_1); + raft::make_device_matrix_view(vecs_1, size_1, ps.dim); + auto inds_1_view = raft::make_device_vector_view(inds_1, size_1); cuvs::neighbors::ivf_pq::extend(handle_, vecs_1_view, inds_1_view, &idx); return idx; } @@ -241,9 +241,9 @@ class ivf_pq_test : public ::testing::TestWithParam { auto build_serialize() { std::string filename = "ivf_pq_index"; - cuvs::neighbors::ivf_pq::serialize(handle_, filename, build_only()); + cuvs::neighbors::ivf_pq::serialize_file(handle_, filename, build_only()); cuvs::neighbors::ivf_pq::index index(handle_, ps.index_params, ps.dim); - cuvs::neighbors::ivf_pq::deserialize(handle_, filename, &index); + cuvs::neighbors::ivf_pq::deserialize_file(handle_, filename, &index); return index; } @@ -564,7 +564,7 @@ class ivf_pq_filter_test : public ::testing::TestWithParam { ipams.add_data_on_build = true; auto index_view = - raft::make_device_matrix_view(database.data(), ps.num_db_vecs, ps.dim); + raft::make_device_matrix_view(database.data(), ps.num_db_vecs, ps.dim); return cuvs::neighbors::ivf_pq::build(handle_, ipams, index_view); }