From 87d620ff15de25086d83be8dbfa19756e906cb61 Mon Sep 17 00:00:00 2001 From: "Corey J. Nolet" Date: Thu, 20 Oct 2022 19:06:27 -0400 Subject: [PATCH 1/8] Correcting spatial::knn docs to raft::neighbors --- docs/source/cpp_api.rst | 6 +-- .../cpp_api/{clustering.rst => cluster.rst} | 6 +-- docs/source/cpp_api/distance.rst | 10 +++++ docs/source/cpp_api/neighbors.rst | 43 +++++++++++++++++++ .../cpp_api/{optimization.rst => solver.rst} | 0 docs/source/cpp_api/spatial.rst | 31 ------------- 6 files changed, 59 insertions(+), 37 deletions(-) rename docs/source/cpp_api/{clustering.rst => cluster.rst} (77%) create mode 100644 docs/source/cpp_api/distance.rst create mode 100644 docs/source/cpp_api/neighbors.rst rename docs/source/cpp_api/{optimization.rst => solver.rst} (100%) delete mode 100644 docs/source/cpp_api/spatial.rst diff --git a/docs/source/cpp_api.rst b/docs/source/cpp_api.rst index db139031a2..05d3686dc3 100644 --- a/docs/source/cpp_api.rst +++ b/docs/source/cpp_api.rst @@ -9,11 +9,11 @@ RAFT C++ API Reference :maxdepth: 4 cpp_api/core.rst - cpp_api/clustering.rst + cpp_api/cluster.rst cpp_api/linalg.rst cpp_api/matrix.rst - cpp_api/optimization.rst + cpp_api/solver.rst cpp_api/random.rst - cpp_api/spatial.rst + cpp_api/distance.rst cpp_api/sparse.rst cpp_api/stats.rst \ No newline at end of file diff --git a/docs/source/cpp_api/clustering.rst b/docs/source/cpp_api/cluster.rst similarity index 77% rename from docs/source/cpp_api/clustering.rst rename to docs/source/cpp_api/cluster.rst index 90ca786cc1..781180a72a 100644 --- a/docs/source/cpp_api/clustering.rst +++ b/docs/source/cpp_api/cluster.rst @@ -1,7 +1,7 @@ -Clustering -========== +Cluster +======= -This page provides C++ class references for the publicly-exposed elements of the clustering package. +This page provides C++ class references for the publicly-exposed elements of the cluster package. .. doxygennamespace:: raft::cluster :project: RAFT diff --git a/docs/source/cpp_api/distance.rst b/docs/source/cpp_api/distance.rst new file mode 100644 index 0000000000..c2bce860d5 --- /dev/null +++ b/docs/source/cpp_api/distance.rst @@ -0,0 +1,10 @@ +Distance +======== + +This page provides C++ class references for the publicly-exposed elements of the distance package. + +Distance +######## + +.. doxygennamespace:: raft::distance + :project: RAFT diff --git a/docs/source/cpp_api/neighbors.rst b/docs/source/cpp_api/neighbors.rst new file mode 100644 index 0000000000..962bbd1efe --- /dev/null +++ b/docs/source/cpp_api/neighbors.rst @@ -0,0 +1,43 @@ +Neighbors +========= + +This page provides C++ class references for the publicly-exposed elements of the neighbors package. + + +Brute-force +----------- + +.. doxygennamespace:: raft::neighbors::brute_force + :project: RAFT + + +IVF-Flat +-------- + +.. doxygennamespace:: raft::neighbors::ivf_flat + :project: RAFT + :members: + + +IVF-PQ +-------- + +.. doxygennamespace:: raft::neighbors::ivf_pq + :project: RAFT + :members: + + +Epsilon Neighborhood +-------------------- + +.. doxygennamespace:: raft::neighbors::epsilon_neighborhood + :project: RAFT + :members: + + +Random Ball Cover +----------------- + +.. doxygennamespace:: raft::neighbors::ball_cover + :project: RAFT + :members: diff --git a/docs/source/cpp_api/optimization.rst b/docs/source/cpp_api/solver.rst similarity index 100% rename from docs/source/cpp_api/optimization.rst rename to docs/source/cpp_api/solver.rst diff --git a/docs/source/cpp_api/spatial.rst b/docs/source/cpp_api/spatial.rst deleted file mode 100644 index 9bda00dab7..0000000000 --- a/docs/source/cpp_api/spatial.rst +++ /dev/null @@ -1,31 +0,0 @@ -Spatial -======= - -This page provides C++ class references for the publicly-exposed elements of the spatial package. - -Distance -######## - -.. doxygennamespace:: raft::distance - :project: RAFT - - -Nearest Neighbors -################# - -.. doxygenfunction:: raft::spatial::knn::brute_force_knn - :project: RAFT - -.. doxygenfunction:: raft::spatial::knn::select_k - :project: RAFT - -.. doxygenfunction:: raft::spatial::knn::knn_merge_parts - :project: RAFT - - -IVF-Flat --------- - -.. doxygennamespace:: raft::spatial::knn::ivf_flat - :project: RAFT - :members: From febd1d40eb2bc511731b9335912e8bbf9cbeb3f8 Mon Sep 17 00:00:00 2001 From: "Corey J. Nolet" Date: Thu, 20 Oct 2022 19:08:48 -0400 Subject: [PATCH 2/8] Adding neighbors to index --- docs/source/cpp_api.rst | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/docs/source/cpp_api.rst b/docs/source/cpp_api.rst index 05d3686dc3..d10d9773a5 100644 --- a/docs/source/cpp_api.rst +++ b/docs/source/cpp_api.rst @@ -10,10 +10,11 @@ RAFT C++ API Reference cpp_api/core.rst cpp_api/cluster.rst + cpp_api/distance.rst cpp_api/linalg.rst cpp_api/matrix.rst + cpp_api/neighbors.rst cpp_api/solver.rst cpp_api/random.rst - cpp_api/distance.rst cpp_api/sparse.rst cpp_api/stats.rst \ No newline at end of file From 63e2e8bdaa1bc71f41bc59c46f86bf61e9511b6a Mon Sep 17 00:00:00 2001 From: "Corey J. Nolet" Date: Thu, 20 Oct 2022 20:01:34 -0400 Subject: [PATCH 3/8] Updating docs --- cpp/include/raft/cluster/kmeans.cuh | 470 ++++++++++++++++++ cpp/include/raft/cluster/kmeans_types.hpp | 13 +- cpp/include/raft/cluster/single_linkage.cuh | 81 +++ .../raft/cluster/single_linkage_types.hpp | 8 + docs/source/cpp_api/cluster.rst | 17 +- docs/source/cpp_api/core.rst | 63 ++- docs/source/cpp_api/solver.rst | 5 +- 7 files changed, 647 insertions(+), 10 deletions(-) diff --git a/cpp/include/raft/cluster/kmeans.cuh b/cpp/include/raft/cluster/kmeans.cuh index 0ce35da4a5..d737b1b736 100644 --- a/cpp/include/raft/cluster/kmeans.cuh +++ b/cpp/include/raft/cluster/kmeans.cuh @@ -21,6 +21,476 @@ #include #include +namespace raft::cluster::kmeans { + +/** + * @brief Find clusters with k-means algorithm. + * Initial centroids are chosen with k-means++ algorithm. Empty + * clusters are reinitialized by choosing new centroids with + * k-means++ algorithm. + * @tparam DataT the type of data used for weights, distances. + * @tparam IndexT the type of data used for indexing. + * @param[in] handle The raft handle. + * @param[in] params Parameters for KMeans model. + * @param[in] X Training instances to cluster. The data must + * be in row-major format. + * [dim = n_samples x n_features] + * @param[in] sample_weight Optional weights for each observation in X. + * [len = n_samples] + * @param[inout] centroids [in] When init is InitMethod::Array, use + * centroids as the initial cluster centers. + * [out] The generated centroids from the + * kmeans algorithm are stored at the address + * pointed by 'centroids'. + * [dim = n_clusters x n_features] + * @param[out] inertia Sum of squared distances of samples to their + * closest cluster center. + * @param[out] n_iter Number of iterations run. + */ +template +void fit(handle_t const& handle, + const KMeansParams& params, + raft::device_matrix_view X, + std::optional> sample_weight, + raft::device_matrix_view centroids, + raft::host_scalar_view inertia, + raft::host_scalar_view n_iter) +{ + detail::kmeans_fit(handle, params, X, sample_weight, centroids, inertia, n_iter); +} + +template +void fit(handle_t const& handle, + const KMeansParams& params, + const DataT* X, + const DataT* sample_weight, + DataT* centroids, + IndexT n_samples, + IndexT n_features, + DataT& inertia, + IndexT& n_iter) +{ + detail::kmeans_fit( + handle, params, X, sample_weight, centroids, n_samples, n_features, inertia, n_iter); +} + +/** + * @brief Predict the closest cluster each sample in X belongs to. + * @tparam DataT the type of data used for weights, distances. + * @tparam IndexT the type of data used for indexing. + * @param[in] handle The raft handle. + * @param[in] params Parameters for KMeans model. + * @param[in] X New data to predict. + * [dim = n_samples x n_features] + * @param[in] sample_weight Optional weights for each observation in X. + * [len = n_samples] + * @param[in] centroids Cluster centroids. The data must be in + * row-major format. + * [dim = n_clusters x n_features] + * @param[in] normalize_weight True if the weights should be normalized + * @param[out] labels Index of the cluster each sample in X + * belongs to. + * [len = n_samples] + * @param[out] inertia Sum of squared distances of samples to + * their closest cluster center. + */ +template +void predict(handle_t const& handle, + const KMeansParams& params, + raft::device_matrix_view X, + std::optional> sample_weight, + raft::device_matrix_view centroids, + raft::device_vector_view labels, + bool normalize_weight, + raft::host_scalar_view inertia) +{ + detail::kmeans_predict( + handle, params, X, sample_weight, centroids, labels, normalize_weight, inertia); +} + +template +void predict(handle_t const& handle, + const KMeansParams& params, + const DataT* X, + const DataT* sample_weight, + const DataT* centroids, + IndexT n_samples, + IndexT n_features, + IndexT* labels, + bool normalize_weight, + DataT& inertia) +{ + detail::kmeans_predict(handle, + params, + X, + sample_weight, + centroids, + n_samples, + n_features, + labels, + normalize_weight, + inertia); +} + +/** + * @brief Compute k-means clustering and predicts cluster index for each sample + * in the input. + * + * @tparam DataT the type of data used for weights, distances. + * @tparam IndexT the type of data used for indexing. + * @param[in] handle The raft handle. + * @param[in] params Parameters for KMeans model. + * @param[in] X Training instances to cluster. The data must be + * in row-major format. + * [dim = n_samples x n_features] + * @param[in] sample_weight Optional weights for each observation in X. + * [len = n_samples] + * @param[inout] centroids Optional + * [in] When init is InitMethod::Array, use + * centroids as the initial cluster centers + * [out] The generated centroids from the + * kmeans algorithm are stored at the address + * pointed by 'centroids'. + * [dim = n_clusters x n_features] + * @param[out] labels Index of the cluster each sample in X belongs + * to. + * [len = n_samples] + * @param[out] inertia Sum of squared distances of samples to their + * closest cluster center. + * @param[out] n_iter Number of iterations run. + */ +template +void fit_predict(handle_t const& handle, + const KMeansParams& params, + raft::device_matrix_view X, + std::optional> sample_weight, + std::optional> centroids, + raft::device_vector_view labels, + raft::host_scalar_view inertia, + raft::host_scalar_view n_iter) +{ + detail::kmeans_fit_predict( + handle, params, X, sample_weight, centroids, labels, inertia, n_iter); +} + +template +void fit_predict(handle_t const& handle, + const KMeansParams& params, + const DataT* X, + const DataT* sample_weight, + DataT* centroids, + IndexT n_samples, + IndexT n_features, + IndexT* labels, + DataT& inertia, + IndexT& n_iter) +{ + detail::kmeans_fit_predict( + handle, params, X, sample_weight, centroids, n_samples, n_features, labels, inertia, n_iter); +} + +/** + * @brief Transform X to a cluster-distance space. + * + * @tparam DataT the type of data used for weights, distances. + * @tparam IndexT the type of data used for indexing. + * @param[in] handle The raft handle. + * @param[in] params Parameters for KMeans model. + * @param[in] X Training instances to cluster. The data must + * be in row-major format + * [dim = n_samples x n_features] + * @param[in] centroids Cluster centroids. The data must be in row-major format. + * [dim = n_clusters x n_features] + * @param[out] X_new X transformed in the new space. + * [dim = n_samples x n_features] + */ +template +void transform(const raft::handle_t& handle, + const KMeansParams& params, + raft::device_matrix_view X, + raft::device_matrix_view centroids, + raft::device_matrix_view X_new) +{ + detail::kmeans_transform(handle, params, X, centroids, X_new); +} + +template +void transform(const raft::handle_t& handle, + const KMeansParams& params, + const DataT* X, + const DataT* centroids, + IndexT n_samples, + IndexT n_features, + DataT* X_new) +{ + detail::kmeans_transform( + handle, params, X, centroids, n_samples, n_features, X_new); +} + +template +using SamplingOp = detail::SamplingOp; + +template +using KeyValueIndexOp = detail::KeyValueIndexOp; + +/** + * @brief Select centroids according to a sampling operation + * + * @tparam DataT the type of data used for weights, distances. + * @tparam IndexT the type of data used for indexing. + * + * @param[in] handle The raft handle + * @param[in] X The data in row-major format + * [dim = n_samples x n_features] + * @param[in] minClusterDistance Distance for every sample to it's nearest centroid + * [dim = n_samples] + * @param[in] isSampleCentroid Flag the sample choosen as initial centroid + * [dim = n_samples] + * @param[in] select_op The sampling operation used to select the centroids + * @param[out] inRankCp The sampled centroids + * [dim = n_selected_centroids x n_features] + * @param[in] workspace Temporary workspace buffer which can get resized + * + */ +template +void sample_centroids(const raft::handle_t& handle, + const raft::device_matrix_view& X, + const raft::device_vector_view& minClusterDistance, + const raft::device_vector_view& isSampleCentroid, + SamplingOp& select_op, + rmm::device_uvector& inRankCp, + rmm::device_uvector& workspace) +{ + detail::sampleCentroids( + handle, X, minClusterDistance, isSampleCentroid, select_op, inRankCp, workspace); +} + +/** + * @brief Compute cluster cost + * + * @tparam DataT the type of data used for weights, distances. + * @tparam ReductionOpT the type of data used for the reduction operation. + * + * @param[in] handle The raft handle + * @param[in] minClusterDistance Distance for every sample to it's nearest centroid + * [dim = n_samples] + * @param[in] workspace Temporary workspace buffer which can get resized + * @param[out] clusterCost Resulting cluster cost + * @param[in] reduction_op The reduction operation used for the cost + * + */ +template +void cluster_cost(const raft::handle_t& handle, + const raft::device_vector_view& minClusterDistance, + rmm::device_uvector& workspace, + const raft::device_scalar_view& clusterCost, + ReductionOpT reduction_op) +{ + detail::computeClusterCost( + handle, minClusterDistance, workspace, clusterCost, reduction_op); +} + +/** + * @brief Compute distance for every sample to it's nearest centroid + * + * @tparam DataT the type of data used for weights, distances. + * @tparam IndexT the type of data used for indexing. + * + * @param[in] handle The raft handle + * @param[in] params The parameters for KMeans + * @param[in] X The data in row-major format + * [dim = n_samples x n_features] + * @param[in] centroids Centroids data + * [dim = n_cluster x n_features] + * @param[out] minClusterDistance Distance for every sample to it's nearest centroid + * [dim = n_samples] + * @param[in] L2NormX L2 norm of X : ||x||^2 + * [dim = n_samples] + * @param[out] L2NormBuf_OR_DistBuf Resizable buffer to store L2 norm of centroids or distance + * matrix + * @param[in] workspace Temporary workspace buffer which can get resized + * + */ +template +void min_cluster_distance_compute(const raft::handle_t& handle, + const KMeansParams& params, + const raft::device_matrix_view& X, + const raft::device_matrix_view& centroids, + const raft::device_vector_view& minClusterDistance, + const raft::device_vector_view& L2NormX, + rmm::device_uvector& L2NormBuf_OR_DistBuf, + rmm::device_uvector& workspace) +{ + detail::minClusterDistanceCompute( + handle, params, X, centroids, minClusterDistance, L2NormX, L2NormBuf_OR_DistBuf, workspace); +} + +/** + * @brief Calculates a pair for every sample in input 'X' where key is an + * index of one of the 'centroids' (index of the nearest centroid) and 'value' + * is the distance between the sample and the 'centroid[key]' + * + * @tparam DataT the type of data used for weights, distances. + * @tparam IndexT the type of data used for indexing. + * + * @param[in] handle The raft handle + * @param[in] params The parameters for KMeans + * @param[in] X The data in row-major format + * [dim = n_samples x n_features] + * @param[in] centroids Centroids data + * [dim = n_cluster x n_features] + * @param[out] minClusterAndDistance Distance vector that contains for every sample, the nearest + * centroid and it's distance + * [dim = n_samples] + * @param[in] L2NormX L2 norm of X : ||x||^2 + * [dim = n_samples] + * @param[out] L2NormBuf_OR_DistBuf Resizable buffer to store L2 norm of centroids or distance + * matrix + * @param[in] workspace Temporary workspace buffer which can get resized + * + */ +template +void min_cluster_and_distance( + const raft::handle_t& handle, + const KMeansParams& params, + const raft::device_matrix_view X, + const raft::device_matrix_view centroids, + const raft::device_vector_view, IndexT>& minClusterAndDistance, + const raft::device_vector_view& L2NormX, + rmm::device_uvector& L2NormBuf_OR_DistBuf, + rmm::device_uvector& workspace) +{ + detail::minClusterAndDistanceCompute( + handle, params, X, centroids, minClusterAndDistance, L2NormX, L2NormBuf_OR_DistBuf, workspace); +} + +/** + * @brief Shuffle and randomly select 'n_samples_to_gather' from input 'in' and stores + * in 'out' does not modify the input + * + * @tparam DataT the type of data used for weights, distances. + * @tparam IndexT the type of data used for indexing. + * + * @param[in] handle The raft handle + * @param[in] in The data to shuffle and gather + * [dim = n_samples x n_features] + * @param[out] out The sampled data + * [dim = n_samples_to_gather x n_features] + * @param[in] n_samples_to_gather Number of sample to gather + * @param[in] seed Seed for the shuffle + * @param[in] workspace Temporary workspace buffer which can get resized + * + */ +template +void shuffle_and_gather(const raft::handle_t& handle, + const raft::device_matrix_view& in, + const raft::device_matrix_view& out, + uint32_t n_samples_to_gather, + uint64_t seed, + rmm::device_uvector* workspace = nullptr) +{ + detail::shuffleAndGather(handle, in, out, n_samples_to_gather, seed, workspace); +} + +/** + * @brief Count the number of samples in each cluster + * + * @tparam DataT the type of data used for weights, distances. + * @tparam IndexT the type of data used for indexing. + * + * @param[in] handle The raft handle + * @param[in] params The parameters for KMeans + * @param[in] X The data in row-major format + * [dim = n_samples x n_features] + * @param[in] L2NormX L2 norm of X : ||x||^2 + * [dim = n_samples] + * @param[in] centroids Centroids data + * [dim = n_cluster x n_features] + * @param[in] workspace Temporary workspace buffer which can get resized + * @param[out] sampleCountInCluster The count for each centroid + * [dim = n_cluster] + * + */ +template +void count_samples_in_cluster(const raft::handle_t& handle, + const KMeansParams& params, + const raft::device_matrix_view& X, + const raft::device_vector_view& L2NormX, + const raft::device_matrix_view& centroids, + rmm::device_uvector& workspace, + const raft::device_vector_view& sampleCountInCluster) +{ + detail::countSamplesInCluster( + handle, params, X, L2NormX, centroids, workspace, sampleCountInCluster); +} + +/* + * @brief Selects 'n_clusters' samples from the input X using kmeans++ algorithm. + + * @note This is the algorithm described in + * "k-means++: the advantages of careful seeding". 2007, Arthur, D. and Vassilvitskii, S. + * ACM-SIAM symposium on Discrete algorithms. + * + * @tparam DataT the type of data used for weights, distances. + * @tparam IndexT the type of data used for indexing. + * + * @param[in] handle The raft handle + * @param[in] params The parameters for KMeans + * @param[in] X The data in row-major format + * [dim = n_samples x n_features] + * @param[out] centroids Centroids data + * [dim = n_cluster x n_features] + * @param[in] workspace Temporary workspace buffer which can get resized + */ +template +void init_plus_plus(const raft::handle_t& handle, + const KMeansParams& params, + const raft::device_matrix_view& X, + const raft::device_matrix_view& centroidsRawData, + rmm::device_uvector& workspace) +{ + detail::kmeansPlusPlus(handle, params, X, centroidsRawData, workspace); +} + +/* + * @brief Main function used to fit KMeans (after cluster initialization) + * + * @tparam DataT the type of data used for weights, distances. + * @tparam IndexT the type of data used for indexing. + * + * @param[in] handle The raft handle. + * @param[in] params Parameters for KMeans model. + * @param[in] X Training instances to cluster. The data must + * be in row-major format. + * [dim = n_samples x n_features] + * @param[in] sample_weight Weights for each observation in X. + * [len = n_samples] + * @param[inout] centroids [in] Initial cluster centers. + * [out] The generated centroids from the + * kmeans algorithm are stored at the address + * pointed by 'centroids'. + * [dim = n_clusters x n_features] + * @param[out] inertia Sum of squared distances of samples to their + * closest cluster center. + * @param[out] n_iter Number of iterations run. + * @param[in] workspace Temporary workspace buffer which can get resized + */ +template +void fit_main(const raft::handle_t& handle, + const KMeansParams& params, + const raft::device_matrix_view& X, + const raft::device_vector_view& weight, + const raft::device_matrix_view& centroidsRawData, + const raft::host_scalar_view& inertia, + const raft::host_scalar_view& n_iter, + rmm::device_uvector& workspace) +{ + detail::kmeans_fit_main( + handle, params, X, weight, centroidsRawData, inertia, n_iter, workspace); +} + +} // end namespace raft::cluster::kmeans + namespace raft::cluster { /** * @brief Find clusters with k-means algorithm. diff --git a/cpp/include/raft/cluster/kmeans_types.hpp b/cpp/include/raft/cluster/kmeans_types.hpp index 87fc7c1880..bb8e1a2b73 100644 --- a/cpp/include/raft/cluster/kmeans_types.hpp +++ b/cpp/include/raft/cluster/kmeans_types.hpp @@ -18,8 +18,9 @@ #include #include -namespace raft { -namespace cluster { +namespace raft::cluster { + +namespace kmeans { struct KMeansParams { enum InitMethod { KMeansPlusPlus, Random, Array }; @@ -69,5 +70,9 @@ struct KMeansParams { bool inertia_check = false; }; -} // namespace cluster -} // namespace raft + +} // namespace kmeans + +using kmeans::KMeansParams; + +} // namespace raft::cluster diff --git a/cpp/include/raft/cluster/single_linkage.cuh b/cpp/include/raft/cluster/single_linkage.cuh index 8e33b8389d..ca2234f01f 100644 --- a/cpp/include/raft/cluster/single_linkage.cuh +++ b/cpp/include/raft/cluster/single_linkage.cuh @@ -21,6 +21,87 @@ namespace raft::cluster { +namespace hierarchy { +constexpr int DEFAULT_CONST_C = 15; + +/** + * Single-linkage clustering, capable of constructing a KNN graph to + * scale the algorithm beyond the n^2 memory consumption of implementations + * that use the fully-connected graph of pairwise distances by connecting + * a knn graph when k is not large enough to connect it. + + * @tparam value_idx + * @tparam value_t + * @tparam dist_type method to use for constructing connectivities graph + * @param[in] handle raft handle + * @param[in] X dense input matrix in row-major layout + * @param[in] m number of rows in X + * @param[in] n number of columns in X + * @param[in] metric distance metrix to use when constructing connectivities graph + * @param[out] out struct containing output dendrogram and cluster assignments + * @param[in] c a constant used when constructing connectivities from knn graph. Allows the indirect + control + * of k. The algorithm will set `k = log(n) + c` + * @param[in] n_clusters number of clusters to assign data samples + */ +template +void single_linkage(const raft::handle_t& handle, + const value_t* X, + size_t m, + size_t n, + raft::distance::DistanceType metric, + linkage_output* out, + int c, + size_t n_clusters) +{ + detail::single_linkage( + handle, X, m, n, metric, out, c, n_clusters); +} + +/** + * Single-linkage clustering, capable of constructing a KNN graph to + * scale the algorithm beyond the n^2 memory consumption of implementations + * that use the fully-connected graph of pairwise distances by connecting + * a knn graph when k is not large enough to connect it. + + * @tparam value_idx + * @tparam value_t + * @tparam dist_type method to use for constructing connectivities graph + * @param[in] handle raft handle + * @param[in] X dense input matrix in row-major layout + * @param[out] dendrogram output dendrogram (size [n_rows - 1] * 2) + * @param[out] labels output labels vector (size n_rows) + * @param[in] metric distance metrix to use when constructing connectivities graph + * @param[in] n_clusters number of clusters to assign data samples + * @param[in] c a constant used when constructing connectivities from knn graph. Allows the indirect + control of k. The algorithm will set `k = log(n) + c` + */ +template +void single_linkage(const raft::handle_t& handle, + raft::device_matrix_view X, + raft::device_matrix_view dendrogram, + raft::device_vector_view labels, + raft::distance::DistanceType metric, + size_t n_clusters, + std::optional c = std::make_optional(DEFAULT_CONST_C)) +{ + linkage_output out_arrs; + out_arrs.children = dendrogram.data_handle(); + out_arrs.labels = labels.data_handle(); + + single_linkage(handle, + X.data_handle(), + static_cast(X.extent(0)), + static_cast(X.extent(1)), + metric, + &out_arrs, + c.has_value() ? c.value() : DEFAULT_CONST_C, + n_clusters); +} +} // namespace hierarchy + constexpr int DEFAULT_CONST_C = 15; /** diff --git a/cpp/include/raft/cluster/single_linkage_types.hpp b/cpp/include/raft/cluster/single_linkage_types.hpp index 79f2ede482..28b245a2cf 100644 --- a/cpp/include/raft/cluster/single_linkage_types.hpp +++ b/cpp/include/raft/cluster/single_linkage_types.hpp @@ -20,6 +20,7 @@ namespace raft::cluster { +namespace hierarchy { enum LinkageDistance { PAIRWISE = 0, KNN_GRAPH = 1 }; /** @@ -58,4 +59,11 @@ class linkage_output_int : public linkage_output { class linkage_output_int64 : public linkage_output { }; +} // end namespace hierarchy + +using hierarchy::linkage_output; +using hierarchy::linkage_output_int; +using hierarchy::linkage_output_int64; +using hierarchy::LinkageDistance; + }; // namespace raft::cluster \ No newline at end of file diff --git a/docs/source/cpp_api/cluster.rst b/docs/source/cpp_api/cluster.rst index 781180a72a..41816482cc 100644 --- a/docs/source/cpp_api/cluster.rst +++ b/docs/source/cpp_api/cluster.rst @@ -3,10 +3,25 @@ Cluster This page provides C++ class references for the publicly-exposed elements of the cluster package. -.. doxygennamespace:: raft::cluster +K-Means +------- + +.. doxygennamespace:: raft::cluster::kmeans + :project: RAFT + :members: + + +Hierarchical Clustering +----------------------- + +.. doxygennamespace:: raft::cluster::hierarchy :project: RAFT :members: + +Spectral Clustering +------------------- + .. doxygennamespace:: raft::spectral :project: RAFT :members: \ No newline at end of file diff --git a/docs/source/cpp_api/core.rst b/docs/source/cpp_api/core.rst index ef6270556e..d4891bf0b3 100644 --- a/docs/source/cpp_api/core.rst +++ b/docs/source/cpp_api/core.rst @@ -4,7 +4,6 @@ Core This page provides C++ class references for the publicly-exposed elements of the core package. - handle_t ######## @@ -20,6 +19,13 @@ interruptible :project: RAFT :members: +NVTX +#### + +.. doxygennamespace:: raft::common::nvtx + :project: RAFT + :members: + mdarray ####### @@ -28,11 +34,64 @@ mdarray :project: RAFT :members: +.. doxygenclass:: raft::make_device_matrix + :project: RAFT + +.. doxygenclass:: raft::make_device_vector + :project: RAFT + +.. doxygenclass:: raft::make_device_scalar + :project: RAFT + +.. doxygenclass:: raft::make_host_matrix + :project: RAFT + +.. doxygenclass:: raft::make_host_vector + :project: RAFT + +.. doxygenclass:: raft::make_device_scalar + :project: RAFT + + +mdspan +####### + +.. doxygenfunction:: raft::make_device_mdspan + :project: RAFT + +.. doxygenfunction:: raft::make_device_matrix_view + :project: RAFT + +.. doxygenfunction:: raft::make_device_vector_view + :project: RAFT + +.. doxygenfunction:: raft::make_device_scalar_view + :project: RAFT + +.. doxygenfunction:: raft::make_host_matrix_view + :project: RAFT + +.. doxygenfunction:: raft::make_host_vector_view + :project: RAFT + +.. doxygenfunction:: raft::make_device_scalar_view + :project: RAFT span #### -.. doxygenclass:: raft::span +.. doxygenclass:: raft::device_span + :project: RAFT + :members: + +.. doxygenclass:: raft::host_span + :project: RAFT + :members: + +Key-Value Pair +############## + +.. doxygenclass:: raft::KeyValuePair :project: RAFT :members: diff --git a/docs/source/cpp_api/solver.rst b/docs/source/cpp_api/solver.rst index 75cec2494e..a8b93ca046 100644 --- a/docs/source/cpp_api/solver.rst +++ b/docs/source/cpp_api/solver.rst @@ -7,13 +7,12 @@ This page provides C++ class references for the publicly-exposed elements of the Linear Assignment Problem ######################### -.. doxygenclass:: raft::lap::LinearAssignmentProblem +.. doxygenclass:: raft::solver::LinearAssignmentProblem :project: RAFT :members: Minimum Spanning Tree ##################### -.. doxygennamespace:: raft::mst +.. doxygenfunction:: raft::sparse::solver::mst :project: RAFT - :members: From 831c3d244dcb7c428a5f2e63ad964e265c87575d Mon Sep 17 00:00:00 2001 From: "Corey J. Nolet" Date: Thu, 20 Oct 2022 20:29:15 -0400 Subject: [PATCH 4/8] Making sure we call new cluster namespaced code from deprecated code to spot any bugs/syntax issues --- cpp/include/raft/cluster/kmeans.cuh | 71 ++++++++++----------- cpp/include/raft/cluster/single_linkage.cuh | 20 ++---- 2 files changed, 39 insertions(+), 52 deletions(-) diff --git a/cpp/include/raft/cluster/kmeans.cuh b/cpp/include/raft/cluster/kmeans.cuh index d737b1b736..6384cfdeaa 100644 --- a/cpp/include/raft/cluster/kmeans.cuh +++ b/cpp/include/raft/cluster/kmeans.cuh @@ -312,14 +312,14 @@ void cluster_cost(const raft::handle_t& handle, * */ template -void min_cluster_distance_compute(const raft::handle_t& handle, - const KMeansParams& params, - const raft::device_matrix_view& X, - const raft::device_matrix_view& centroids, - const raft::device_vector_view& minClusterDistance, - const raft::device_vector_view& L2NormX, - rmm::device_uvector& L2NormBuf_OR_DistBuf, - rmm::device_uvector& workspace) +void min_cluster_distance(const raft::handle_t& handle, + const KMeansParams& params, + const raft::device_matrix_view& X, + const raft::device_matrix_view& centroids, + const raft::device_vector_view& minClusterDistance, + const raft::device_vector_view& L2NormX, + rmm::device_uvector& L2NormBuf_OR_DistBuf, + rmm::device_uvector& workspace) { detail::minClusterDistanceCompute( handle, params, X, centroids, minClusterDistance, L2NormX, L2NormBuf_OR_DistBuf, workspace); @@ -525,7 +525,7 @@ void kmeans_fit(handle_t const& handle, raft::host_scalar_view inertia, raft::host_scalar_view n_iter) { - detail::kmeans_fit(handle, params, X, sample_weight, centroids, inertia, n_iter); + kmeans::fit(handle, params, X, sample_weight, centroids, inertia, n_iter); } template @@ -539,7 +539,7 @@ void kmeans_fit(handle_t const& handle, DataT& inertia, IndexT& n_iter) { - detail::kmeans_fit( + kmeans::fit( handle, params, X, sample_weight, centroids, n_samples, n_features, inertia, n_iter); } @@ -573,7 +573,7 @@ void kmeans_predict(handle_t const& handle, bool normalize_weight, raft::host_scalar_view inertia) { - detail::kmeans_predict( + kmeans::predict( handle, params, X, sample_weight, centroids, labels, normalize_weight, inertia); } @@ -589,16 +589,16 @@ void kmeans_predict(handle_t const& handle, bool normalize_weight, DataT& inertia) { - detail::kmeans_predict(handle, - params, - X, - sample_weight, - centroids, - n_samples, - n_features, - labels, - normalize_weight, - inertia); + kmeans::predict(handle, + params, + X, + sample_weight, + centroids, + n_samples, + n_features, + labels, + normalize_weight, + inertia); } /** @@ -638,7 +638,7 @@ void kmeans_fit_predict(handle_t const& handle, raft::host_scalar_view inertia, raft::host_scalar_view n_iter) { - detail::kmeans_fit_predict( + kmeans::fit_predict( handle, params, X, sample_weight, centroids, labels, inertia, n_iter); } @@ -654,7 +654,7 @@ void kmeans_fit_predict(handle_t const& handle, DataT& inertia, IndexT& n_iter) { - detail::kmeans_fit_predict( + kmeans::fit_predict( handle, params, X, sample_weight, centroids, n_samples, n_features, labels, inertia, n_iter); } @@ -680,7 +680,7 @@ void kmeans_transform(const raft::handle_t& handle, raft::device_matrix_view centroids, raft::device_matrix_view X_new) { - detail::kmeans_transform(handle, params, X, centroids, X_new); + kmeans::transform(handle, params, X, centroids, X_new); } template @@ -692,15 +692,14 @@ void kmeans_transform(const raft::handle_t& handle, IndexT n_features, DataT* X_new) { - detail::kmeans_transform( - handle, params, X, centroids, n_samples, n_features, X_new); + kmeans::transform(handle, params, X, centroids, n_samples, n_features, X_new); } template -using SamplingOp = detail::SamplingOp; +using SamplingOp = kmeans::SamplingOp; template -using KeyValueIndexOp = detail::KeyValueIndexOp; +using KeyValueIndexOp = kmeans::KeyValueIndexOp; /** * @brief Select centroids according to a sampling operation @@ -730,7 +729,7 @@ void sampleCentroids(const raft::handle_t& handle, rmm::device_uvector& inRankCp, rmm::device_uvector& workspace) { - detail::sampleCentroids( + kmeans::sample_entroids( handle, X, minClusterDistance, isSampleCentroid, select_op, inRankCp, workspace); } @@ -755,7 +754,7 @@ void computeClusterCost(const raft::handle_t& handle, const raft::device_scalar_view& clusterCost, ReductionOpT reduction_op) { - detail::computeClusterCost( + kmeans::cluster_cost( handle, minClusterDistance, workspace, clusterCost, reduction_op); } @@ -790,7 +789,7 @@ void minClusterDistanceCompute(const raft::handle_t& handle, rmm::device_uvector& L2NormBuf_OR_DistBuf, rmm::device_uvector& workspace) { - detail::minClusterDistanceCompute( + kmeans::min_cluster_distance( handle, params, X, centroids, minClusterDistance, L2NormX, L2NormBuf_OR_DistBuf, workspace); } @@ -829,7 +828,7 @@ void minClusterAndDistanceCompute( rmm::device_uvector& L2NormBuf_OR_DistBuf, rmm::device_uvector& workspace) { - detail::minClusterAndDistanceCompute( + kmeans::min_cluster_and_distance( handle, params, X, centroids, minClusterAndDistance, L2NormX, L2NormBuf_OR_DistBuf, workspace); } @@ -858,7 +857,7 @@ void shuffleAndGather(const raft::handle_t& handle, uint64_t seed, rmm::device_uvector* workspace = nullptr) { - detail::shuffleAndGather(handle, in, out, n_samples_to_gather, seed, workspace); + kmeans::shuffle_and_gather(handle, in, out, n_samples_to_gather, seed, workspace); } /** @@ -889,7 +888,7 @@ void countSamplesInCluster(const raft::handle_t& handle, rmm::device_uvector& workspace, const raft::device_vector_view& sampleCountInCluster) { - detail::countSamplesInCluster( + kmeans::count_samples_in_cluster( handle, params, X, L2NormX, centroids, workspace, sampleCountInCluster); } @@ -918,7 +917,7 @@ void kmeansPlusPlus(const raft::handle_t& handle, const raft::device_matrix_view& centroidsRawData, rmm::device_uvector& workspace) { - detail::kmeansPlusPlus(handle, params, X, centroidsRawData, workspace); + kmeans::init_plus_plus(handle, params, X, centroidsRawData, workspace); } /* @@ -954,7 +953,7 @@ void kmeans_fit_main(const raft::handle_t& handle, const raft::host_scalar_view& n_iter, rmm::device_uvector& workspace) { - detail::kmeans_fit_main( + kmeans::fit_main( handle, params, X, weight, centroidsRawData, inertia, n_iter, workspace); } } // namespace raft::cluster diff --git a/cpp/include/raft/cluster/single_linkage.cuh b/cpp/include/raft/cluster/single_linkage.cuh index ca2234f01f..36fc812445 100644 --- a/cpp/include/raft/cluster/single_linkage.cuh +++ b/cpp/include/raft/cluster/single_linkage.cuh @@ -102,8 +102,6 @@ void single_linkage(const raft::handle_t& handle, } } // namespace hierarchy -constexpr int DEFAULT_CONST_C = 15; - /** * Single-linkage clustering, capable of constructing a KNN graph to * scale the algorithm beyond the n^2 memory consumption of implementations @@ -136,7 +134,7 @@ void single_linkage(const raft::handle_t& handle, int c, size_t n_clusters) { - detail::single_linkage( + hierarchy::single_linkage( handle, X, m, n, metric, out, c, n_clusters); } @@ -165,20 +163,10 @@ void single_linkage(const raft::handle_t& handle, raft::device_vector_view labels, raft::distance::DistanceType metric, size_t n_clusters, - std::optional c = std::make_optional(DEFAULT_CONST_C)) + std::optional c = std::make_optional(hierarchy::DEFAULT_CONST_C)) { - linkage_output out_arrs; - out_arrs.children = dendrogram.data_handle(); - out_arrs.labels = labels.data_handle(); - - single_linkage(handle, - X.data_handle(), - static_cast(X.extent(0)), - static_cast(X.extent(1)), - metric, - &out_arrs, - c.has_value() ? c.value() : DEFAULT_CONST_C, - n_clusters); + hierarchy::single_linkage( + handle, X, dendrogram, labels, metric, n_clusters, c); } }; // namespace raft::cluster From 31047e638b94316af12d8fcd1b7057bf1f9caf1d Mon Sep 17 00:00:00 2001 From: "Corey J. Nolet" Date: Thu, 20 Oct 2022 20:41:11 -0400 Subject: [PATCH 5/8] Deprecation warnings --- cpp/include/raft/cluster/single_linkage.cuh | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/cpp/include/raft/cluster/single_linkage.cuh b/cpp/include/raft/cluster/single_linkage.cuh index 36fc812445..0a79601647 100644 --- a/cpp/include/raft/cluster/single_linkage.cuh +++ b/cpp/include/raft/cluster/single_linkage.cuh @@ -102,6 +102,12 @@ void single_linkage(const raft::handle_t& handle, } } // namespace hierarchy +/** + * Note: All of the functions below in the raft::cluster namespace are deprecated + * and will be removed in a future release. Please use raft::cluster::hierarchy + * instead. + */ + /** * Single-linkage clustering, capable of constructing a KNN graph to * scale the algorithm beyond the n^2 memory consumption of implementations From fd8899ce7a2f5afa0066cacf83c919db20a9cee0 Mon Sep 17 00:00:00 2001 From: "Corey J. Nolet" Date: Thu, 20 Oct 2022 21:10:38 -0400 Subject: [PATCH 6/8] Fixing typo --- cpp/include/raft/cluster/kmeans.cuh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cpp/include/raft/cluster/kmeans.cuh b/cpp/include/raft/cluster/kmeans.cuh index 10004b69bf..cfd47d4058 100644 --- a/cpp/include/raft/cluster/kmeans.cuh +++ b/cpp/include/raft/cluster/kmeans.cuh @@ -735,7 +735,7 @@ void sampleCentroids(const raft::handle_t& handle, rmm::device_uvector& inRankCp, rmm::device_uvector& workspace) { - kmeans::sample_entroids( + kmeans::sample_centroids( handle, X, minClusterDistance, isSampleCentroid, select_op, inRankCp, workspace); } From 4968ce88263150065d0d13dead09a0b5b73f85e3 Mon Sep 17 00:00:00 2001 From: "Corey J. Nolet" Date: Thu, 20 Oct 2022 21:32:52 -0400 Subject: [PATCH 7/8] Fixing hierarchical compile error --- cpp/include/raft/cluster/single_linkage.cuh | 106 ++++-------------- .../raft/cluster/single_linkage_types.hpp | 16 ++- cpp/test/CMakeLists.txt | 2 +- cpp/test/{sparse => cluster}/linkage.cu | 21 ++-- 4 files changed, 39 insertions(+), 106 deletions(-) rename cpp/test/{sparse => cluster}/linkage.cu (98%) diff --git a/cpp/include/raft/cluster/single_linkage.cuh b/cpp/include/raft/cluster/single_linkage.cuh index 0a79601647..2d74c364b2 100644 --- a/cpp/include/raft/cluster/single_linkage.cuh +++ b/cpp/include/raft/cluster/single_linkage.cuh @@ -21,8 +21,11 @@ namespace raft::cluster { -namespace hierarchy { -constexpr int DEFAULT_CONST_C = 15; +/** + * Note: All of the functions below in the raft::cluster namespace are deprecated + * and will be removed in a future release. Please use raft::cluster::hierarchy + * instead. + */ /** * Single-linkage clustering, capable of constructing a KNN graph to @@ -59,6 +62,11 @@ void single_linkage(const raft::handle_t& handle, detail::single_linkage( handle, X, m, n, metric, out, c, n_clusters); } +}; // namespace raft::cluster + +namespace raft::cluster::hierarchy { + +constexpr int DEFAULT_CONST_C = 15; /** * Single-linkage clustering, capable of constructing a KNN graph to @@ -91,88 +99,14 @@ void single_linkage(const raft::handle_t& handle, out_arrs.children = dendrogram.data_handle(); out_arrs.labels = labels.data_handle(); - single_linkage(handle, - X.data_handle(), - static_cast(X.extent(0)), - static_cast(X.extent(1)), - metric, - &out_arrs, - c.has_value() ? c.value() : DEFAULT_CONST_C, - n_clusters); + raft::cluster::single_linkage( + handle, + X.data_handle(), + static_cast(X.extent(0)), + static_cast(X.extent(1)), + metric, + &out_arrs, + c.has_value() ? c.value() : DEFAULT_CONST_C, + n_clusters); } -} // namespace hierarchy - -/** - * Note: All of the functions below in the raft::cluster namespace are deprecated - * and will be removed in a future release. Please use raft::cluster::hierarchy - * instead. - */ - -/** - * Single-linkage clustering, capable of constructing a KNN graph to - * scale the algorithm beyond the n^2 memory consumption of implementations - * that use the fully-connected graph of pairwise distances by connecting - * a knn graph when k is not large enough to connect it. - - * @tparam value_idx - * @tparam value_t - * @tparam dist_type method to use for constructing connectivities graph - * @param[in] handle raft handle - * @param[in] X dense input matrix in row-major layout - * @param[in] m number of rows in X - * @param[in] n number of columns in X - * @param[in] metric distance metrix to use when constructing connectivities graph - * @param[out] out struct containing output dendrogram and cluster assignments - * @param[in] c a constant used when constructing connectivities from knn graph. Allows the indirect - control - * of k. The algorithm will set `k = log(n) + c` - * @param[in] n_clusters number of clusters to assign data samples - */ -template -void single_linkage(const raft::handle_t& handle, - const value_t* X, - size_t m, - size_t n, - raft::distance::DistanceType metric, - linkage_output* out, - int c, - size_t n_clusters) -{ - hierarchy::single_linkage( - handle, X, m, n, metric, out, c, n_clusters); -} - -/** - * Single-linkage clustering, capable of constructing a KNN graph to - * scale the algorithm beyond the n^2 memory consumption of implementations - * that use the fully-connected graph of pairwise distances by connecting - * a knn graph when k is not large enough to connect it. - - * @tparam value_idx - * @tparam value_t - * @tparam dist_type method to use for constructing connectivities graph - * @param[in] handle raft handle - * @param[in] X dense input matrix in row-major layout - * @param[out] dendrogram output dendrogram (size [n_rows - 1] * 2) - * @param[out] labels output labels vector (size n_rows) - * @param[in] metric distance metrix to use when constructing connectivities graph - * @param[in] n_clusters number of clusters to assign data samples - * @param[in] c a constant used when constructing connectivities from knn graph. Allows the indirect - control of k. The algorithm will set `k = log(n) + c` - */ -template -void single_linkage(const raft::handle_t& handle, - raft::device_matrix_view X, - raft::device_matrix_view dendrogram, - raft::device_vector_view labels, - raft::distance::DistanceType metric, - size_t n_clusters, - std::optional c = std::make_optional(hierarchy::DEFAULT_CONST_C)) -{ - hierarchy::single_linkage( - handle, X, dendrogram, labels, metric, n_clusters, c); -} - -}; // namespace raft::cluster +}; // namespace raft::cluster::hierarchy diff --git a/cpp/include/raft/cluster/single_linkage_types.hpp b/cpp/include/raft/cluster/single_linkage_types.hpp index 28b245a2cf..55239ff6d6 100644 --- a/cpp/include/raft/cluster/single_linkage_types.hpp +++ b/cpp/include/raft/cluster/single_linkage_types.hpp @@ -18,10 +18,15 @@ #include +namespace raft::cluster::hierarchy { +enum LinkageDistance { PAIRWISE = 0, KNN_GRAPH = 1 }; + +}; // end namespace raft::cluster::hierarchy + +// The code below is legacy namespace raft::cluster { -namespace hierarchy { -enum LinkageDistance { PAIRWISE = 0, KNN_GRAPH = 1 }; +using hierarchy::LinkageDistance; /** * Simple POCO for consolidating linkage results. This closely @@ -59,11 +64,4 @@ class linkage_output_int : public linkage_output { class linkage_output_int64 : public linkage_output { }; -} // end namespace hierarchy - -using hierarchy::linkage_output; -using hierarchy::linkage_output_int; -using hierarchy::linkage_output_int64; -using hierarchy::LinkageDistance; - }; // namespace raft::cluster \ No newline at end of file diff --git a/cpp/test/CMakeLists.txt b/cpp/test/CMakeLists.txt index 07ec85bf1e..0d5af9be5c 100644 --- a/cpp/test/CMakeLists.txt +++ b/cpp/test/CMakeLists.txt @@ -82,7 +82,7 @@ if(BUILD_TESTS) PATH test/cluster/kmeans.cu test/cluster_solvers.cu - test/sparse/linkage.cu + test/cluster/linkage.cu OPTIONAL DIST NN ) diff --git a/cpp/test/sparse/linkage.cu b/cpp/test/cluster/linkage.cu similarity index 98% rename from cpp/test/sparse/linkage.cu rename to cpp/test/cluster/linkage.cu index ce5741d06b..5533f552bd 100644 --- a/cpp/test/sparse/linkage.cu +++ b/cpp/test/cluster/linkage.cu @@ -180,20 +180,21 @@ class LinkageTest : public ::testing::TestWithParam> { raft::handle_t handle; - auto data_view = - raft::make_device_matrix_view(data.data(), params.n_row, params.n_col); + auto data_view = raft::make_device_matrix_view( + data.data(), params.n_row, params.n_col); auto dendrogram_view = raft::make_device_matrix_view(out_children.data(), params.n_row, 2); auto labels_view = raft::make_device_vector_view(labels.data(), params.n_row); - raft::cluster::single_linkage( - handle, - data_view, - dendrogram_view, - labels_view, - raft::distance::DistanceType::L2SqrtExpanded, - params.n_clusters, - std::make_optional(params.c)); + raft::cluster::hierarchy:: + single_linkage( + handle, + data_view, + dendrogram_view, + labels_view, + raft::distance::DistanceType::L2SqrtExpanded, + params.n_clusters, + std::make_optional(params.c)); handle.sync_stream(stream); From 6ccf61fbac6ae3d6eb6a098b9eb1e7ea4c77d27e Mon Sep 17 00:00:00 2001 From: "Corey J. Nolet" Date: Thu, 20 Oct 2022 22:03:46 -0400 Subject: [PATCH 8/8] Removing namespace conflict --- cpp/include/raft/cluster/kmeans.cuh | 4 +- cpp/include/raft/cluster/kmeans_types.hpp | 8 ++-- cpp/test/cluster_solvers_deprecated.cu | 48 ----------------------- 3 files changed, 6 insertions(+), 54 deletions(-) diff --git a/cpp/include/raft/cluster/kmeans.cuh b/cpp/include/raft/cluster/kmeans.cuh index cfd47d4058..2025a15ecf 100644 --- a/cpp/include/raft/cluster/kmeans.cuh +++ b/cpp/include/raft/cluster/kmeans.cuh @@ -489,7 +489,7 @@ void fit_main(const raft::handle_t& handle, handle, params, X, weight, centroidsRawData, inertia, n_iter, workspace); } -} // end namespace raft::cluster::kmeans +}; // end namespace raft::cluster::kmeans namespace raft::cluster { @@ -962,4 +962,4 @@ void kmeans_fit_main(const raft::handle_t& handle, kmeans::fit_main( handle, params, X, weight, centroidsRawData, inertia, n_iter, workspace); } -} // namespace raft::cluster +}; // namespace raft::cluster diff --git a/cpp/include/raft/cluster/kmeans_types.hpp b/cpp/include/raft/cluster/kmeans_types.hpp index bb8e1a2b73..d6eadd1ba6 100644 --- a/cpp/include/raft/cluster/kmeans_types.hpp +++ b/cpp/include/raft/cluster/kmeans_types.hpp @@ -18,9 +18,7 @@ #include #include -namespace raft::cluster { - -namespace kmeans { +namespace raft::cluster::kmeans { struct KMeansParams { enum InitMethod { KMeansPlusPlus, Random, Array }; @@ -71,7 +69,9 @@ struct KMeansParams { bool inertia_check = false; }; -} // namespace kmeans +} // namespace raft::cluster::kmeans + +namespace raft::cluster { using kmeans::KMeansParams; diff --git a/cpp/test/cluster_solvers_deprecated.cu b/cpp/test/cluster_solvers_deprecated.cu index 1e9ec0c15b..167a710b34 100644 --- a/cpp/test/cluster_solvers_deprecated.cu +++ b/cpp/test/cluster_solvers_deprecated.cu @@ -20,7 +20,6 @@ #include #include -#include namespace raft { namespace spectral { @@ -54,52 +53,5 @@ TEST(Raft, ClusterSolvers) EXPECT_ANY_THROW(cluster_solver.solve(h, n, d, eigvecs, codes)); } -TEST(Raft, ModularitySolvers) -{ - using namespace matrix; - using index_type = int; - using value_type = double; - - handle_t h; - ASSERT_EQ(0, - h. - - get_device() - - ); - - index_type neigvs{10}; - index_type maxiter{100}; - index_type restart_iter{10}; - value_type tol{1.0e-10}; - bool reorthog{true}; - - // nullptr expected to trigger exceptions: - // - index_type* clusters{nullptr}; - value_type* eigvals{nullptr}; - value_type* eigvecs{nullptr}; - - unsigned long long seed{100110021003}; - - eigen_solver_config_t eig_cfg{ - neigvs, maxiter, restart_iter, tol, reorthog, seed}; - lanczos_solver_t eig_solver{eig_cfg}; - - index_type k{5}; - - cluster_solver_config_deprecated_t clust_cfg{k, maxiter, tol, seed}; - kmeans_solver_deprecated_t cluster_solver{clust_cfg}; - - auto stream = h.get_stream(); - sparse_matrix_t sm{h, nullptr, nullptr, nullptr, 0, 0}; - - EXPECT_ANY_THROW(spectral::modularity_maximization( - h, sm, eig_solver, cluster_solver, clusters, eigvals, eigvecs)); - - value_type modularity{0}; - EXPECT_ANY_THROW(spectral::analyzeModularity(h, sm, k, clusters, modularity)); -} - } // namespace spectral } // namespace raft