From f9ce36f83a8803396d84eceab0e9b3a1706f8510 Mon Sep 17 00:00:00 2001 From: Yunsong Wang Date: Thu, 25 Jan 2024 14:11:48 -0800 Subject: [PATCH 1/6] Use new cuco_allocator --- .../cudf/detail/hash_reduce_by_row.cuh | 8 +-- cpp/include/cudf/detail/join.hpp | 11 ++-- .../cudf/hashing/detail/hash_allocator.cuh | 62 ------------------- cpp/src/hash/concurrent_unordered_map.cuh | 6 +- cpp/src/io/json/json_tree.cu | 11 ++-- cpp/src/join/hash_join.cu | 5 +- cpp/src/join/join_common_utils.hpp | 13 ++-- cpp/src/join/mixed_join.cu | 25 ++++---- cpp/src/join/mixed_join_semi.cu | 7 ++- cpp/src/reductions/histogram.cu | 13 ++-- cpp/src/search/contains_table.cu | 4 +- cpp/src/stream_compaction/distinct.cu | 4 +- cpp/src/stream_compaction/distinct_count.cu | 16 ++--- .../stream_compaction_common.hpp | 10 +-- cpp/src/text/bpe/byte_pair_encoding.cuh | 11 ++-- cpp/src/text/bpe/load_merge_pairs.cu | 33 +++++----- cpp/src/text/vocabulary_tokenize.cu | 12 ++-- 17 files changed, 85 insertions(+), 166 deletions(-) delete mode 100644 cpp/include/cudf/hashing/detail/hash_allocator.cuh diff --git a/cpp/include/cudf/detail/hash_reduce_by_row.cuh b/cpp/include/cudf/detail/hash_reduce_by_row.cuh index f63d1922950..006cb5142c9 100644 --- a/cpp/include/cudf/detail/hash_reduce_by_row.cuh +++ b/cpp/include/cudf/detail/hash_reduce_by_row.cuh @@ -1,5 +1,5 @@ /* - * Copyright (c) 2022-2023, NVIDIA CORPORATION. + * Copyright (c) 2022-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -14,7 +14,7 @@ * limitations under the License. */ -#include +#include #include #include #include @@ -22,7 +22,6 @@ #include #include #include -#include #include #include @@ -32,9 +31,8 @@ namespace cudf::detail { -using hash_table_allocator_type = rmm::mr::stream_allocator_adaptor>; using hash_map_type = - cuco::static_map; + cuco::static_map; /** * @brief The base struct for customized reduction functor to perform reduce-by-key with keys are diff --git a/cpp/include/cudf/detail/join.hpp b/cpp/include/cudf/detail/join.hpp index b69632c83ca..ad6269dae30 100644 --- a/cpp/include/cudf/detail/join.hpp +++ b/cpp/include/cudf/detail/join.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2022-2023, NVIDIA CORPORATION. + * Copyright (c) 2022-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -24,7 +24,6 @@ #include #include #include -#include #include @@ -33,9 +32,6 @@ #include // Forward declaration -template -class default_allocator; - namespace cudf::experimental::row::equality { class preprocessed_table; } @@ -43,6 +39,9 @@ class preprocessed_table; namespace cudf { namespace detail { +// Forward declaration +class cuco_allocator; + constexpr int DEFAULT_JOIN_CG_SIZE = 2; enum class join_kind { INNER_JOIN, LEFT_JOIN, FULL_JOIN, LEFT_SEMI_JOIN, LEFT_ANTI_JOIN }; @@ -62,7 +61,7 @@ struct hash_join { cuco::static_multimap>, + cudf::detail::cuco_allocator, cuco::double_hashing>; hash_join() = delete; diff --git a/cpp/include/cudf/hashing/detail/hash_allocator.cuh b/cpp/include/cudf/hashing/detail/hash_allocator.cuh deleted file mode 100644 index 64a2a852ae4..00000000000 --- a/cpp/include/cudf/hashing/detail/hash_allocator.cuh +++ /dev/null @@ -1,62 +0,0 @@ -/* - * Copyright (c) 2017-2023, NVIDIA CORPORATION. - * - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -#pragma once - -#include - -#include - -#include -#include -#include -#include - -template -struct default_allocator { - using value_type = T; - rmm::mr::device_memory_resource* mr = rmm::mr::get_current_device_resource(); - - default_allocator() = default; - - template - constexpr default_allocator(default_allocator const&) noexcept - { - } - - T* allocate(std::size_t n, rmm::cuda_stream_view stream = cudf::get_default_stream()) const - { - return static_cast(mr->allocate(n * sizeof(T), stream)); - } - - void deallocate(T* p, - std::size_t n, - rmm::cuda_stream_view stream = cudf::get_default_stream()) const - { - mr->deallocate(p, n * sizeof(T), stream); - } -}; - -template -bool operator==(default_allocator const&, default_allocator const&) -{ - return true; -} -template -bool operator!=(default_allocator const&, default_allocator const&) -{ - return false; -} diff --git a/cpp/src/hash/concurrent_unordered_map.cuh b/cpp/src/hash/concurrent_unordered_map.cuh index d773c2763df..adc87c2400e 100644 --- a/cpp/src/hash/concurrent_unordered_map.cuh +++ b/cpp/src/hash/concurrent_unordered_map.cuh @@ -1,5 +1,5 @@ /* - * Copyright (c) 2017-2023, NVIDIA CORPORATION. All rights reserved. + * Copyright (c) 2017-2024, NVIDIA CORPORATION. All rights reserved. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -20,12 +20,12 @@ #include #include -#include #include #include #include #include +#include #include @@ -117,7 +117,7 @@ template , typename Equality = equal_to, - typename Allocator = default_allocator>> + typename Allocator = rmm::mr::polymorphic_allocator>> class concurrent_unordered_map { public: using size_type = size_t; diff --git a/cpp/src/io/json/json_tree.cu b/cpp/src/io/json/json_tree.cu index 275907c19c9..db9daf28c06 100644 --- a/cpp/src/io/json/json_tree.cu +++ b/cpp/src/io/json/json_tree.cu @@ -17,12 +17,12 @@ #include "nested_json.hpp" #include +#include #include #include #include #include #include -#include #include #include #include @@ -31,7 +31,6 @@ #include #include #include -#include #include @@ -511,7 +510,6 @@ rmm::device_uvector hash_node_type_with_field_name(device_span>; auto const num_nodes = d_tree.node_categories.size(); auto const num_fields = thrust::count(rmm::exec_policy(stream), @@ -555,7 +553,7 @@ rmm::device_uvector hash_node_type_with_field_name(device_span{d_hasher}, - hash_table_allocator_type{default_allocator{}, stream}, + cudf::detail::cuco_allocator{stream}, stream.value()}; key_set.insert_if_async(iter, iter + num_nodes, @@ -735,15 +733,14 @@ std::pair, rmm::device_uvector> hash_n }; constexpr size_type empty_node_index_sentinel = -1; - using hash_table_allocator_type = rmm::mr::stream_allocator_adaptor>; - using hasher_type = decltype(d_hashed_cache); + using hasher_type = decltype(d_hashed_cache); auto key_set = cuco::experimental::static_set{ cuco::experimental::extent{compute_hash_table_size(num_nodes)}, cuco::empty_key{empty_node_index_sentinel}, d_equal, cuco::experimental::linear_probing<1, hasher_type>{d_hashed_cache}, - hash_table_allocator_type{default_allocator{}, stream}, + cudf::detail::cuco_allocator{stream}, stream.value()}; // insert and convert node ids to unique set ids diff --git a/cpp/src/join/hash_join.cu b/cpp/src/join/hash_join.cu index 453257ab228..17616818a58 100644 --- a/cpp/src/join/hash_join.cu +++ b/cpp/src/join/hash_join.cu @@ -1,5 +1,5 @@ /* - * Copyright (c) 2020-2023, NVIDIA CORPORATION. + * Copyright (c) 2020-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -19,6 +19,7 @@ #include #include #include +#include #include #include @@ -368,7 +369,7 @@ hash_join::hash_join(cudf::table_view const& build, cuco::empty_key{std::numeric_limits::max()}, cuco::empty_value{cudf::detail::JoinNoneValue}, stream.value(), - detail::hash_table_allocator_type{default_allocator{}, stream}}, + cudf::detail::cuco_allocator{stream}}, _build{build}, _preprocessed_build{ cudf::experimental::row::equality::preprocessed_table::create(_build, stream)} diff --git a/cpp/src/join/join_common_utils.hpp b/cpp/src/join/join_common_utils.hpp index e96505e5ed6..b88a4fdef58 100644 --- a/cpp/src/join/join_common_utils.hpp +++ b/cpp/src/join/join_common_utils.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2019-2023, NVIDIA CORPORATION. + * Copyright (c) 2019-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -15,16 +15,13 @@ */ #pragma once +#include #include #include -#include -#include #include #include #include -#include - #include #include @@ -43,8 +40,6 @@ using pair_type = cuco::pair; using hash_type = cuco::murmurhash3_32; -using hash_table_allocator_type = rmm::mr::stream_allocator_adaptor>; - using multimap_type = cudf::hash_join::impl_type::map_type; // Multimap type used for mixed joins. TODO: This is a temporary alias used @@ -53,11 +48,11 @@ using multimap_type = cudf::hash_join::impl_type::map_type; using mixed_multimap_type = cuco::static_multimap>; using semi_map_type = cuco:: - static_map; + static_map; using row_hash_legacy = cudf::row_hasher; diff --git a/cpp/src/join/mixed_join.cu b/cpp/src/join/mixed_join.cu index 3d902bf93b2..6223114fcd0 100644 --- a/cpp/src/join/mixed_join.cu +++ b/cpp/src/join/mixed_join.cu @@ -1,5 +1,5 @@ /* - * Copyright (c) 2022-2023, NVIDIA CORPORATION. + * Copyright (c) 2022-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -21,6 +21,7 @@ #include #include #include +#include #include #include #include @@ -127,12 +128,11 @@ mixed_join( auto build_view = table_device_view::create(build, stream); // Don't use multimap_type because we want a CG size of 1. - mixed_multimap_type hash_table{ - compute_hash_table_size(build.num_rows()), - cuco::empty_key{std::numeric_limits::max()}, - cuco::empty_value{cudf::detail::JoinNoneValue}, - stream.value(), - detail::hash_table_allocator_type{default_allocator{}, stream}}; + mixed_multimap_type hash_table{compute_hash_table_size(build.num_rows()), + cuco::empty_key{std::numeric_limits::max()}, + cuco::empty_value{cudf::detail::JoinNoneValue}, + stream.value(), + cudf::detail::cuco_allocator{stream}}; // TODO: To add support for nested columns we will need to flatten in many // places. However, this probably isn't worth adding any time soon since we @@ -393,12 +393,11 @@ compute_mixed_join_output_size(table_view const& left_equality, auto build_view = table_device_view::create(build, stream); // Don't use multimap_type because we want a CG size of 1. - mixed_multimap_type hash_table{ - compute_hash_table_size(build.num_rows()), - cuco::empty_key{std::numeric_limits::max()}, - cuco::empty_value{cudf::detail::JoinNoneValue}, - stream.value(), - detail::hash_table_allocator_type{default_allocator{}, stream}}; + mixed_multimap_type hash_table{compute_hash_table_size(build.num_rows()), + cuco::empty_key{std::numeric_limits::max()}, + cuco::empty_value{cudf::detail::JoinNoneValue}, + stream.value(), + cudf::detail::cuco_allocator{stream}}; // TODO: To add support for nested columns we will need to flatten in many // places. However, this probably isn't worth adding any time soon since we diff --git a/cpp/src/join/mixed_join_semi.cu b/cpp/src/join/mixed_join_semi.cu index f619ed0d558..edf6c32eadf 100644 --- a/cpp/src/join/mixed_join_semi.cu +++ b/cpp/src/join/mixed_join_semi.cu @@ -1,5 +1,5 @@ /* - * Copyright (c) 2022-2023, NVIDIA CORPORATION. + * Copyright (c) 2022-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -23,6 +23,7 @@ #include #include #include +#include #include #include #include @@ -172,7 +173,7 @@ std::unique_ptr> mixed_join_semi( semi_map_type hash_table{compute_hash_table_size(build.num_rows()), cuco::empty_key{std::numeric_limits::max()}, cuco::empty_value{cudf::detail::JoinNoneValue}, - detail::hash_table_allocator_type{default_allocator{}, stream}, + cudf::detail::cuco_allocator{stream}, stream.value()}; // Create hash table containing all keys found in right table @@ -433,7 +434,7 @@ compute_mixed_join_output_size_semi(table_view const& left_equality, semi_map_type hash_table{compute_hash_table_size(build.num_rows()), cuco::empty_key{std::numeric_limits::max()}, cuco::empty_value{cudf::detail::JoinNoneValue}, - detail::hash_table_allocator_type{default_allocator{}, stream}, + cudf::detail::cuco_allocator{stream}, stream.value()}; // Create hash table containing all keys found in right table diff --git a/cpp/src/reductions/histogram.cu b/cpp/src/reductions/histogram.cu index 218e2e57420..42ef266a684 100644 --- a/cpp/src/reductions/histogram.cu +++ b/cpp/src/reductions/histogram.cu @@ -1,5 +1,5 @@ /* - * Copyright (c) 2023, NVIDIA CORPORATION. + * Copyright (c) 2023-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -163,12 +163,11 @@ compute_row_frequencies(table_view const& input, "Nested types are not yet supported in histogram aggregation.", std::invalid_argument); - auto map = cudf::detail::hash_map_type{ - compute_hash_table_size(input.num_rows()), - cuco::empty_key{-1}, - cuco::empty_value{std::numeric_limits::min()}, - cudf::detail::hash_table_allocator_type{default_allocator{}, stream}, - stream.value()}; + auto map = cudf::detail::hash_map_type{compute_hash_table_size(input.num_rows()), + cuco::empty_key{-1}, + cuco::empty_value{std::numeric_limits::min()}, + cudf::detail::cuco_allocator{stream}, + stream.value()}; auto const preprocessed_input = cudf::experimental::row::hash::preprocessed_table::create(input, stream); diff --git a/cpp/src/search/contains_table.cu b/cpp/src/search/contains_table.cu index b8ece03c4a0..ce069abcb78 100644 --- a/cpp/src/search/contains_table.cu +++ b/cpp/src/search/contains_table.cu @@ -16,7 +16,9 @@ #include +#include #include +#include #include #include #include @@ -231,7 +233,7 @@ rmm::device_uvector contains(table_view const& haystack, cuco::empty_key{lhs_index_type{-1}}, d_equal, probing_scheme, - detail::hash_table_allocator_type{default_allocator{}, stream}, + cudf::detail::cuco_allocator{stream}, stream.value()}; if (haystack_has_nulls && compare_nulls == null_equality::UNEQUAL) { diff --git a/cpp/src/stream_compaction/distinct.cu b/cpp/src/stream_compaction/distinct.cu index b867df1565a..e73bab1345e 100644 --- a/cpp/src/stream_compaction/distinct.cu +++ b/cpp/src/stream_compaction/distinct.cu @@ -1,5 +1,5 @@ /* - * Copyright (c) 2019-2023, NVIDIA CORPORATION. + * Copyright (c) 2019-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -54,7 +54,7 @@ rmm::device_uvector distinct_indices(table_view const& input, auto map = hash_map_type{compute_hash_table_size(input.num_rows()), cuco::empty_key{-1}, cuco::empty_value{std::numeric_limits::min()}, - detail::hash_table_allocator_type{default_allocator{}, stream}, + cudf::detail::cuco_allocator{stream}, stream.value()}; auto const preprocessed_input = diff --git a/cpp/src/stream_compaction/distinct_count.cu b/cpp/src/stream_compaction/distinct_count.cu index ac4811ad279..507bad777eb 100644 --- a/cpp/src/stream_compaction/distinct_count.cu +++ b/cpp/src/stream_compaction/distinct_count.cu @@ -1,5 +1,5 @@ /* - * Copyright (c) 2019-2023, NVIDIA CORPORATION. + * Copyright (c) 2019-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -141,13 +141,13 @@ cudf::size_type distinct_count(table_view const& keys, auto const comparator_helper = [&](auto const row_equal) { using hasher_type = decltype(hash_key); - auto key_set = cuco::experimental::static_set{ - cuco::experimental::extent{compute_hash_table_size(num_rows)}, - cuco::empty_key{-1}, - row_equal, - cuco::experimental::linear_probing<1, hasher_type>{hash_key}, - detail::hash_table_allocator_type{default_allocator{}, stream}, - stream.value()}; + auto key_set = + cuco::experimental::static_set{cuco::experimental::extent{compute_hash_table_size(num_rows)}, + cuco::empty_key{-1}, + row_equal, + cuco::experimental::linear_probing<1, hasher_type>{hash_key}, + cudf::detail::cuco_allocator{stream}, + stream.value()}; auto const iter = thrust::counting_iterator(0); // when nulls are equal, we skip hashing any row that has a null diff --git a/cpp/src/stream_compaction/stream_compaction_common.hpp b/cpp/src/stream_compaction/stream_compaction_common.hpp index 18c531e3e69..ceb62d1d059 100644 --- a/cpp/src/stream_compaction/stream_compaction_common.hpp +++ b/cpp/src/stream_compaction/stream_compaction_common.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2022-2023, NVIDIA CORPORATION. + * Copyright (c) 2022-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -15,13 +15,11 @@ */ #pragma once -#include +#include #include #include #include -#include - #include #include @@ -29,10 +27,8 @@ namespace cudf { namespace detail { -using hash_table_allocator_type = rmm::mr::stream_allocator_adaptor>; - using hash_map_type = - cuco::static_map; + cuco::static_map; } // namespace detail } // namespace cudf diff --git a/cpp/src/text/bpe/byte_pair_encoding.cuh b/cpp/src/text/bpe/byte_pair_encoding.cuh index 2a170317909..1a3f8eadea0 100644 --- a/cpp/src/text/bpe/byte_pair_encoding.cuh +++ b/cpp/src/text/bpe/byte_pair_encoding.cuh @@ -1,5 +1,5 @@ /* - * Copyright (c) 2022-2023, NVIDIA CORPORATION. + * Copyright (c) 2022-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -20,14 +20,13 @@ #include #include -#include +#include #include #include #include #include #include -#include #include @@ -46,8 +45,6 @@ using string_hasher_type = cudf::hashing::detail::MurmurHash3_x86_32; -using hash_table_allocator_type = rmm::mr::stream_allocator_adaptor>; - /** * @brief Hasher function used for building and using the cuco static-map * @@ -109,7 +106,7 @@ using merge_pairs_map_type = cuco::experimental::static_map; + cudf::detail::cuco_allocator>; /** * @brief Hasher function used for building and using the cuco static-map @@ -166,7 +163,7 @@ using mp_table_map_type = cuco::experimental::static_map; + cudf::detail::cuco_allocator>; } // namespace detail diff --git a/cpp/src/text/bpe/load_merge_pairs.cu b/cpp/src/text/bpe/load_merge_pairs.cu index c07d929e98a..3b630886b3e 100644 --- a/cpp/src/text/bpe/load_merge_pairs.cu +++ b/cpp/src/text/bpe/load_merge_pairs.cu @@ -1,5 +1,5 @@ /* - * Copyright (c) 2022-2023, NVIDIA CORPORATION. + * Copyright (c) 2022-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -42,14 +42,14 @@ namespace { std::unique_ptr initialize_merge_pairs_map( cudf::column_device_view const& input, rmm::cuda_stream_view stream) { - auto merge_pairs_map = std::make_unique( - static_cast(input.size()), - cuco::empty_key{-1}, - cuco::empty_value{-1}, - bpe_equal{input}, - bpe_probe_scheme{bpe_hasher{input}}, - hash_table_allocator_type{default_allocator{}, stream}, - stream.value()); + auto merge_pairs_map = + std::make_unique(static_cast(input.size()), + cuco::empty_key{-1}, + cuco::empty_value{-1}, + bpe_equal{input}, + bpe_probe_scheme{bpe_hasher{input}}, + cudf::detail::cuco_allocator{stream}, + stream.value()); auto iter = cudf::detail::make_counting_transform_iterator( 0, @@ -64,14 +64,13 @@ std::unique_ptr initialize_merge_pairs_map( std::unique_ptr initialize_mp_table_map( cudf::column_device_view const& input, rmm::cuda_stream_view stream) { - auto mp_table_map = std::make_unique( - static_cast(input.size()), - cuco::empty_key{-1}, - cuco::empty_value{-1}, - mp_equal{input}, - mp_probe_scheme{mp_hasher{input}}, - hash_table_allocator_type{default_allocator{}, stream}, - stream.value()); + auto mp_table_map = std::make_unique(static_cast(input.size()), + cuco::empty_key{-1}, + cuco::empty_value{-1}, + mp_equal{input}, + mp_probe_scheme{mp_hasher{input}}, + cudf::detail::cuco_allocator{stream}, + stream.value()); auto iter = cudf::detail::make_counting_transform_iterator( 0, diff --git a/cpp/src/text/vocabulary_tokenize.cu b/cpp/src/text/vocabulary_tokenize.cu index a9e8d4d9a24..80f275dba7d 100644 --- a/cpp/src/text/vocabulary_tokenize.cu +++ b/cpp/src/text/vocabulary_tokenize.cu @@ -21,13 +21,13 @@ #include #include #include +#include #include #include #include #include #include #include -#include #include #include #include @@ -35,7 +35,6 @@ #include #include -#include #include @@ -93,15 +92,14 @@ struct vocab_equal { } }; -using hash_table_allocator_type = rmm::mr::stream_allocator_adaptor>; -using probe_scheme = cuco::experimental::linear_probing<1, vocab_hasher>; -using vocabulary_map_type = cuco::experimental::static_map; +using vocabulary_map_type = cuco::experimental::static_map, cuda::thread_scope_device, vocab_equal, probe_scheme, - hash_table_allocator_type>; + cudf::detail::cuco_allocator>; } // namespace } // namespace detail @@ -150,7 +148,7 @@ tokenize_vocabulary::tokenize_vocabulary(cudf::strings_column_view const& input, cuco::empty_value{-1}, detail::vocab_equal{*d_vocabulary}, detail::probe_scheme{detail::vocab_hasher{*d_vocabulary}}, - detail::hash_table_allocator_type{default_allocator{}, stream}, + cudf::detail::cuco_allocator{stream}, stream.value()); // the row index is the token id (value for each key in the map) From dde07ad50e0bc44d952fbdd2bcc3a2fa292bb2f4 Mon Sep 17 00:00:00 2001 From: Yunsong Wang Date: Thu, 25 Jan 2024 14:25:28 -0800 Subject: [PATCH 2/6] Add cuco_allocator class --- cpp/include/cudf/detail/cuco_helpers.hpp | 33 ++++++++++++++++++++++++ 1 file changed, 33 insertions(+) create mode 100644 cpp/include/cudf/detail/cuco_helpers.hpp diff --git a/cpp/include/cudf/detail/cuco_helpers.hpp b/cpp/include/cudf/detail/cuco_helpers.hpp new file mode 100644 index 00000000000..380704d4c88 --- /dev/null +++ b/cpp/include/cudf/detail/cuco_helpers.hpp @@ -0,0 +1,33 @@ +/* + * Copyright (c) 2024, NVIDIA CORPORATION. + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +#pragma once + +#include +#include + +namespace cudf::detail { + +class cuco_allocator + : public rmm::mr::stream_allocator_adaptor> { + using default_allocator = rmm::mr::polymorphic_allocator; + using base_type = rmm::mr::stream_allocator_adaptor; + + public: + cuco_allocator(rmm::cuda_stream_view stream) : base_type{default_allocator{}, stream} {} +}; + +} // namespace cudf::detail From 8ddcd4b956ec1f3f169b58ee2236e991756f5967 Mon Sep 17 00:00:00 2001 From: Yunsong Wang Date: Fri, 26 Jan 2024 12:43:46 -0800 Subject: [PATCH 3/6] Update docs --- cpp/include/cudf/detail/cuco_helpers.hpp | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/cpp/include/cudf/detail/cuco_helpers.hpp b/cpp/include/cudf/detail/cuco_helpers.hpp index 380704d4c88..14ea2a7901b 100644 --- a/cpp/include/cudf/detail/cuco_helpers.hpp +++ b/cpp/include/cudf/detail/cuco_helpers.hpp @@ -21,6 +21,13 @@ namespace cudf::detail { +/** + * @brief Stream-ordered allocator adaptor used for cuco data structures + * + * The stream-ordered `rmm::mr::polymorphic_allocator` cannot be used in `cuco` directly since the + * later expects a standard C++ `Allocator` interface. This allocator helper provides a simple way + * to handle cuco memory allocation/deallocation with the default rmm memory resource. + */ class cuco_allocator : public rmm::mr::stream_allocator_adaptor> { using default_allocator = rmm::mr::polymorphic_allocator; From 58281f6e59e38a5d28675ea329e81f37d1af8cbb Mon Sep 17 00:00:00 2001 From: Yunsong Wang Date: Fri, 26 Jan 2024 12:47:29 -0800 Subject: [PATCH 4/6] More docs --- cpp/include/cudf/detail/cuco_helpers.hpp | 9 +++++++-- 1 file changed, 7 insertions(+), 2 deletions(-) diff --git a/cpp/include/cudf/detail/cuco_helpers.hpp b/cpp/include/cudf/detail/cuco_helpers.hpp index 14ea2a7901b..492bbc2d27d 100644 --- a/cpp/include/cudf/detail/cuco_helpers.hpp +++ b/cpp/include/cudf/detail/cuco_helpers.hpp @@ -30,10 +30,15 @@ namespace cudf::detail { */ class cuco_allocator : public rmm::mr::stream_allocator_adaptor> { - using default_allocator = rmm::mr::polymorphic_allocator; - using base_type = rmm::mr::stream_allocator_adaptor; + using default_allocator = + rmm::mr::polymorphic_allocator; ///< Default stream-ordered allocator type + using base_type = + rmm::mr::stream_allocator_adaptor; ///< The base allocator adaptor type public: + /** + * @brief Constructs the adaptor with the given `stream` + */ cuco_allocator(rmm::cuda_stream_view stream) : base_type{default_allocator{}, stream} {} }; From 1fc6468708a9f74e88739e5e946d4eeaa21362a7 Mon Sep 17 00:00:00 2001 From: Yunsong Wang Date: Fri, 26 Jan 2024 12:48:39 -0800 Subject: [PATCH 5/6] Styling --- cpp/include/cudf/detail/cuco_helpers.hpp | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/cpp/include/cudf/detail/cuco_helpers.hpp b/cpp/include/cudf/detail/cuco_helpers.hpp index 492bbc2d27d..1c2e8b3e85c 100644 --- a/cpp/include/cudf/detail/cuco_helpers.hpp +++ b/cpp/include/cudf/detail/cuco_helpers.hpp @@ -30,10 +30,10 @@ namespace cudf::detail { */ class cuco_allocator : public rmm::mr::stream_allocator_adaptor> { - using default_allocator = - rmm::mr::polymorphic_allocator; ///< Default stream-ordered allocator type - using base_type = - rmm::mr::stream_allocator_adaptor; ///< The base allocator adaptor type + /// Default stream-ordered allocator type + using default_allocator = rmm::mr::polymorphic_allocator; + /// The base allocator adaptor type + using base_type = rmm::mr::stream_allocator_adaptor; public: /** From d7370032149c3d210ca3fd99c2db8ff699c5c763 Mon Sep 17 00:00:00 2001 From: Yunsong Wang Date: Fri, 26 Jan 2024 12:51:48 -0800 Subject: [PATCH 6/6] More doc cleanups --- cpp/include/cudf/detail/cuco_helpers.hpp | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/cpp/include/cudf/detail/cuco_helpers.hpp b/cpp/include/cudf/detail/cuco_helpers.hpp index 1c2e8b3e85c..5f3c31479de 100644 --- a/cpp/include/cudf/detail/cuco_helpers.hpp +++ b/cpp/include/cudf/detail/cuco_helpers.hpp @@ -26,7 +26,8 @@ namespace cudf::detail { * * The stream-ordered `rmm::mr::polymorphic_allocator` cannot be used in `cuco` directly since the * later expects a standard C++ `Allocator` interface. This allocator helper provides a simple way - * to handle cuco memory allocation/deallocation with the default rmm memory resource. + * to handle cuco memory allocation/deallocation with the given `stream` and the rmm default memory + * resource. */ class cuco_allocator : public rmm::mr::stream_allocator_adaptor> { @@ -37,7 +38,7 @@ class cuco_allocator public: /** - * @brief Constructs the adaptor with the given `stream` + * @brief Constructs the allocator adaptor with the given `stream` */ cuco_allocator(rmm::cuda_stream_view stream) : base_type{default_allocator{}, stream} {} };