From e0a00c1fcb4b72b7abd29debe5b2f6b38081d39a Mon Sep 17 00:00:00 2001 From: Jayjeet Chakraborty Date: Mon, 22 Jul 2024 12:03:24 -0700 Subject: [PATCH] Add `stream` param to list explode APIs (#16317) Add `stream` param to list `explode*` APIs. Partially fixes https://github.com/rapidsai/cudf/issues/13744 Authors: - Jayjeet Chakraborty (https://github.com/JayjeetAtGithub) Approvers: - Vyas Ramasubramani (https://github.com/vyasr) URL: https://github.com/rapidsai/cudf/pull/16317 --- cpp/include/cudf/lists/explode.hpp | 8 ++++ cpp/include/cudf/lists/set_operations.hpp | 2 +- cpp/src/lists/explode.cu | 29 +++++++----- cpp/tests/streams/lists_test.cpp | 57 ++++++++++++++++++++++- 4 files changed, 82 insertions(+), 14 deletions(-) diff --git a/cpp/include/cudf/lists/explode.hpp b/cpp/include/cudf/lists/explode.hpp index 81d82dcfa09..303f182ce8c 100644 --- a/cpp/include/cudf/lists/explode.hpp +++ b/cpp/include/cudf/lists/explode.hpp @@ -66,6 +66,7 @@ namespace cudf { * * @param input_table Table to explode. * @param explode_column_idx Column index to explode inside the table. + * @param stream CUDA stream used for device memory operations and kernel launches. * @param mr Device memory resource used to allocate the returned column's device memory. * * @return A new table with explode_col exploded. @@ -73,6 +74,7 @@ namespace cudf { std::unique_ptr explode( table_view const& input_table, size_type explode_column_idx, + rmm::cuda_stream_view stream = cudf::get_default_stream(), rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource()); /** @@ -109,6 +111,7 @@ std::unique_ptr
explode( * * @param input_table Table to explode. * @param explode_column_idx Column index to explode inside the table. + * @param stream CUDA stream used for device memory operations and kernel launches. * @param mr Device memory resource used to allocate the returned column's device memory. * * @return A new table with exploded value and position. The column order of return table is @@ -117,6 +120,7 @@ std::unique_ptr
explode( std::unique_ptr
explode_position( table_view const& input_table, size_type explode_column_idx, + rmm::cuda_stream_view stream = cudf::get_default_stream(), rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource()); /** @@ -152,6 +156,7 @@ std::unique_ptr
explode_position( * * @param input_table Table to explode. * @param explode_column_idx Column index to explode inside the table. + * @param stream CUDA stream used for device memory operations and kernel launches. * @param mr Device memory resource used to allocate the returned column's device memory. * * @return A new table with explode_col exploded. @@ -159,6 +164,7 @@ std::unique_ptr
explode_position( std::unique_ptr
explode_outer( table_view const& input_table, size_type explode_column_idx, + rmm::cuda_stream_view stream = cudf::get_default_stream(), rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource()); /** @@ -196,6 +202,7 @@ std::unique_ptr
explode_outer( * * @param input_table Table to explode. * @param explode_column_idx Column index to explode inside the table. + * @param stream CUDA stream used for device memory operations and kernel launches. * @param mr Device memory resource used to allocate the returned column's device memory. * * @return A new table with explode_col exploded. @@ -203,6 +210,7 @@ std::unique_ptr
explode_outer( std::unique_ptr
explode_outer_position( table_view const& input_table, size_type explode_column_idx, + rmm::cuda_stream_view stream = cudf::get_default_stream(), rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource()); /** @} */ // end of group diff --git a/cpp/include/cudf/lists/set_operations.hpp b/cpp/include/cudf/lists/set_operations.hpp index b8abfd62461..871e66b2d83 100644 --- a/cpp/include/cudf/lists/set_operations.hpp +++ b/cpp/include/cudf/lists/set_operations.hpp @@ -53,8 +53,8 @@ namespace cudf::lists { * @param nulls_equal Flag to specify whether null elements should be considered as equal, default * to be `UNEQUAL` which means only non-null elements are checked for overlapping * @param nans_equal Flag to specify whether floating-point NaNs should be considered as equal - * @param mr Device memory resource used to allocate the returned object * @param stream CUDA stream used for device memory operations and kernel launches + * @param mr Device memory resource used to allocate the returned object * @return A column of type BOOL containing the check results */ std::unique_ptr have_overlap( diff --git a/cpp/src/lists/explode.cu b/cpp/src/lists/explode.cu index 370d7480578..46c4fc78a6f 100644 --- a/cpp/src/lists/explode.cu +++ b/cpp/src/lists/explode.cu @@ -229,8 +229,8 @@ std::unique_ptr
explode_outer(table_view const& input_table, if (null_or_empty_count == 0) { // performance penalty to run the below loop if there are no nulls or empty lists. // run simple explode instead - return include_position ? explode_position(input_table, explode_column_idx, stream, mr) - : explode(input_table, explode_column_idx, stream, mr); + return include_position ? detail::explode_position(input_table, explode_column_idx, stream, mr) + : detail::explode(input_table, explode_column_idx, stream, mr); } auto gather_map_size = sliced_child.size() + null_or_empty_count; @@ -300,58 +300,63 @@ std::unique_ptr
explode_outer(table_view const& input_table, } // namespace detail /** - * @copydoc cudf::explode(table_view const&, size_type, rmm::device_async_resource_ref) + * @copydoc cudf::explode(table_view const&, size_type, rmm::cuda_stream_view, + * rmm::device_async_resource_ref) */ std::unique_ptr
explode(table_view const& input_table, size_type explode_column_idx, + rmm::cuda_stream_view stream, rmm::device_async_resource_ref mr) { CUDF_FUNC_RANGE(); CUDF_EXPECTS(input_table.column(explode_column_idx).type().id() == type_id::LIST, "Unsupported non-list column"); - return detail::explode(input_table, explode_column_idx, cudf::get_default_stream(), mr); + return detail::explode(input_table, explode_column_idx, stream, mr); } /** - * @copydoc cudf::explode_position(table_view const&, size_type, rmm::device_async_resource_ref) + * @copydoc cudf::explode_position(table_view const&, size_type, rmm::cuda_stream_view, + * rmm::device_async_resource_ref) */ std::unique_ptr
explode_position(table_view const& input_table, size_type explode_column_idx, + rmm::cuda_stream_view stream, rmm::device_async_resource_ref mr) { CUDF_FUNC_RANGE(); CUDF_EXPECTS(input_table.column(explode_column_idx).type().id() == type_id::LIST, "Unsupported non-list column"); - return detail::explode_position(input_table, explode_column_idx, cudf::get_default_stream(), mr); + return detail::explode_position(input_table, explode_column_idx, stream, mr); } /** - * @copydoc cudf::explode_outer(table_view const&, size_type, rmm::device_async_resource_ref) + * @copydoc cudf::explode_outer(table_view const&, size_type, rmm::cuda_stream_view, + * rmm::device_async_resource_ref) */ std::unique_ptr
explode_outer(table_view const& input_table, size_type explode_column_idx, + rmm::cuda_stream_view stream, rmm::device_async_resource_ref mr) { CUDF_FUNC_RANGE(); CUDF_EXPECTS(input_table.column(explode_column_idx).type().id() == type_id::LIST, "Unsupported non-list column"); - return detail::explode_outer( - input_table, explode_column_idx, false, cudf::get_default_stream(), mr); + return detail::explode_outer(input_table, explode_column_idx, false, stream, mr); } /** * @copydoc cudf::explode_outer_position(table_view const&, size_type, - * rmm::device_async_resource_ref) + * rmm::cuda_stream_view, rmm::device_async_resource_ref) */ std::unique_ptr
explode_outer_position(table_view const& input_table, size_type explode_column_idx, + rmm::cuda_stream_view stream, rmm::device_async_resource_ref mr) { CUDF_FUNC_RANGE(); CUDF_EXPECTS(input_table.column(explode_column_idx).type().id() == type_id::LIST, "Unsupported non-list column"); - return detail::explode_outer( - input_table, explode_column_idx, true, cudf::get_default_stream(), mr); + return detail::explode_outer(input_table, explode_column_idx, true, stream, mr); } } // namespace cudf diff --git a/cpp/tests/streams/lists_test.cpp b/cpp/tests/streams/lists_test.cpp index 711e20e4b17..7963dced292 100644 --- a/cpp/tests/streams/lists_test.cpp +++ b/cpp/tests/streams/lists_test.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2023-2024, NVIDIA CORPORATION. + * Copyright (c) 2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -21,6 +21,7 @@ #include #include #include +#include #include #include #include @@ -212,3 +213,57 @@ TEST_F(ListTest, HaveOverlap) cudf::nan_equality::ALL_EQUAL, cudf::test::get_default_stream()); } + +TEST_F(ListTest, Explode) +{ + cudf::test::fixed_width_column_wrapper list_col_a{100, 200, 300}; + cudf::test::lists_column_wrapper list_col_b{ + cudf::test::lists_column_wrapper{1, 2, 7}, + cudf::test::lists_column_wrapper{5, 6}, + cudf::test::lists_column_wrapper{0, 3}}; + cudf::test::strings_column_wrapper list_col_c{"string0", "string1", "string2"}; + cudf::table_view lists_table({list_col_a, list_col_b, list_col_c}); + cudf::explode(lists_table, 1, cudf::test::get_default_stream()); +} + +TEST_F(ListTest, ExplodePosition) +{ + cudf::test::fixed_width_column_wrapper list_col_a{100, 200, 300}; + cudf::test::lists_column_wrapper list_col_b{ + cudf::test::lists_column_wrapper{1, 2, 7}, + cudf::test::lists_column_wrapper{5, 6}, + cudf::test::lists_column_wrapper{0, 3}}; + cudf::test::strings_column_wrapper list_col_c{"string0", "string1", "string2"}; + cudf::table_view lists_table({list_col_a, list_col_b, list_col_c}); + cudf::explode_position(lists_table, 1, cudf::test::get_default_stream()); +} + +TEST_F(ListTest, ExplodeOuter) +{ + constexpr auto null = 0; + auto valids = + cudf::detail::make_counting_transform_iterator(0, [](auto i) { return i % 2 == 0; }); + cudf::test::lists_column_wrapper list_col_a{ + cudf::test::lists_column_wrapper({1, null, 7}, valids), + cudf::test::lists_column_wrapper({5, null, 0, null}, valids), + cudf::test::lists_column_wrapper{}, + cudf::test::lists_column_wrapper({0, null, 8}, valids)}; + cudf::test::fixed_width_column_wrapper list_col_b{100, 200, 300, 400}; + cudf::table_view lists_table({list_col_a, list_col_b}); + cudf::explode_outer(lists_table, 0, cudf::test::get_default_stream()); +} + +TEST_F(ListTest, ExplodeOuterPosition) +{ + constexpr auto null = 0; + auto valids = + cudf::detail::make_counting_transform_iterator(0, [](auto i) { return i % 2 == 0; }); + cudf::test::lists_column_wrapper list_col_a{ + cudf::test::lists_column_wrapper({1, null, 7}, valids), + cudf::test::lists_column_wrapper({5, null, 0, null}, valids), + cudf::test::lists_column_wrapper{}, + cudf::test::lists_column_wrapper({0, null, 8}, valids)}; + cudf::test::fixed_width_column_wrapper list_col_b{100, 200, 300, 400}; + cudf::table_view lists_table({list_col_a, list_col_b}); + cudf::explode_outer_position(lists_table, 0, cudf::test::get_default_stream()); +}