From cd40a9e9c9a3ca7a7eaf845fef22c9ca91f16b0a Mon Sep 17 00:00:00 2001 From: Nghia Truong Date: Tue, 8 Feb 2022 11:16:56 -0700 Subject: [PATCH 1/3] Cast source type to target type before computation --- .../sort/group_single_pass_reduction_util.cuh | 37 +++++++++++++------ 1 file changed, 26 insertions(+), 11 deletions(-) diff --git a/cpp/src/groupby/sort/group_single_pass_reduction_util.cuh b/cpp/src/groupby/sort/group_single_pass_reduction_util.cuh index dde4e00eb4a..92b13353477 100644 --- a/cpp/src/groupby/sort/group_single_pass_reduction_util.cuh +++ b/cpp/src/groupby/sort/group_single_pass_reduction_util.cuh @@ -74,12 +74,16 @@ struct element_arg_minmax_fn { /** * @brief Value accessor for column which supports dictionary column too. * + * This is similar to `value_accessor` in `column_device_view.cuh` but with support of dictionary + * type. + * * @tparam T Type of the underlying column. For dictionary column, type of the key column. */ template struct value_accessor { column_device_view const col; bool const is_dict; + value_accessor(column_device_view const& col) : col(col), is_dict(cudf::is_dictionary(col.type())) { } @@ -93,6 +97,7 @@ struct value_accessor { return col.element(i); } } + __device__ auto operator()(size_type i) const { return value(i); } }; @@ -100,20 +105,28 @@ struct value_accessor { * @brief Null replaced value accessor for column which supports dictionary column too. * For null value, returns null `init` value * - * @tparam T Type of the underlying column. For dictionary column, type of the key column. + * @tparam SourceType Type of the underlying column. For dictionary column, type of the key column. + * @tparam TargetType Type that is used for computation. */ -template -struct null_replaced_value_accessor : value_accessor { - using super_t = value_accessor; +template +struct null_replaced_value_accessor : value_accessor { + using super_t = value_accessor; + + TargetType const init; bool const has_nulls; - T const init; - null_replaced_value_accessor(column_device_view const& col, T const& init, bool const has_nulls) + + null_replaced_value_accessor(column_device_view const& col, + TargetType const& init, + bool const has_nulls) : super_t(col), init(init), has_nulls(has_nulls) { } - __device__ T operator()(size_type i) const + + __device__ TargetType operator()(size_type i) const { - return has_nulls && super_t::col.is_null_nocheck(i) ? init : super_t::value(i); + return has_nulls && super_t::col.is_null_nocheck(i) + ? init + : static_cast(super_t::value(i)); } }; @@ -168,7 +181,7 @@ struct group_reduction_functor; + using SourceDType = device_storage_type_t; using ResultType = cudf::detail::target_type_t; using ResultDType = device_storage_type_t; @@ -203,9 +216,11 @@ struct group_reduction_functor; - auto init = OpType::template identity(); + auto init = OpType::template identity(); auto inp_values = cudf::detail::make_counting_transform_iterator( - 0, null_replaced_value_accessor{*d_values_ptr, init, values.has_nulls()}); + 0, + null_replaced_value_accessor{ + *d_values_ptr, init, values.has_nulls()}); do_reduction(inp_values, result_begin, OpType{}); } From ddf306c49981625185dd7153fe28b94955e34509 Mon Sep 17 00:00:00 2001 From: Nghia Truong Date: Tue, 8 Feb 2022 11:17:27 -0700 Subject: [PATCH 2/3] Add a unit test --- cpp/tests/groupby/sum_tests.cpp | 21 +++++++++++++++++++++ 1 file changed, 21 insertions(+) diff --git a/cpp/tests/groupby/sum_tests.cpp b/cpp/tests/groupby/sum_tests.cpp index 5947e309bec..ca3d7fa655c 100644 --- a/cpp/tests/groupby/sum_tests.cpp +++ b/cpp/tests/groupby/sum_tests.cpp @@ -156,6 +156,27 @@ TYPED_TEST(groupby_sum_test, dictionary) force_use_sort_impl::YES); } +struct overflow_test : public cudf::test::BaseFixture { +}; +TEST_F(overflow_test, overflow_integer) +{ + using int32_col = fixed_width_column_wrapper; + using int64_col = fixed_width_column_wrapper; + + auto const keys = int32_col{0, 0}; + auto const vals = int32_col{-2147483648, -2147483648}; + auto const expect_keys = int32_col{0}; + auto const expect_vals = int64_col{-4294967296L}; + + auto test_sum = [&](auto const use_sort) { + auto agg = make_sum_aggregation(); + test_single_agg(keys, vals, expect_keys, expect_vals, std::move(agg), use_sort); + }; + + test_sum(force_use_sort_impl::NO); + test_sum(force_use_sort_impl::YES); +} + template struct FixedPointTestAllReps : public cudf::test::BaseFixture { }; From e76c13ccf4d91964dea4b95fd94717022f0406eb Mon Sep 17 00:00:00 2001 From: Nghia Truong Date: Tue, 8 Feb 2022 11:28:13 -0700 Subject: [PATCH 3/3] Update copyright year --- cpp/src/groupby/sort/group_single_pass_reduction_util.cuh | 2 +- cpp/tests/groupby/sum_tests.cpp | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/cpp/src/groupby/sort/group_single_pass_reduction_util.cuh b/cpp/src/groupby/sort/group_single_pass_reduction_util.cuh index 92b13353477..8e1463f7964 100644 --- a/cpp/src/groupby/sort/group_single_pass_reduction_util.cuh +++ b/cpp/src/groupby/sort/group_single_pass_reduction_util.cuh @@ -1,5 +1,5 @@ /* - * Copyright (c) 2019-2021, NVIDIA CORPORATION. + * Copyright (c) 2019-2022, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. diff --git a/cpp/tests/groupby/sum_tests.cpp b/cpp/tests/groupby/sum_tests.cpp index ca3d7fa655c..be7da4a784c 100644 --- a/cpp/tests/groupby/sum_tests.cpp +++ b/cpp/tests/groupby/sum_tests.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2019-2021, NVIDIA CORPORATION. + * Copyright (c) 2019-2022, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License.