From f655602ecd8f254dfcee5eb0c790bd3336e83d7c Mon Sep 17 00:00:00 2001 From: Vyas Ramasubramani Date: Tue, 11 Jun 2024 15:59:20 -0700 Subject: [PATCH 1/9] Fix Cython typo preventing proper inheritance (#15978) #15831 added new inheritance patterns to the Parquet options classes, but mirroring them perfectly in Cython proved problematic due to what appeared to be issues with Cython parsing of CRTP and inheritance. A deeper investigation revealed that the underlying issue was https://github.com/cython/cython/issues/6238. This PR applies the appropriate fix. Authors: - Vyas Ramasubramani (https://github.com/vyasr) Approvers: - Thomas Li (https://github.com/lithomas1) - Bradley Dice (https://github.com/bdice) URL: https://github.com/rapidsai/cudf/pull/15978 --- .../_lib/pylibcudf/libcudf/io/parquet.pxd | 24 ++++++------------- 1 file changed, 7 insertions(+), 17 deletions(-) diff --git a/python/cudf/cudf/_lib/pylibcudf/libcudf/io/parquet.pxd b/python/cudf/cudf/_lib/pylibcudf/libcudf/io/parquet.pxd index 36654457995..0ef6553db56 100644 --- a/python/cudf/cudf/_lib/pylibcudf/libcudf/io/parquet.pxd +++ b/python/cudf/cudf/_lib/pylibcudf/libcudf/io/parquet.pxd @@ -123,7 +123,7 @@ cdef extern from "cudf/io/parquet.hpp" namespace "cudf::io" nogil: ) except + cdef cppclass parquet_writer_options_builder_base[BuilderT, OptionsT]: - parquet_writer_options_builder() except + + parquet_writer_options_builder_base() except + BuilderT& metadata( cudf_io_types.table_input_metadata m @@ -164,22 +164,6 @@ cdef extern from "cudf/io/parquet.hpp" namespace "cudf::io" nogil: BuilderT& dictionary_policy( cudf_io_types.dictionary_policy val ) except + - # FIXME: the following two functions actually belong in - # parquet_writer_options_builder, but placing them there yields a - # "'parquet_writer_options_builder' is not a type identifier" error. - # This is probably a bug in cython since a simpler CRTP example that - # has methods returning references to a child class seem to work. - # Calling these from the chunked options builder will fail at compile - # time, so this should be safe. - # NOTE: these two are never actually called from libcudf. Instead these - # properties are set in the options after calling build(), so perhaps - # they can be removed. - BuilderT& partitions( - vector[cudf_io_types.partition_info] partitions - ) except + - BuilderT& column_chunks_file_paths( - vector[string] column_chunks_file_paths - ) except + OptionsT build() except + cdef cppclass parquet_writer_options_builder( @@ -190,6 +174,12 @@ cdef extern from "cudf/io/parquet.hpp" namespace "cudf::io" nogil: cudf_io_types.sink_info sink_, cudf_table_view.table_view table_ ) except + + parquet_writer_options_builder& partitions( + vector[cudf_io_types.partition_info] partitions + ) except + + parquet_writer_options_builder& column_chunks_file_paths( + vector[string] column_chunks_file_paths + ) except + cdef unique_ptr[vector[uint8_t]] write_parquet( parquet_writer_options args From 49e2a565ffb85479589406f622c74116d7f891c7 Mon Sep 17 00:00:00 2001 From: David Wendt <45795991+davidwendt@users.noreply.github.com> Date: Tue, 11 Jun 2024 20:27:54 -0400 Subject: [PATCH 2/9] Support large strings in cudf::io::text::multibyte_split (#15947) Replaces int32 type used for building offsets in `cudf::io::text::multibyte_split()` to use the offsetalator instead. This allows creating large strings columns from input text files. 
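As a minimal usage sketch of the affected entry point (the `read_lines` helper and the
file path are hypothetical; only the existing `make_source_from_file` and
`multibyte_split` APIs are assumed):

```cpp
#include <cudf/column/column.hpp>
#include <cudf/io/text/data_chunk_source_factories.hpp>
#include <cudf/io/text/multibyte_split.hpp>

#include <memory>
#include <string>

// Split a text file into one string per line. With the offsets now built
// through the offsetalator, the resulting strings column is no longer bound
// by int32 offsets, so inputs that produce more than 2 GiB of character data
// yield a valid (large) strings column.
std::unique_ptr<cudf::column> read_lines(std::string const& path)
{
  auto const source = cudf::io::text::make_source_from_file(path);
  return cudf::io::text::multibyte_split(*source, "\n");
}
```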
Authors: - David Wendt (https://github.com/davidwendt) Approvers: - Mark Harris (https://github.com/harrism) - Bradley Dice (https://github.com/bdice) - Karthikeyan (https://github.com/karthikeyann) URL: https://github.com/rapidsai/cudf/pull/15947 --- cpp/src/io/text/multibyte_split.cu | 38 ++++++++++++++++-------------- 1 file changed, 20 insertions(+), 18 deletions(-) diff --git a/cpp/src/io/text/multibyte_split.cu b/cpp/src/io/text/multibyte_split.cu index 976d735e010..9c406369068 100644 --- a/cpp/src/io/text/multibyte_split.cu +++ b/cpp/src/io/text/multibyte_split.cu @@ -20,6 +20,7 @@ #include #include #include +#include #include #include #include @@ -30,6 +31,7 @@ #include #include #include +#include #include #include @@ -518,32 +520,37 @@ std::unique_ptr multibyte_split(cudf::io::text::data_chunk_source bool const insert_end = not(last_row_offset.has_value() or (global_offsets.size() > 0 and global_offsets.back_element(stream) == chunk_offset)); - rmm::device_uvector offsets{ - global_offsets.size() + insert_begin + insert_end, stream, mr}; - if (insert_begin) { offsets.set_element_to_zero_async(0, stream); } - if (insert_end) { - offsets.set_element(offsets.size() - 1, chunk_offset - *first_row_offset, stream); - } + auto const chars_bytes = chunk_offset - *first_row_offset; + auto offsets = cudf::strings::detail::create_offsets_child_column( + chars_bytes, global_offsets.size() + insert_begin + insert_end, stream, mr); + auto offsets_itr = + cudf::detail::offsetalator_factory::make_output_iterator(offsets->mutable_view()); + auto set_offset_value = [offsets_itr, stream](size_type index, int64_t value) { + cudf::detail::device_single_thread( + [offsets_itr, index, value] __device__() mutable { offsets_itr[index] = value; }, stream); + }; + if (insert_begin) { set_offset_value(0, 0); } + if (insert_end) { set_offset_value(offsets->size() - 1, chars_bytes); } thrust::transform(rmm::exec_policy(stream), global_offsets.begin(), global_offsets.end(), - offsets.begin() + insert_begin, - cuda::proclaim_return_type( + offsets_itr + insert_begin, + cuda::proclaim_return_type( [baseline = *first_row_offset] __device__(byte_offset global_offset) { - return static_cast(global_offset - baseline); + return (global_offset - baseline); })); - auto string_count = offsets.size() - 1; + auto string_count = offsets->size() - 1; if (strip_delimiters) { auto it = cudf::detail::make_counting_transform_iterator( 0, cuda::proclaim_return_type>( - [ofs = offsets.data(), + [ofs = cudf::detail::offsetalator_factory::make_input_iterator(offsets->view()), chars = chars.data(), delim_size = static_cast(delimiter.size()), last_row = static_cast(string_count) - 1, insert_end] __device__(size_type row) { auto const begin = ofs[row]; - auto const len = ofs[row + 1] - begin; + auto const len = static_cast(ofs[row + 1] - begin); if (row == last_row && insert_end) { return thrust::make_pair(chars + begin, len); } else { @@ -552,12 +559,7 @@ std::unique_ptr multibyte_split(cudf::io::text::data_chunk_source })); return cudf::strings::detail::make_strings_column(it, it + string_count, stream, mr); } else { - return cudf::make_strings_column( - string_count, - std::make_unique(std::move(offsets), rmm::device_buffer{}, 0), - chars.release(), - 0, - {}); + return cudf::make_strings_column(string_count, std::move(offsets), chars.release(), 0, {}); } } From d2cd1d4411e1a16f5c989efff07643ca3411f8ab Mon Sep 17 00:00:00 2001 From: Matthew Murray <41342305+Matt711@users.noreply.github.com> 
Date: Tue, 11 Jun 2024 20:28:40 -0400 Subject: [PATCH 3/9] Migrate lists/combine to pylibcudf (#15928) Part of #15162. concatenate_rows, concatenate_list_elements Authors: - Matthew Murray (https://github.com/Matt711) Approvers: - Vyas Ramasubramani (https://github.com/vyasr) - Thomas Li (https://github.com/lithomas1) URL: https://github.com/rapidsai/cudf/pull/15928 --- python/cudf/cudf/_lib/lists.pyx | 46 ++++---------- python/cudf/cudf/_lib/pylibcudf/lists.pxd | 7 +++ python/cudf/cudf/_lib/pylibcudf/lists.pyx | 61 +++++++++++++++++++ .../cudf/cudf/pylibcudf_tests/test_lists.py | 46 ++++++++++++++ 4 files changed, 127 insertions(+), 33 deletions(-) create mode 100644 python/cudf/cudf/pylibcudf_tests/test_lists.py diff --git a/python/cudf/cudf/_lib/lists.pyx b/python/cudf/cudf/_lib/lists.pyx index 656d92c1a4b..5d406f5c85f 100644 --- a/python/cudf/cudf/_lib/lists.pyx +++ b/python/cudf/cudf/_lib/lists.pyx @@ -9,11 +9,6 @@ from libcpp.utility cimport move from cudf._lib.column cimport Column from cudf._lib.pylibcudf.libcudf.column.column cimport column from cudf._lib.pylibcudf.libcudf.column.column_view cimport column_view -from cudf._lib.pylibcudf.libcudf.lists.combine cimport ( - concatenate_list_elements as cpp_concatenate_list_elements, - concatenate_null_policy, - concatenate_rows as cpp_concatenate_rows, -) from cudf._lib.pylibcudf.libcudf.lists.contains cimport ( contains, index_of as cpp_index_of, @@ -32,7 +27,6 @@ from cudf._lib.pylibcudf.libcudf.lists.stream_compaction cimport ( distinct as cpp_distinct, ) from cudf._lib.pylibcudf.libcudf.scalar.scalar cimport scalar -from cudf._lib.pylibcudf.libcudf.table.table_view cimport table_view from cudf._lib.pylibcudf.libcudf.types cimport ( nan_equality, null_equality, @@ -41,10 +35,7 @@ from cudf._lib.pylibcudf.libcudf.types cimport ( size_type, ) from cudf._lib.scalar cimport DeviceScalar -from cudf._lib.utils cimport ( - columns_from_pylibcudf_table, - table_view_from_columns, -) +from cudf._lib.utils cimport columns_from_pylibcudf_table from cudf._lib import pylibcudf @@ -223,31 +214,20 @@ def index_of_column(Column col, Column search_keys): @acquire_spill_lock() def concatenate_rows(list source_columns): - cdef unique_ptr[column] c_result - - cdef table_view c_table_view = table_view_from_columns(source_columns) - - with nogil: - c_result = move(cpp_concatenate_rows( - c_table_view, - )) - - return Column.from_unique_ptr(move(c_result)) + return Column.from_pylibcudf( + pylibcudf.lists.concatenate_rows( + pylibcudf.Table([ + c.to_pylibcudf(mode="read") for c in source_columns + ]) + ) + ) @acquire_spill_lock() def concatenate_list_elements(Column input_column, dropna=False): - cdef concatenate_null_policy policy = ( - concatenate_null_policy.IGNORE if dropna - else concatenate_null_policy.NULLIFY_OUTPUT_ROW + return Column.from_pylibcudf( + pylibcudf.lists.concatenate_list_elements( + input_column.to_pylibcudf(mode="read"), + dropna, + ) ) - cdef column_view c_input = input_column.view() - cdef unique_ptr[column] c_result - - with nogil: - c_result = move(cpp_concatenate_list_elements( - c_input, - policy - )) - - return Column.from_unique_ptr(move(c_result)) diff --git a/python/cudf/cudf/_lib/pylibcudf/lists.pxd b/python/cudf/cudf/_lib/pylibcudf/lists.pxd index b780d299977..2d2a5b2a9ea 100644 --- a/python/cudf/cudf/_lib/pylibcudf/lists.pxd +++ b/python/cudf/cudf/_lib/pylibcudf/lists.pxd @@ -1,8 +1,15 @@ # Copyright (c) 2024, NVIDIA CORPORATION. 
+from libcpp cimport bool + from cudf._lib.pylibcudf.libcudf.types cimport size_type +from .column cimport Column from .table cimport Table cpdef Table explode_outer(Table, size_type explode_column_idx) + +cpdef Column concatenate_rows(Table) + +cpdef Column concatenate_list_elements(Column, bool dropna) diff --git a/python/cudf/cudf/_lib/pylibcudf/lists.pyx b/python/cudf/cudf/_lib/pylibcudf/lists.pyx index 654f39742b6..069c9da31c2 100644 --- a/python/cudf/cudf/_lib/pylibcudf/lists.pyx +++ b/python/cudf/cudf/_lib/pylibcudf/lists.pyx @@ -1,12 +1,20 @@ # Copyright (c) 2024, NVIDIA CORPORATION. +from libcpp cimport bool from libcpp.memory cimport unique_ptr from libcpp.utility cimport move +from cudf._lib.pylibcudf.libcudf.column.column cimport column from cudf._lib.pylibcudf.libcudf.lists cimport explode as cpp_explode +from cudf._lib.pylibcudf.libcudf.lists.combine cimport ( + concatenate_list_elements as cpp_concatenate_list_elements, + concatenate_null_policy, + concatenate_rows as cpp_concatenate_rows, +) from cudf._lib.pylibcudf.libcudf.table.table cimport table from cudf._lib.pylibcudf.libcudf.types cimport size_type +from .column cimport Column from .table cimport Table @@ -33,3 +41,56 @@ cpdef Table explode_outer(Table input, size_type explode_column_idx): c_result = move(cpp_explode.explode_outer(input.view(), explode_column_idx)) return Table.from_libcudf(move(c_result)) + + +cpdef Column concatenate_rows(Table input): + """Concatenate multiple lists columns into a single lists column row-wise. + + Parameters + ---------- + input : Table + The input table + + Returns + ------- + Table + A new Column of concatenated rows + """ + cdef unique_ptr[column] c_result + + with nogil: + c_result = move(cpp_concatenate_rows(input.view())) + + return Column.from_libcudf(move(c_result)) + + +cpdef Column concatenate_list_elements(Column input, bool dropna): + """Concatenate multiple lists on the same row into a single list. + + Parameters + ---------- + input : Column + The input column + + Returns + ------- + Column + A new Column of concatenated list elements + dropna : bool + If true, null list elements will be ignored + from concatenation. Otherwise any input null values will result in + the corresponding output row being set to null. + """ + cdef concatenate_null_policy null_policy = ( + concatenate_null_policy.IGNORE if dropna + else concatenate_null_policy.NULLIFY_OUTPUT_ROW + ) + cdef unique_ptr[column] c_result + + with nogil: + c_result = move(cpp_concatenate_list_elements( + input.view(), + null_policy, + )) + + return Column.from_libcudf(move(c_result)) diff --git a/python/cudf/cudf/pylibcudf_tests/test_lists.py b/python/cudf/cudf/pylibcudf_tests/test_lists.py new file mode 100644 index 00000000000..b21af8ea11c --- /dev/null +++ b/python/cudf/cudf/pylibcudf_tests/test_lists.py @@ -0,0 +1,46 @@ +# Copyright (c) 2024, NVIDIA CORPORATION. 
+
+import pyarrow as pa
+import pytest
+from utils import assert_column_eq
+
+from cudf._lib import pylibcudf as plc
+
+
+def test_concatenate_rows():
+    test_data = [[[0, 1], [2], [5], [6, 7]], [[8], [9], [], [13, 14, 15]]]
+
+    arrow_tbl = pa.Table.from_arrays(test_data, names=["a", "b"])
+    plc_tbl = plc.interop.from_arrow(arrow_tbl)
+
+    res = plc.lists.concatenate_rows(plc_tbl)
+
+    expect = pa.array([pair[0] + pair[1] for pair in zip(*test_data)])
+
+    assert_column_eq(expect, res)
+
+
+@pytest.mark.parametrize(
+    "test_data, dropna, expected",
+    [
+        (
+            [[[1, 2], [3, 4], [5]], [[6], None, [7, 8, 9]]],
+            False,
+            [[1, 2, 3, 4, 5], None],
+        ),
+        (
+            [[[1, 2], [3, 4], [5, None]], [[6], [None], [7, 8, 9]]],
+            True,
+            [[1, 2, 3, 4, 5, None], [6, None, 7, 8, 9]],
+        ),
+    ],
+)
+def test_concatenate_list_elements(test_data, dropna, expected):
+    arr = pa.array(test_data)
+    plc_column = plc.interop.from_arrow(arr)
+
+    res = plc.lists.concatenate_list_elements(plc_column, dropna)
+
+    expect = pa.array(expected)
+
+    assert_column_eq(expect, res)

From f7ba6ab47ac994e6a1363119c01eee5dd6304181 Mon Sep 17 00:00:00 2001
From: Vukasin Milovanovic
Date: Tue, 11 Jun 2024 17:47:19 -0700
Subject: [PATCH 4/9] Pinned vector factory that uses the global pool (#15895)

Closes https://github.com/rapidsai/cudf/issues/15612

Expanded the set of vector factories to cover pinned vectors. The functions
return `cudf::detail::host_vector`, which uses a type-erased allocator,
allowing us to utilize the runtime-configurable global pinned (previously
host) resource.
The `pinned_host_vector` type has been removed, as it can only support
non-pooled pinned allocations. Its use is now replaced with
`cudf::detail::host_vector`.
Moved the global host (now pinned) resource out of cuIO and changed its type
to `host_device_async_resource_ref`. User-specified resources are now required
to allocate device-accessible memory. The name has been changed to pinned to
reflect the new requirement.
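A minimal sketch of the intended usage (the pool size, buffer size, and `main`
wrapper are illustrative choices, not defaults introduced by this change; the
vector factories live in the internal `cudf::detail` namespace):

```cpp
#include <cudf/detail/utilities/vector_factories.hpp>
#include <cudf/utilities/default_stream.hpp>
#include <cudf/utilities/pinned_memory.hpp>

int main()
{
  auto const stream = cudf::get_default_stream();

  // Optionally size the default pinned pool before its first use;
  // 64 MiB is an arbitrary example value.
  cudf::config_default_pinned_memory_resource(
    cudf::pinned_mr_options{64u * 1024u * 1024u});

  // Pinned host buffer allocated through cudf::get_pinned_memory_resource(),
  // replacing the removed cudf::detail::pinned_host_vector.
  auto staging = cudf::detail::make_pinned_vector_async<char>(1024, stream);

  // ... fill `staging` and copy it to the device on `stream` ...
  stream.synchronize();
  return 0;
}
```

The factories draw from the resource returned by
`cudf::get_pinned_memory_resource()`, so a pooled resource configured once up
front is reused for every pinned host allocation.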
Authors: - Vukasin Milovanovic (https://github.com/vuule) Approvers: - Alessandro Bellina (https://github.com/abellina) - Yunsong Wang (https://github.com/PointKernel) - Mark Harris (https://github.com/harrism) - David Wendt (https://github.com/davidwendt) URL: https://github.com/rapidsai/cudf/pull/15895 --- cpp/CMakeLists.txt | 1 + cpp/benchmarks/fixture/nvbench_fixture.hpp | 13 +- cpp/benchmarks/io/cuio_common.cpp | 12 + cpp/benchmarks/io/cuio_common.hpp | 4 +- .../io/parquet/parquet_reader_multithread.cpp | 2 +- cpp/benchmarks/io/text/multibyte_split.cpp | 10 +- .../{rmm_host_vector.hpp => host_vector.hpp} | 18 +- .../detail/utilities/pinned_host_vector.hpp | 216 ------------------ .../detail/utilities/vector_factories.hpp | 38 ++- cpp/include/cudf/io/memory_resource.hpp | 65 ------ cpp/include/cudf/utilities/pinned_memory.hpp | 58 +++++ cpp/src/io/csv/reader_impl.cu | 1 + cpp/src/io/orc/reader_impl_chunking.cu | 1 + cpp/src/io/orc/writer_impl.cu | 5 +- cpp/src/io/parquet/reader_impl_helpers.cpp | 2 + cpp/src/io/parquet/writer_impl.cu | 3 +- cpp/src/io/text/bgzip_data_chunk_source.cu | 16 +- .../io/text/data_chunk_source_factories.cpp | 51 ++--- cpp/src/io/utilities/config_utils.cpp | 214 +---------------- cpp/src/io/utilities/hostdevice_vector.hpp | 9 +- cpp/src/utilities/pinned_memory.cpp | 216 ++++++++++++++++++ cpp/tests/CMakeLists.txt | 5 +- cpp/tests/io/json_test.cpp | 6 +- .../utilities_tests/io_utilities_tests.cpp | 45 ---- .../utilities_tests/pinned_memory_tests.cpp | 65 ++++++ .../java/ai/rapids/cudf/PinnedMemoryPool.java | 12 +- java/src/main/java/ai/rapids/cudf/Rmm.java | 2 +- java/src/main/native/src/RmmJni.cpp | 34 +-- 28 files changed, 487 insertions(+), 637 deletions(-) rename cpp/include/cudf/detail/utilities/{rmm_host_vector.hpp => host_vector.hpp} (93%) delete mode 100644 cpp/include/cudf/detail/utilities/pinned_host_vector.hpp delete mode 100644 cpp/include/cudf/io/memory_resource.hpp create mode 100644 cpp/include/cudf/utilities/pinned_memory.hpp create mode 100644 cpp/src/utilities/pinned_memory.cpp create mode 100644 cpp/tests/utilities_tests/pinned_memory_tests.cpp diff --git a/cpp/CMakeLists.txt b/cpp/CMakeLists.txt index ca85996b990..aab0a9b2d49 100644 --- a/cpp/CMakeLists.txt +++ b/cpp/CMakeLists.txt @@ -664,6 +664,7 @@ add_library( src/utilities/default_stream.cpp src/utilities/linked_column.cpp src/utilities/logger.cpp + src/utilities/pinned_memory.cpp src/utilities/stacktrace.cpp src/utilities/stream_pool.cpp src/utilities/traits.cpp diff --git a/cpp/benchmarks/fixture/nvbench_fixture.hpp b/cpp/benchmarks/fixture/nvbench_fixture.hpp index ebcbcb17e98..df1492690bb 100644 --- a/cpp/benchmarks/fixture/nvbench_fixture.hpp +++ b/cpp/benchmarks/fixture/nvbench_fixture.hpp @@ -15,8 +15,8 @@ */ #pragma once -#include #include +#include #include #include @@ -81,17 +81,18 @@ struct nvbench_base_fixture { "\nExpecting: cuda, pool, async, arena, managed, or managed_pool"); } - inline rmm::host_async_resource_ref make_cuio_host_pinned() + inline rmm::host_device_async_resource_ref make_cuio_host_pinned() { static std::shared_ptr mr = std::make_shared(); return *mr; } - inline rmm::host_async_resource_ref create_cuio_host_memory_resource(std::string const& mode) + inline rmm::host_device_async_resource_ref create_cuio_host_memory_resource( + std::string const& mode) { if (mode == "pinned") return make_cuio_host_pinned(); - if (mode == "pinned_pool") return cudf::io::get_host_memory_resource(); + if (mode == "pinned_pool") 
return cudf::get_pinned_memory_resource(); CUDF_FAIL("Unknown cuio_host_mem parameter: " + mode + "\nExpecting: pinned or pinned_pool"); } @@ -112,14 +113,14 @@ struct nvbench_base_fixture { rmm::mr::set_current_device_resource(mr.get()); std::cout << "RMM memory resource = " << rmm_mode << "\n"; - cudf::io::set_host_memory_resource(create_cuio_host_memory_resource(cuio_host_mode)); + cudf::set_pinned_memory_resource(create_cuio_host_memory_resource(cuio_host_mode)); std::cout << "CUIO host memory resource = " << cuio_host_mode << "\n"; } ~nvbench_base_fixture() { // Ensure the the pool is freed before the CUDA context is destroyed: - cudf::io::set_host_memory_resource(this->make_cuio_host_pinned()); + cudf::set_pinned_memory_resource(this->make_cuio_host_pinned()); } std::shared_ptr mr; diff --git a/cpp/benchmarks/io/cuio_common.cpp b/cpp/benchmarks/io/cuio_common.cpp index 37ced8ea703..645994f3f0d 100644 --- a/cpp/benchmarks/io/cuio_common.cpp +++ b/cpp/benchmarks/io/cuio_common.cpp @@ -19,6 +19,9 @@ #include #include +#include +#include + #include #include @@ -28,6 +31,14 @@ temp_directory const cuio_source_sink_pair::tmpdir{"cudf_gbench"}; +// Don't use cudf's pinned pool for the source data +rmm::host_async_resource_ref pinned_memory_resource() +{ + static rmm::mr::pinned_host_memory_resource mr = rmm::mr::pinned_host_memory_resource{}; + + return mr; +} + std::string random_file_in_dir(std::string const& dir_path) { // `mkstemp` modifies the template in place @@ -41,6 +52,7 @@ std::string random_file_in_dir(std::string const& dir_path) cuio_source_sink_pair::cuio_source_sink_pair(io_type type) : type{type}, + pinned_buffer({pinned_memory_resource(), cudf::get_default_stream()}), d_buffer{0, cudf::get_default_stream()}, file_name{random_file_in_dir(tmpdir.path())}, void_sink{cudf::io::data_sink::create()} diff --git a/cpp/benchmarks/io/cuio_common.hpp b/cpp/benchmarks/io/cuio_common.hpp index d4f39a5f243..64d6021cf50 100644 --- a/cpp/benchmarks/io/cuio_common.hpp +++ b/cpp/benchmarks/io/cuio_common.hpp @@ -18,7 +18,7 @@ #include -#include +#include #include #include @@ -79,7 +79,7 @@ class cuio_source_sink_pair { io_type const type; std::vector h_buffer; - cudf::detail::pinned_host_vector pinned_buffer; + cudf::detail::host_vector pinned_buffer; rmm::device_uvector d_buffer; std::string const file_name; std::unique_ptr void_sink; diff --git a/cpp/benchmarks/io/parquet/parquet_reader_multithread.cpp b/cpp/benchmarks/io/parquet/parquet_reader_multithread.cpp index a67d1932951..b4c8ed78ed8 100644 --- a/cpp/benchmarks/io/parquet/parquet_reader_multithread.cpp +++ b/cpp/benchmarks/io/parquet/parquet_reader_multithread.cpp @@ -20,9 +20,9 @@ #include #include -#include #include #include +#include #include #include diff --git a/cpp/benchmarks/io/text/multibyte_split.cpp b/cpp/benchmarks/io/text/multibyte_split.cpp index b5d855d8881..67705863d41 100644 --- a/cpp/benchmarks/io/text/multibyte_split.cpp +++ b/cpp/benchmarks/io/text/multibyte_split.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2021-2023, NVIDIA CORPORATION. + * Copyright (c) 2021-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. 
@@ -22,7 +22,6 @@ #include #include -#include #include #include #include @@ -132,9 +131,10 @@ static void bench_multibyte_split(nvbench::state& state, auto const delim_factor = static_cast(delim_percent) / 100; std::unique_ptr datasource; - auto device_input = create_random_input(file_size_approx, delim_factor, 0.05, delim); - auto host_input = std::vector{}; - auto host_pinned_input = cudf::detail::pinned_host_vector{}; + auto device_input = create_random_input(file_size_approx, delim_factor, 0.05, delim); + auto host_input = std::vector{}; + auto host_pinned_input = + cudf::detail::make_pinned_vector_async(0, cudf::get_default_stream()); if (source_type != data_chunk_source_type::device && source_type != data_chunk_source_type::host_pinned) { diff --git a/cpp/include/cudf/detail/utilities/rmm_host_vector.hpp b/cpp/include/cudf/detail/utilities/host_vector.hpp similarity index 93% rename from cpp/include/cudf/detail/utilities/rmm_host_vector.hpp rename to cpp/include/cudf/detail/utilities/host_vector.hpp index 6901a19473e..6a115177ab5 100644 --- a/cpp/include/cudf/detail/utilities/rmm_host_vector.hpp +++ b/cpp/include/cudf/detail/utilities/host_vector.hpp @@ -19,6 +19,7 @@ #include #include +#include #include #include @@ -32,8 +33,6 @@ namespace cudf::detail { /*! \p rmm_host_allocator is a CUDA-specific host memory allocator * that employs \c a `rmm::host_async_resource_ref` for allocation. * - * This implementation is ported from pinned_host_vector in cudf. - * * \see https://en.cppreference.com/w/cpp/memory/allocator */ template @@ -42,8 +41,6 @@ class rmm_host_allocator; /*! \p rmm_host_allocator is a CUDA-specific host memory allocator * that employs \c an `cudf::host_async_resource_ref` for allocation. * - * This implementation is ported from pinned_host_vector in cudf. - * * \see https://en.cppreference.com/w/cpp/memory/allocator */ template <> @@ -70,8 +67,7 @@ class rmm_host_allocator { * The \p rmm_host_allocator provides an interface for host memory allocation through the user * provided \c `rmm::host_async_resource_ref`. The \p rmm_host_allocator does not take ownership of * this reference and therefore it is the user's responsibility to ensure its lifetime for the - * duration of the lifetime of the \p rmm_host_allocator. This implementation is ported from - * pinned_host_vector in cudf. + * duration of the lifetime of the \p rmm_host_allocator. 
* * \see https://en.cppreference.com/w/cpp/memory/allocator */ @@ -121,8 +117,12 @@ class rmm_host_allocator { inline pointer allocate(size_type cnt) { if (cnt > this->max_size()) { throw std::bad_alloc(); } // end if - return static_cast( - mr.allocate_async(cnt * sizeof(value_type), rmm::RMM_DEFAULT_HOST_ALIGNMENT, stream)); + auto const result = + mr.allocate_async(cnt * sizeof(value_type), rmm::RMM_DEFAULT_HOST_ALIGNMENT, stream); + // Synchronize to ensure the memory is allocated before thrust::host_vector initialization + // TODO: replace thrust::host_vector with a type that does not require synchronization + stream.synchronize(); + return static_cast(result); } /** @@ -182,6 +182,6 @@ class rmm_host_allocator { * @brief A vector class with rmm host memory allocator */ template -using rmm_host_vector = thrust::host_vector>; +using host_vector = thrust::host_vector>; } // namespace cudf::detail diff --git a/cpp/include/cudf/detail/utilities/pinned_host_vector.hpp b/cpp/include/cudf/detail/utilities/pinned_host_vector.hpp deleted file mode 100644 index c22b6a6ba15..00000000000 --- a/cpp/include/cudf/detail/utilities/pinned_host_vector.hpp +++ /dev/null @@ -1,216 +0,0 @@ -/* - * Copyright (c) 2008-2024, NVIDIA CORPORATION - * - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -#pragma once - -#include - -#include - -#include -#include -#include // for bad_alloc - -namespace cudf::detail { - -/*! \p pinned_allocator is a CUDA-specific host memory allocator - * that employs \c cudaMallocHost for allocation. - * - * This implementation is ported from the experimental/pinned_allocator - * that Thrust used to provide. - * - * \see https://en.cppreference.com/w/cpp/memory/allocator - */ -template -class pinned_allocator; - -/*! \p pinned_allocator is a CUDA-specific host memory allocator - * that employs \c cudaMallocHost for allocation. - * - * This implementation is ported from the experimental/pinned_allocator - * that Thrust used to provide. - * - * \see https://en.cppreference.com/w/cpp/memory/allocator - */ -template <> -class pinned_allocator { - public: - using value_type = void; ///< The type of the elements in the allocator - using pointer = void*; ///< The type returned by address() / allocate() - using const_pointer = void const*; ///< The type returned by address() - using size_type = std::size_t; ///< The type used for the size of the allocation - using difference_type = std::ptrdiff_t; ///< The type of the distance between two pointers - - /** - * @brief converts a `pinned_allocator` to `pinned_allocator` - */ - template - struct rebind { - using other = pinned_allocator; ///< The rebound type - }; -}; - -/*! \p pinned_allocator is a CUDA-specific host memory allocator - * that employs \c cudaMallocHost for allocation. - * - * This implementation is ported from the experimental/pinned_allocator - * that Thrust used to provide. 
- * - * \see https://en.cppreference.com/w/cpp/memory/allocator - */ -template -class pinned_allocator { - public: - using value_type = T; ///< The type of the elements in the allocator - using pointer = T*; ///< The type returned by address() / allocate() - using const_pointer = T const*; ///< The type returned by address() - using reference = T&; ///< The parameter type for address() - using const_reference = T const&; ///< The parameter type for address() - using size_type = std::size_t; ///< The type used for the size of the allocation - using difference_type = std::ptrdiff_t; ///< The type of the distance between two pointers - - /** - * @brief converts a `pinned_allocator` to `pinned_allocator` - */ - template - struct rebind { - using other = pinned_allocator; ///< The rebound type - }; - - /** - * @brief pinned_allocator's null constructor does nothing. - */ - __host__ __device__ inline pinned_allocator() {} - - /** - * @brief pinned_allocator's null destructor does nothing. - */ - __host__ __device__ inline ~pinned_allocator() {} - - /** - * @brief pinned_allocator's copy constructor does nothing. - */ - __host__ __device__ inline pinned_allocator(pinned_allocator const&) {} - - /** - * @brief pinned_allocator's copy constructor does nothing. - * - * This version of pinned_allocator's copy constructor - * is templated on the \c value_type of the pinned_allocator - * to copy from. It is provided merely for convenience; it - * does nothing. - */ - template - __host__ __device__ inline pinned_allocator(pinned_allocator const&) - { - } - - /** - * @brief This method returns the address of a \c reference of - * interest. - * - * @param r The \c reference of interest. - * @return \c r's address. - */ - __host__ __device__ inline pointer address(reference r) { return &r; } - - /** - * @brief This method returns the address of a \c const_reference - * of interest. - * - * @param r The \c const_reference of interest. - * @return \c r's address. - */ - __host__ __device__ inline const_pointer address(const_reference r) { return &r; } - - /** - * @brief This method allocates storage for objects in pinned host - * memory. - * - * @param cnt The number of objects to allocate. - * @return a \c pointer to the newly allocated objects. - * @note The second parameter to this function is meant as a - * hint pointer to a nearby memory location, but is - * not used by this allocator. - * @note This method does not invoke \p value_type's constructor. - * It is the responsibility of the caller to initialize the - * objects at the returned \c pointer. - */ - __host__ inline pointer allocate(size_type cnt, const_pointer /*hint*/ = 0) - { - if (cnt > this->max_size()) { throw std::bad_alloc(); } // end if - - pointer result(0); - CUDF_CUDA_TRY(cudaMallocHost(reinterpret_cast(&result), cnt * sizeof(value_type))); - return result; - } - - /** - * @brief This method deallocates pinned host memory previously allocated - * with this \c pinned_allocator. - * - * @param p A \c pointer to the previously allocated memory. - * @note The second parameter is the number of objects previously allocated - * but is ignored by this allocator. - * @note This method does not invoke \p value_type's destructor. - * It is the responsibility of the caller to destroy - * the objects stored at \p p. 
- */ - __host__ inline void deallocate(pointer p, size_type /*cnt*/) - { - auto dealloc_worked = cudaFreeHost(p); - (void)dealloc_worked; - assert(dealloc_worked == cudaSuccess); - } - - /** - * @brief This method returns the maximum size of the \c cnt parameter - * accepted by the \p allocate() method. - * - * @return The maximum number of objects that may be allocated - * by a single call to \p allocate(). - */ - inline size_type max_size() const { return (std::numeric_limits::max)() / sizeof(T); } - - /** - * @brief This method tests this \p pinned_allocator for equality to - * another. - * - * @param x The other \p pinned_allocator of interest. - * @return This method always returns \c true. - */ - __host__ __device__ inline bool operator==(pinned_allocator const& x) const { return true; } - - /** - * @brief This method tests this \p pinned_allocator for inequality - * to another. - * - * @param x The other \p pinned_allocator of interest. - * @return This method always returns \c false. - */ - __host__ __device__ inline bool operator!=(pinned_allocator const& x) const - { - return !operator==(x); - } -}; - -/** - * @brief A vector class with pinned host memory allocator - */ -template -using pinned_host_vector = thrust::host_vector>; - -} // namespace cudf::detail diff --git a/cpp/include/cudf/detail/utilities/vector_factories.hpp b/cpp/include/cudf/detail/utilities/vector_factories.hpp index 293a4096c57..20cb55bb1c7 100644 --- a/cpp/include/cudf/detail/utilities/vector_factories.hpp +++ b/cpp/include/cudf/detail/utilities/vector_factories.hpp @@ -21,8 +21,10 @@ * @file vector_factories.hpp */ +#include #include #include +#include #include #include @@ -380,7 +382,7 @@ thrust::host_vector make_host_vector_async(device_span v, rmm::cuda_ * @brief Asynchronously construct a `std::vector` containing a copy of data from a device * container * - * @note This function synchronizes `stream`. + * @note This function does not synchronize `stream`. * * @tparam Container The type of the container to copy from * @tparam T The type of the data to copy @@ -439,6 +441,40 @@ thrust::host_vector make_host_vector_sync( return make_host_vector_sync(device_span{c}, stream); } +/** + * @brief Asynchronously construct a pinned `cudf::detail::host_vector` of the given size + * + * @note This function may not synchronize `stream`. + * + * @tparam T The type of the vector data + * @param size The number of elements in the created vector + * @param stream The stream on which to allocate memory + * @return A host_vector of the given size + */ +template +host_vector make_pinned_vector_async(size_t size, rmm::cuda_stream_view stream) +{ + return host_vector(size, {cudf::get_pinned_memory_resource(), stream}); +} + +/** + * @brief Synchronously construct a pinned `cudf::detail::host_vector` of the given size + * + * @note This function synchronizes `stream`. 
+ * + * @tparam T The type of the vector data + * @param size The number of elements in the created vector + * @param stream The stream on which to allocate memory + * @return A host_vector of the given size + */ +template +host_vector make_pinned_vector_sync(size_t size, rmm::cuda_stream_view stream) +{ + auto result = make_pinned_vector_async(size, stream); + stream.synchronize(); + return result; +} + } // namespace detail } // namespace cudf diff --git a/cpp/include/cudf/io/memory_resource.hpp b/cpp/include/cudf/io/memory_resource.hpp deleted file mode 100644 index a36e220ae7b..00000000000 --- a/cpp/include/cudf/io/memory_resource.hpp +++ /dev/null @@ -1,65 +0,0 @@ -/* - * Copyright (c) 2024, NVIDIA CORPORATION. - * - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -#pragma once - -#include - -#include - -namespace cudf::io { - -/** - * @brief Set the rmm resource to be used for host memory allocations by - * cudf::detail::hostdevice_vector - * - * hostdevice_vector is a utility class that uses a pair of host and device-side buffers for - * bouncing state between the cpu and the gpu. The resource set with this function (typically a - * pinned memory allocator) is what it uses to allocate space for it's host-side buffer. - * - * @param mr The rmm resource to be used for host-side allocations - * @return The previous resource that was in use - */ -rmm::host_async_resource_ref set_host_memory_resource(rmm::host_async_resource_ref mr); - -/** - * @brief Get the rmm resource being used for host memory allocations by - * cudf::detail::hostdevice_vector - * - * @return The rmm resource used for host-side allocations - */ -rmm::host_async_resource_ref get_host_memory_resource(); - -/** - * @brief Options to configure the default host memory resource - */ -struct host_mr_options { - std::optional pool_size; ///< The size of the pool to use for the default host memory - ///< resource. If not set, the default pool size is used. -}; - -/** - * @brief Configure the size of the default host memory resource. - * - * @throws cudf::logic_error if called after the default host memory resource has been created - * - * @param opts Options to configure the default host memory resource - * @return True if this call successfully configured the host memory resource, false if a - * a resource was already configured. - */ -bool config_default_host_memory_resource(host_mr_options const& opts); - -} // namespace cudf::io diff --git a/cpp/include/cudf/utilities/pinned_memory.hpp b/cpp/include/cudf/utilities/pinned_memory.hpp new file mode 100644 index 00000000000..b423eab6d38 --- /dev/null +++ b/cpp/include/cudf/utilities/pinned_memory.hpp @@ -0,0 +1,58 @@ +/* + * Copyright (c) 2024, NVIDIA CORPORATION. + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. 
+ * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +#pragma once + +#include + +#include + +namespace cudf { + +/** + * @brief Set the rmm resource to be used for pinned memory allocations. + * + * @param mr The rmm resource to be used for pinned allocations + * @return The previous resource that was in use + */ +rmm::host_device_async_resource_ref set_pinned_memory_resource( + rmm::host_device_async_resource_ref mr); + +/** + * @brief Get the rmm resource being used for pinned memory allocations. + * + * @return The rmm resource used for pinned allocations + */ +rmm::host_device_async_resource_ref get_pinned_memory_resource(); + +/** + * @brief Options to configure the default pinned memory resource + */ +struct pinned_mr_options { + std::optional pool_size; ///< The size of the pool to use for the default pinned memory + ///< resource. If not set, the default pool size is used. +}; + +/** + * @brief Configure the size of the default pinned memory resource. + * + * @param opts Options to configure the default pinned memory resource + * @return True if this call successfully configured the pinned memory resource, false if a + * a resource was already configured. + */ +bool config_default_pinned_memory_resource(pinned_mr_options const& opts); + +} // namespace cudf diff --git a/cpp/src/io/csv/reader_impl.cu b/cpp/src/io/csv/reader_impl.cu index 5dee0c17a33..05faded651d 100644 --- a/cpp/src/io/csv/reader_impl.cu +++ b/cpp/src/io/csv/reader_impl.cu @@ -27,6 +27,7 @@ #include "io/utilities/parsing_utils.cuh" #include +#include #include #include #include diff --git a/cpp/src/io/orc/reader_impl_chunking.cu b/cpp/src/io/orc/reader_impl_chunking.cu index 5034aa14a95..43301826003 100644 --- a/cpp/src/io/orc/reader_impl_chunking.cu +++ b/cpp/src/io/orc/reader_impl_chunking.cu @@ -22,6 +22,7 @@ #include #include +#include #include #include diff --git a/cpp/src/io/orc/writer_impl.cu b/cpp/src/io/orc/writer_impl.cu index 344e216cdc8..e9e031a407a 100644 --- a/cpp/src/io/orc/writer_impl.cu +++ b/cpp/src/io/orc/writer_impl.cu @@ -27,7 +27,6 @@ #include #include #include -#include #include #include #include @@ -2339,7 +2338,7 @@ auto convert_table_to_orc_data(table_view const& input, std::move(streams), std::move(stripes), std::move(stripe_dicts.views), - cudf::detail::pinned_host_vector()}; + cudf::detail::make_pinned_vector_async(0, stream)}; } // Allocate intermediate output stream buffer @@ -2407,7 +2406,7 @@ auto convert_table_to_orc_data(table_view const& input, return max_stream_size; }(); - cudf::detail::pinned_host_vector bounce_buffer(max_out_stream_size); + auto bounce_buffer = cudf::detail::make_pinned_vector_async(max_out_stream_size, stream); auto intermediate_stats = gather_statistic_blobs(stats_freq, orc_table, segmentation, stream); diff --git a/cpp/src/io/parquet/reader_impl_helpers.cpp b/cpp/src/io/parquet/reader_impl_helpers.cpp index eb653c6b9ac..9de8a9e2719 100644 --- a/cpp/src/io/parquet/reader_impl_helpers.cpp +++ b/cpp/src/io/parquet/reader_impl_helpers.cpp @@ -23,6 +23,8 @@ #include "ipc/Message_generated.h" #include "ipc/Schema_generated.h" +#include + #include #include diff --git 
a/cpp/src/io/parquet/writer_impl.cu b/cpp/src/io/parquet/writer_impl.cu index 1dfced94f5b..6d466748c17 100644 --- a/cpp/src/io/parquet/writer_impl.cu +++ b/cpp/src/io/parquet/writer_impl.cu @@ -36,7 +36,6 @@ #include #include #include -#include #include #include #include @@ -2278,7 +2277,7 @@ auto convert_table_to_parquet_data(table_input_metadata& table_meta, } auto bounce_buffer = - cudf::detail::pinned_host_vector(all_device_write ? 0 : max_write_size); + cudf::detail::make_pinned_vector_async(all_device_write ? 0 : max_write_size, stream); return std::tuple{std::move(agg_meta), std::move(pages), diff --git a/cpp/src/io/text/bgzip_data_chunk_source.cu b/cpp/src/io/text/bgzip_data_chunk_source.cu index faa09e586ab..0e3ce779089 100644 --- a/cpp/src/io/text/bgzip_data_chunk_source.cu +++ b/cpp/src/io/text/bgzip_data_chunk_source.cu @@ -19,8 +19,9 @@ #include "io/utilities/config_utils.hpp" #include +#include #include -#include +#include #include #include #include @@ -66,7 +67,7 @@ struct bgzip_nvcomp_transform_functor { class bgzip_data_chunk_reader : public data_chunk_reader { private: template - static void copy_to_device(cudf::detail::pinned_host_vector const& host, + static void copy_to_device(cudf::detail::host_vector const& host, rmm::device_uvector& device, rmm::cuda_stream_view stream) { @@ -84,9 +85,9 @@ class bgzip_data_chunk_reader : public data_chunk_reader { 1 << 16; // 64k offset allocation, resized on demand cudaEvent_t event; - cudf::detail::pinned_host_vector h_compressed_blocks; - cudf::detail::pinned_host_vector h_compressed_offsets; - cudf::detail::pinned_host_vector h_decompressed_offsets; + cudf::detail::host_vector h_compressed_blocks; + cudf::detail::host_vector h_compressed_offsets; + cudf::detail::host_vector h_decompressed_offsets; rmm::device_uvector d_compressed_blocks; rmm::device_uvector d_decompressed_blocks; rmm::device_uvector d_compressed_offsets; @@ -103,7 +104,10 @@ class bgzip_data_chunk_reader : public data_chunk_reader { bool is_decompressed{}; decompression_blocks(rmm::cuda_stream_view init_stream) - : d_compressed_blocks(0, init_stream), + : h_compressed_blocks{cudf::detail::make_pinned_vector_async(0, init_stream)}, + h_compressed_offsets{cudf::detail::make_pinned_vector_async(0, init_stream)}, + h_decompressed_offsets{cudf::detail::make_pinned_vector_async(0, init_stream)}, + d_compressed_blocks(0, init_stream), d_decompressed_blocks(0, init_stream), d_compressed_offsets(0, init_stream), d_decompressed_offsets(0, init_stream), diff --git a/cpp/src/io/text/data_chunk_source_factories.cpp b/cpp/src/io/text/data_chunk_source_factories.cpp index 9d1d0498ace..596ca3458c8 100644 --- a/cpp/src/io/text/data_chunk_source_factories.cpp +++ b/cpp/src/io/text/data_chunk_source_factories.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2021-2023, NVIDIA CORPORATION. + * Copyright (c) 2021-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -14,10 +14,12 @@ * limitations under the License. */ +#include "cudf/utilities/default_stream.hpp" #include "io/text/device_data_chunks.hpp" #include -#include +#include +#include #include #include @@ -31,8 +33,15 @@ namespace cudf::io::text { namespace { struct host_ticket { - cudaEvent_t event; - cudf::detail::pinned_host_vector buffer; + cudaEvent_t event{}; // tracks the completion of the last device-to-host copy. 
+ cudf::detail::host_vector buffer; + + host_ticket() : buffer{cudf::detail::make_pinned_vector_sync(0, cudf::get_default_stream())} + { + cudaEventCreate(&event); + } + + ~host_ticket() { cudaEventDestroy(event); } }; /** @@ -43,20 +52,7 @@ class datasource_chunk_reader : public data_chunk_reader { constexpr static int num_tickets = 2; public: - datasource_chunk_reader(datasource* source) : _source(source) - { - // create an event to track the completion of the last device-to-host copy. - for (auto& ticket : _tickets) { - CUDF_CUDA_TRY(cudaEventCreate(&(ticket.event))); - } - } - - ~datasource_chunk_reader() override - { - for (auto& ticket : _tickets) { - CUDF_CUDA_TRY(cudaEventDestroy(ticket.event)); - } - } + datasource_chunk_reader(datasource* source) : _source(source) {} void skip_bytes(std::size_t size) override { @@ -84,7 +80,9 @@ class datasource_chunk_reader : public data_chunk_reader { CUDF_CUDA_TRY(cudaEventSynchronize(h_ticket.event)); // resize the host buffer as necessary to contain the requested number of bytes - if (h_ticket.buffer.size() < read_size) { h_ticket.buffer.resize(read_size); } + if (h_ticket.buffer.size() < read_size) { + h_ticket.buffer = cudf::detail::make_pinned_vector_sync(read_size, stream); + } _source->host_read(_offset, read_size, reinterpret_cast(h_ticket.buffer.data())); @@ -120,17 +118,6 @@ class istream_data_chunk_reader : public data_chunk_reader { istream_data_chunk_reader(std::unique_ptr datastream) : _datastream(std::move(datastream)) { - // create an event to track the completion of the last device-to-host copy. - for (auto& ticket : _tickets) { - CUDF_CUDA_TRY(cudaEventCreate(&(ticket.event))); - } - } - - ~istream_data_chunk_reader() override - { - for (auto& ticket : _tickets) { - CUDF_CUDA_TRY(cudaEventDestroy(ticket.event)); - } } void skip_bytes(std::size_t size) override { _datastream->ignore(size); }; @@ -148,7 +135,9 @@ class istream_data_chunk_reader : public data_chunk_reader { CUDF_CUDA_TRY(cudaEventSynchronize(h_ticket.event)); // resize the host buffer as necessary to contain the requested number of bytes - if (h_ticket.buffer.size() < read_size) { h_ticket.buffer.resize(read_size); } + if (h_ticket.buffer.size() < read_size) { + h_ticket.buffer = cudf::detail::make_pinned_vector_sync(read_size, stream); + } // read data from the host istream in to the pinned host memory buffer _datastream->read(h_ticket.buffer.data(), read_size); diff --git a/cpp/src/io/utilities/config_utils.cpp b/cpp/src/io/utilities/config_utils.cpp index dad1135e766..20ac89b4d53 100644 --- a/cpp/src/io/utilities/config_utils.cpp +++ b/cpp/src/io/utilities/config_utils.cpp @@ -16,22 +16,12 @@ #include "config_utils.hpp" -#include -#include #include -#include - -#include -#include -#include -#include #include #include -namespace cudf::io { - -namespace detail { +namespace cudf::io::detail { namespace cufile_integration { @@ -90,204 +80,4 @@ bool is_stable_enabled() { return is_all_enabled() or get_env_policy() == usage_ } // namespace nvcomp_integration -} // namespace detail - -namespace { -class fixed_pinned_pool_memory_resource { - using upstream_mr = rmm::mr::pinned_host_memory_resource; - using host_pooled_mr = rmm::mr::pool_memory_resource; - - private: - upstream_mr upstream_mr_{}; - size_t pool_size_{0}; - // Raw pointer to avoid a segfault when the pool is destroyed on exit - host_pooled_mr* pool_{nullptr}; - void* pool_begin_{nullptr}; - void* pool_end_{nullptr}; - cuda::stream_ref 
stream_{cudf::detail::global_cuda_stream_pool().get_stream().value()}; - - public: - fixed_pinned_pool_memory_resource(size_t size) - : pool_size_{size}, pool_{new host_pooled_mr(upstream_mr_, size, size)} - { - if (pool_size_ == 0) { return; } - - // Allocate full size from the pinned pool to figure out the beginning and end address - pool_begin_ = pool_->allocate_async(pool_size_, stream_); - pool_end_ = static_cast(static_cast(pool_begin_) + pool_size_); - pool_->deallocate_async(pool_begin_, pool_size_, stream_); - } - - void* do_allocate_async(std::size_t bytes, std::size_t alignment, cuda::stream_ref stream) - { - if (bytes <= pool_size_) { - try { - return pool_->allocate_async(bytes, alignment, stream); - } catch (...) { - // If the pool is exhausted, fall back to the upstream memory resource - } - } - - return upstream_mr_.allocate_async(bytes, alignment, stream); - } - - void do_deallocate_async(void* ptr, - std::size_t bytes, - std::size_t alignment, - cuda::stream_ref stream) noexcept - { - if (bytes <= pool_size_ && ptr >= pool_begin_ && ptr <= pool_end_) { - pool_->deallocate_async(ptr, bytes, alignment, stream); - } else { - upstream_mr_.deallocate_async(ptr, bytes, alignment, stream); - } - } - - void* allocate_async(std::size_t bytes, cuda::stream_ref stream) - { - return do_allocate_async(bytes, rmm::RMM_DEFAULT_HOST_ALIGNMENT, stream); - } - - void* allocate_async(std::size_t bytes, std::size_t alignment, cuda::stream_ref stream) - { - return do_allocate_async(bytes, alignment, stream); - } - - void* allocate(std::size_t bytes, std::size_t alignment = rmm::RMM_DEFAULT_HOST_ALIGNMENT) - { - auto const result = do_allocate_async(bytes, alignment, stream_); - stream_.wait(); - return result; - } - - void deallocate_async(void* ptr, std::size_t bytes, cuda::stream_ref stream) noexcept - { - return do_deallocate_async(ptr, bytes, rmm::RMM_DEFAULT_HOST_ALIGNMENT, stream); - } - - void deallocate_async(void* ptr, - std::size_t bytes, - std::size_t alignment, - cuda::stream_ref stream) noexcept - { - return do_deallocate_async(ptr, bytes, alignment, stream); - } - - void deallocate(void* ptr, - std::size_t bytes, - std::size_t alignment = rmm::RMM_DEFAULT_HOST_ALIGNMENT) noexcept - { - deallocate_async(ptr, bytes, alignment, stream_); - stream_.wait(); - } - - bool operator==(fixed_pinned_pool_memory_resource const& other) const - { - return pool_ == other.pool_ and stream_ == other.stream_; - } - - bool operator!=(fixed_pinned_pool_memory_resource const& other) const - { - return !operator==(other); - } - - [[maybe_unused]] friend void get_property(fixed_pinned_pool_memory_resource const&, - cuda::mr::device_accessible) noexcept - { - } - - [[maybe_unused]] friend void get_property(fixed_pinned_pool_memory_resource const&, - cuda::mr::host_accessible) noexcept - { - } -}; - -static_assert(cuda::mr::resource_with, - ""); - -} // namespace - -CUDF_EXPORT rmm::host_async_resource_ref& make_default_pinned_mr(std::optional config_size) -{ - static fixed_pinned_pool_memory_resource mr = [config_size]() { - auto const size = [&config_size]() -> size_t { - if (auto const env_val = getenv("LIBCUDF_PINNED_POOL_SIZE"); env_val != nullptr) { - return std::atol(env_val); - } - - if (config_size.has_value()) { return *config_size; } - - size_t free{}, total{}; - CUDF_CUDA_TRY(cudaMemGetInfo(&free, &total)); - // 0.5% of the total device memory, capped at 100MB - return std::min(total / 200, size_t{100} * 1024 * 1024); - }(); - - // rmm requires the pool size to be a multiple of 256 bytes - 
auto const aligned_size = (size + 255) & ~255; - CUDF_LOG_INFO("Pinned pool size = {}", aligned_size); - - // make the pool with max size equal to the initial size - return fixed_pinned_pool_memory_resource{aligned_size}; - }(); - - static rmm::host_async_resource_ref mr_ref{mr}; - return mr_ref; -} - -CUDF_EXPORT std::mutex& host_mr_mutex() -{ - static std::mutex map_lock; - return map_lock; -} - -// Must be called with the host_mr_mutex mutex held -CUDF_EXPORT rmm::host_async_resource_ref& make_host_mr(std::optional const& opts, - bool* did_configure = nullptr) -{ - static rmm::host_async_resource_ref* mr_ref = nullptr; - bool configured = false; - if (mr_ref == nullptr) { - configured = true; - mr_ref = &make_default_pinned_mr(opts ? opts->pool_size : std::nullopt); - } - - // If the user passed an out param to detect whether this call configured a resource - // set the result - if (did_configure != nullptr) { *did_configure = configured; } - - return *mr_ref; -} - -// Must be called with the host_mr_mutex mutex held -CUDF_EXPORT rmm::host_async_resource_ref& host_mr() -{ - static rmm::host_async_resource_ref mr_ref = make_host_mr(std::nullopt); - return mr_ref; -} - -rmm::host_async_resource_ref set_host_memory_resource(rmm::host_async_resource_ref mr) -{ - std::scoped_lock lock{host_mr_mutex()}; - auto last_mr = host_mr(); - host_mr() = mr; - return last_mr; -} - -rmm::host_async_resource_ref get_host_memory_resource() -{ - std::scoped_lock lock{host_mr_mutex()}; - return host_mr(); -} - -bool config_default_host_memory_resource(host_mr_options const& opts) -{ - std::scoped_lock lock{host_mr_mutex()}; - auto did_configure = false; - make_host_mr(opts, &did_configure); - return did_configure; -} - -} // namespace cudf::io +} // namespace cudf::io::detail diff --git a/cpp/src/io/utilities/hostdevice_vector.hpp b/cpp/src/io/utilities/hostdevice_vector.hpp index 0883ac3609f..1ae27a2f4ae 100644 --- a/cpp/src/io/utilities/hostdevice_vector.hpp +++ b/cpp/src/io/utilities/hostdevice_vector.hpp @@ -16,11 +16,10 @@ #pragma once -#include "config_utils.hpp" #include "hostdevice_span.hpp" -#include -#include +#include +#include #include #include #include @@ -53,7 +52,7 @@ class hostdevice_vector { } explicit hostdevice_vector(size_t initial_size, size_t max_size, rmm::cuda_stream_view stream) - : h_data({cudf::io::get_host_memory_resource(), stream}), d_data(max_size, stream) + : h_data{make_pinned_vector_async(0, stream)}, d_data(max_size, stream) { CUDF_EXPECTS(initial_size <= max_size, "initial_size cannot be larger than max_size"); @@ -173,7 +172,7 @@ class hostdevice_vector { } private: - cudf::detail::rmm_host_vector h_data; + cudf::detail::host_vector h_data; rmm::device_uvector d_data; }; diff --git a/cpp/src/utilities/pinned_memory.cpp b/cpp/src/utilities/pinned_memory.cpp new file mode 100644 index 00000000000..5d2e3ac332a --- /dev/null +++ b/cpp/src/utilities/pinned_memory.cpp @@ -0,0 +1,216 @@ +/* + * Copyright (c) 2024, NVIDIA CORPORATION. + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
+ * See the License for the specific language governing permissions and + * limitations under the License. + */ + +#include +#include +#include +#include +#include + +#include +#include +#include +#include + +namespace cudf { + +namespace { +class fixed_pinned_pool_memory_resource { + using upstream_mr = rmm::mr::pinned_host_memory_resource; + using host_pooled_mr = rmm::mr::pool_memory_resource; + + private: + upstream_mr upstream_mr_{}; + size_t pool_size_{0}; + // Raw pointer to avoid a segfault when the pool is destroyed on exit + host_pooled_mr* pool_{nullptr}; + void* pool_begin_{nullptr}; + void* pool_end_{nullptr}; + cuda::stream_ref stream_{cudf::detail::global_cuda_stream_pool().get_stream().value()}; + + public: + fixed_pinned_pool_memory_resource(size_t size) + : pool_size_{size}, pool_{new host_pooled_mr(upstream_mr_, size, size)} + { + if (pool_size_ == 0) { return; } + + // Allocate full size from the pinned pool to figure out the beginning and end address + pool_begin_ = pool_->allocate_async(pool_size_, stream_); + pool_end_ = static_cast(static_cast(pool_begin_) + pool_size_); + pool_->deallocate_async(pool_begin_, pool_size_, stream_); + } + + void* allocate_async(std::size_t bytes, std::size_t alignment, cuda::stream_ref stream) + { + if (bytes <= pool_size_) { + try { + return pool_->allocate_async(bytes, alignment, stream); + } catch (...) { + // If the pool is exhausted, fall back to the upstream memory resource + } + } + + return upstream_mr_.allocate_async(bytes, alignment, stream); + } + + void* allocate_async(std::size_t bytes, cuda::stream_ref stream) + { + return allocate_async(bytes, rmm::RMM_DEFAULT_HOST_ALIGNMENT, stream); + } + + void* allocate(std::size_t bytes, std::size_t alignment = rmm::RMM_DEFAULT_HOST_ALIGNMENT) + { + auto const result = allocate_async(bytes, alignment, stream_); + stream_.wait(); + return result; + } + + void deallocate_async(void* ptr, + std::size_t bytes, + std::size_t alignment, + cuda::stream_ref stream) noexcept + { + if (bytes <= pool_size_ && ptr >= pool_begin_ && ptr < pool_end_) { + pool_->deallocate_async(ptr, bytes, alignment, stream); + } else { + upstream_mr_.deallocate_async(ptr, bytes, alignment, stream); + } + } + + void deallocate_async(void* ptr, std::size_t bytes, cuda::stream_ref stream) noexcept + { + return deallocate_async(ptr, bytes, rmm::RMM_DEFAULT_HOST_ALIGNMENT, stream); + } + + void deallocate(void* ptr, + std::size_t bytes, + std::size_t alignment = rmm::RMM_DEFAULT_HOST_ALIGNMENT) noexcept + { + deallocate_async(ptr, bytes, alignment, stream_); + stream_.wait(); + } + + bool operator==(fixed_pinned_pool_memory_resource const& other) const + { + return pool_ == other.pool_ and stream_ == other.stream_; + } + + bool operator!=(fixed_pinned_pool_memory_resource const& other) const + { + return !operator==(other); + } + + friend void get_property(fixed_pinned_pool_memory_resource const&, + cuda::mr::device_accessible) noexcept + { + } + + friend void get_property(fixed_pinned_pool_memory_resource const&, + cuda::mr::host_accessible) noexcept + { + } +}; + +static_assert(cuda::mr::resource_with, + "Pinned pool mr must be accessible from both host and device"); + +CUDF_EXPORT rmm::host_device_async_resource_ref& make_default_pinned_mr( + std::optional config_size) +{ + static fixed_pinned_pool_memory_resource mr = [config_size]() { + auto const size = [&config_size]() -> size_t { + if (auto const env_val = getenv("LIBCUDF_PINNED_POOL_SIZE"); env_val != nullptr) { + return std::atol(env_val); + } + + if 
(config_size.has_value()) { return *config_size; } + + auto const total = rmm::available_device_memory().second; + // 0.5% of the total device memory, capped at 100MB + return std::min(total / 200, size_t{100} * 1024 * 1024); + }(); + + // rmm requires the pool size to be a multiple of 256 bytes + auto const aligned_size = rmm::align_up(size, rmm::RMM_DEFAULT_HOST_ALIGNMENT); + CUDF_LOG_INFO("Pinned pool size = {}", aligned_size); + + // make the pool with max size equal to the initial size + return fixed_pinned_pool_memory_resource{aligned_size}; + }(); + + static rmm::host_device_async_resource_ref mr_ref{mr}; + return mr_ref; +} + +CUDF_EXPORT std::mutex& host_mr_mutex() +{ + static std::mutex map_lock; + return map_lock; +} + +// Must be called with the host_mr_mutex mutex held +CUDF_EXPORT rmm::host_device_async_resource_ref& make_host_mr( + std::optional const& opts, bool* did_configure = nullptr) +{ + static rmm::host_device_async_resource_ref* mr_ref = nullptr; + bool configured = false; + if (mr_ref == nullptr) { + configured = true; + mr_ref = &make_default_pinned_mr(opts ? opts->pool_size : std::nullopt); + } + + // If the user passed an out param to detect whether this call configured a resource + // set the result + if (did_configure != nullptr) { *did_configure = configured; } + + return *mr_ref; +} + +// Must be called with the host_mr_mutex mutex held +CUDF_EXPORT rmm::host_device_async_resource_ref& host_mr() +{ + static rmm::host_device_async_resource_ref mr_ref = make_host_mr(std::nullopt); + return mr_ref; +} + +} // namespace + +rmm::host_device_async_resource_ref set_pinned_memory_resource( + rmm::host_device_async_resource_ref mr) +{ + std::scoped_lock lock{host_mr_mutex()}; + auto last_mr = host_mr(); + host_mr() = mr; + return last_mr; +} + +rmm::host_device_async_resource_ref get_pinned_memory_resource() +{ + std::scoped_lock lock{host_mr_mutex()}; + return host_mr(); +} + +bool config_default_pinned_memory_resource(pinned_mr_options const& opts) +{ + std::scoped_lock lock{host_mr_mutex()}; + auto did_configure = false; + make_host_mr(opts, &did_configure); + return did_configure; +} + +} // namespace cudf diff --git a/cpp/tests/CMakeLists.txt b/cpp/tests/CMakeLists.txt index 826f879ddc0..f6d762cc2ec 100644 --- a/cpp/tests/CMakeLists.txt +++ b/cpp/tests/CMakeLists.txt @@ -380,15 +380,16 @@ ConfigureTest( # * utilities tests ------------------------------------------------------------------------------- ConfigureTest( UTILITIES_TEST - utilities_tests/type_list_tests.cpp utilities_tests/column_debug_tests.cpp utilities_tests/column_utilities_tests.cpp utilities_tests/column_wrapper_tests.cpp + utilities_tests/default_stream_tests.cpp utilities_tests/io_utilities_tests.cpp utilities_tests/lists_column_wrapper_tests.cpp utilities_tests/logger_tests.cpp - utilities_tests/default_stream_tests.cpp + utilities_tests/pinned_memory_tests.cpp utilities_tests/type_check_tests.cpp + utilities_tests/type_list_tests.cpp ) # ################################################################################################## diff --git a/cpp/tests/io/json_test.cpp b/cpp/tests/io/json_test.cpp index 57aa2721756..4c01a1fb87b 100644 --- a/cpp/tests/io/json_test.cpp +++ b/cpp/tests/io/json_test.cpp @@ -28,13 +28,13 @@ #include #include #include -#include #include #include #include #include #include #include +#include #include @@ -2068,7 +2068,7 @@ TEST_F(JsonReaderTest, JSONLinesRecoveringSync) size_t{128} * 1024 * 1024}; // Set new resource - auto last_mr = 
cudf::io::set_host_memory_resource(mr); + auto last_mr = cudf::set_pinned_memory_resource(mr); /** * @brief Spark has the specific need to ignore extra characters that come after the first record @@ -2158,7 +2158,7 @@ TEST_F(JsonReaderTest, JSONLinesRecoveringSync) float64_wrapper{c_data.cbegin(), c_data.cend(), c_validity.cbegin()}); // Restore original memory source - cudf::io::set_host_memory_resource(last_mr); + cudf::set_pinned_memory_resource(last_mr); } TEST_F(JsonReaderTest, MixedTypes) diff --git a/cpp/tests/utilities_tests/io_utilities_tests.cpp b/cpp/tests/utilities_tests/io_utilities_tests.cpp index e5a153bf781..9ed8f18f5cc 100644 --- a/cpp/tests/utilities_tests/io_utilities_tests.cpp +++ b/cpp/tests/utilities_tests/io_utilities_tests.cpp @@ -16,14 +16,6 @@ #include #include -#include - -#include -#include - -#include -#include -#include #include @@ -32,43 +24,6 @@ using cudf::io::detail::base64_encode; class IoUtilitiesTest : public cudf::test::BaseFixture {}; -TEST(IoUtilitiesTest, HostMemoryGetAndSet) -{ - // Global environment for temporary files - auto const temp_env = static_cast( - ::testing::AddGlobalTestEnvironment(new cudf::test::TempDirTestEnvironment)); - - // pinned/pooled host memory resource - using host_pooled_mr = rmm::mr::pool_memory_resource; - host_pooled_mr mr(std::make_shared().get(), - size_t{128} * 1024 * 1024); - - // set new resource - auto last_mr = cudf::io::get_host_memory_resource(); - cudf::io::set_host_memory_resource(mr); - - constexpr int num_rows = 32 * 1024; - auto valids = - cudf::detail::make_counting_transform_iterator(0, [&](int index) { return index % 2; }); - auto values = thrust::make_counting_iterator(0); - - cudf::test::fixed_width_column_wrapper col(values, values + num_rows, valids); - - cudf::table_view expected({col}); - auto filepath = temp_env->get_temp_filepath("IoUtilsMemTest.parquet"); - cudf::io::parquet_writer_options out_args = - cudf::io::parquet_writer_options::builder(cudf::io::sink_info{filepath}, expected); - cudf::io::write_parquet(out_args); - - cudf::io::parquet_reader_options const read_opts = - cudf::io::parquet_reader_options::builder(cudf::io::source_info{filepath}); - auto const result = cudf::io::read_parquet(read_opts); - CUDF_TEST_EXPECT_TABLES_EQUAL(*result.tbl, expected); - - // reset memory resource back - cudf::io::set_host_memory_resource(last_mr); -} - TEST(IoUtilitiesTest, Base64EncodeAndDecode) { // a vector of lorem ipsum strings diff --git a/cpp/tests/utilities_tests/pinned_memory_tests.cpp b/cpp/tests/utilities_tests/pinned_memory_tests.cpp new file mode 100644 index 00000000000..df9103640f4 --- /dev/null +++ b/cpp/tests/utilities_tests/pinned_memory_tests.cpp @@ -0,0 +1,65 @@ +/* + * Copyright (c) 2024, NVIDIA CORPORATION. + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +#include +#include +#include + +#include +#include + +#include +#include +#include + +class PinnedMemoryTest : public cudf::test::BaseFixture {}; + +TEST(PinnedMemoryTest, MemoryResourceGetAndSet) +{ + // Global environment for temporary files + auto const temp_env = static_cast( + ::testing::AddGlobalTestEnvironment(new cudf::test::TempDirTestEnvironment)); + + // pinned/pooled host memory resource + using host_pooled_mr = rmm::mr::pool_memory_resource; + host_pooled_mr mr(std::make_shared().get(), + 4 * 1024 * 1024); + + // set new resource + auto last_mr = cudf::get_pinned_memory_resource(); + cudf::set_pinned_memory_resource(mr); + + constexpr int num_rows = 32 * 1024; + auto valids = + cudf::detail::make_counting_transform_iterator(0, [&](int index) { return index % 2; }); + auto values = thrust::make_counting_iterator(0); + + cudf::test::fixed_width_column_wrapper col(values, values + num_rows, valids); + + cudf::table_view expected({col}); + auto filepath = temp_env->get_temp_filepath("MemoryResourceGetAndSetTest.parquet"); + cudf::io::parquet_writer_options out_args = + cudf::io::parquet_writer_options::builder(cudf::io::sink_info{filepath}, expected); + cudf::io::write_parquet(out_args); + + cudf::io::parquet_reader_options const read_opts = + cudf::io::parquet_reader_options::builder(cudf::io::source_info{filepath}); + auto const result = cudf::io::read_parquet(read_opts); + CUDF_TEST_EXPECT_TABLES_EQUAL(*result.tbl, expected); + + // reset memory resource back + cudf::set_pinned_memory_resource(last_mr); +} diff --git a/java/src/main/java/ai/rapids/cudf/PinnedMemoryPool.java b/java/src/main/java/ai/rapids/cudf/PinnedMemoryPool.java index 83b801db7fb..df0d9dc7c3e 100644 --- a/java/src/main/java/ai/rapids/cudf/PinnedMemoryPool.java +++ b/java/src/main/java/ai/rapids/cudf/PinnedMemoryPool.java @@ -128,9 +128,9 @@ public static synchronized void initialize(long poolSize, int gpuId) { * * @param poolSize size of the pool to initialize. 
* @param gpuId gpu id to set to get memory pool from, -1 means to use default - * @param setCuioHostMemoryResource true if this pinned pool should be used by cuIO for host memory + * @param setCudfPinnedPoolMemoryResource true if this pinned pool should be used by cuDF for pinned memory */ - public static synchronized void initialize(long poolSize, int gpuId, boolean setCuioHostMemoryResource) { + public static synchronized void initialize(long poolSize, int gpuId, boolean setCudfPinnedPoolMemoryResource) { if (isInitialized()) { throw new IllegalStateException("Can only initialize the pool once."); } @@ -139,7 +139,7 @@ public static synchronized void initialize(long poolSize, int gpuId, boolean set t.setDaemon(true); return t; }); - initFuture = initService.submit(() -> new PinnedMemoryPool(poolSize, gpuId, setCuioHostMemoryResource)); + initFuture = initService.submit(() -> new PinnedMemoryPool(poolSize, gpuId, setCudfPinnedPoolMemoryResource)); initService.shutdown(); } @@ -216,15 +216,15 @@ public static long getTotalPoolSizeBytes() { return 0; } - private PinnedMemoryPool(long poolSize, int gpuId, boolean setCuioHostMemoryResource) { + private PinnedMemoryPool(long poolSize, int gpuId, boolean setCudfPinnedPoolMemoryResource) { if (gpuId > -1) { // set the gpu device to use Cuda.setDevice(gpuId); Cuda.freeZero(); } this.poolHandle = Rmm.newPinnedPoolMemoryResource(poolSize, poolSize); - if (setCuioHostMemoryResource) { - Rmm.setCuioPinnedPoolMemoryResource(this.poolHandle); + if (setCudfPinnedPoolMemoryResource) { + Rmm.setCudfPinnedPoolMemoryResource(this.poolHandle); } this.poolSize = poolSize; } diff --git a/java/src/main/java/ai/rapids/cudf/Rmm.java b/java/src/main/java/ai/rapids/cudf/Rmm.java index 4dee1b7aa24..ed029c918e4 100755 --- a/java/src/main/java/ai/rapids/cudf/Rmm.java +++ b/java/src/main/java/ai/rapids/cudf/Rmm.java @@ -597,7 +597,7 @@ static native long newEventHandlerResourceAdaptor(long handle, long trackerHandl public static native long newPinnedPoolMemoryResource(long initSize, long maxSize); - public static native long setCuioPinnedPoolMemoryResource(long poolPtr); + public static native long setCudfPinnedPoolMemoryResource(long poolPtr); public static native void releasePinnedPoolMemoryResource(long poolPtr); diff --git a/java/src/main/native/src/RmmJni.cpp b/java/src/main/native/src/RmmJni.cpp index fa78f6ca4e2..8bd0f7793b4 100644 --- a/java/src/main/native/src/RmmJni.cpp +++ b/java/src/main/native/src/RmmJni.cpp @@ -16,7 +16,7 @@ #include "cudf_jni_apis.hpp" -#include +#include #include #include @@ -395,15 +395,17 @@ class java_debug_event_handler_memory_resource final : public java_event_handler } }; -inline auto& prior_cuio_host_mr() +inline auto& prior_cudf_pinned_mr() { - static rmm::host_async_resource_ref _prior_cuio_host_mr = cudf::io::get_host_memory_resource(); - return _prior_cuio_host_mr; + static rmm::host_device_async_resource_ref _prior_cudf_pinned_mr = + cudf::get_pinned_memory_resource(); + return _prior_cudf_pinned_mr; } /** * This is a pinned fallback memory resource that will try to allocate `pool` - * and if that fails, attempt to allocate from the prior resource used by cuIO `prior_cuio_host_mr`. + * and if that fails, attempt to allocate from the prior resource used by cuDF + * `prior_cudf_pinned_mr`. 
* * We detect whether a pointer to free is inside of the pool by checking its address (see * constructor) @@ -433,7 +435,7 @@ class pinned_fallback_host_memory_resource { /** * @brief Allocates pinned host memory of size at least \p bytes bytes from either the - * _pool argument provided, or prior_cuio_host_mr. + * _pool argument provided, or prior_cudf_pinned_mr. * * @throws rmm::bad_alloc if the requested allocation could not be fulfilled due to any other * reason. @@ -450,7 +452,7 @@ class pinned_fallback_host_memory_resource { return _pool->allocate(bytes, alignment); } catch (const std::exception& unused) { // try to allocate using the underlying pinned resource - return prior_cuio_host_mr().allocate(bytes, alignment); + return prior_cudf_pinned_mr().allocate(bytes, alignment); } // we should not reached here return nullptr; @@ -459,7 +461,7 @@ class pinned_fallback_host_memory_resource { /** * @brief Deallocate memory pointed to by \p ptr of size \p bytes bytes. We attempt * to deallocate from _pool, if ptr is detected to be in the pool address range, - * otherwise we deallocate from `prior_cuio_host_mr`. + * otherwise we deallocate from `prior_cudf_pinned_mr`. * * @param ptr Pointer to be deallocated. * @param bytes Size of the allocation. @@ -472,7 +474,7 @@ class pinned_fallback_host_memory_resource { if (ptr >= pool_begin_ && ptr <= pool_end_) { _pool->deallocate(ptr, bytes, alignment); } else { - prior_cuio_host_mr().deallocate(ptr, bytes, alignment); + prior_cudf_pinned_mr().deallocate(ptr, bytes, alignment); } } @@ -1025,7 +1027,7 @@ JNIEXPORT jlong JNICALL Java_ai_rapids_cudf_Rmm_newPinnedPoolMemoryResource(JNIE CATCH_STD(env, 0) } -JNIEXPORT void JNICALL Java_ai_rapids_cudf_Rmm_setCuioPinnedPoolMemoryResource(JNIEnv* env, +JNIEXPORT void JNICALL Java_ai_rapids_cudf_Rmm_setCudfPinnedPoolMemoryResource(JNIEnv* env, jclass clazz, jlong pool_ptr) { @@ -1035,7 +1037,7 @@ JNIEXPORT void JNICALL Java_ai_rapids_cudf_Rmm_setCuioPinnedPoolMemoryResource(J // create a pinned fallback pool that will allocate pinned memory // if the regular pinned pool is exhausted pinned_fallback_mr.reset(new pinned_fallback_host_memory_resource(pool)); - prior_cuio_host_mr() = cudf::io::set_host_memory_resource(*pinned_fallback_mr); + prior_cudf_pinned_mr() = cudf::set_pinned_memory_resource(*pinned_fallback_mr); } CATCH_STD(env, ) } @@ -1047,8 +1049,8 @@ JNIEXPORT void JNICALL Java_ai_rapids_cudf_Rmm_releasePinnedPoolMemoryResource(J try { cudf::jni::auto_set_device(env); // set the cuio host memory resource to what it was before, or the same - // if we didn't overwrite it with setCuioPinnedPoolMemoryResource - cudf::io::set_host_memory_resource(prior_cuio_host_mr()); + // if we didn't overwrite it with setCudfPinnedPoolMemoryResource + cudf::set_pinned_memory_resource(prior_cudf_pinned_mr()); pinned_fallback_mr.reset(); delete reinterpret_cast(pool_ptr); } @@ -1088,7 +1090,7 @@ JNIEXPORT jlong JNICALL Java_ai_rapids_cudf_Rmm_allocFromFallbackPinnedPool(JNIE jlong size) { cudf::jni::auto_set_device(env); - void* ret = cudf::io::get_host_memory_resource().allocate(size); + void* ret = cudf::get_pinned_memory_resource().allocate(size); return reinterpret_cast(ret); } @@ -1101,7 +1103,7 @@ JNIEXPORT void JNICALL Java_ai_rapids_cudf_Rmm_freeFromFallbackPinnedPool(JNIEnv try { cudf::jni::auto_set_device(env); void* cptr = reinterpret_cast(ptr); - cudf::io::get_host_memory_resource().deallocate(cptr, size); + cudf::get_pinned_memory_resource().deallocate(cptr, size); } CATCH_STD(env, ) } @@ -1112,7 +1114,7 
@@ JNIEXPORT jboolean JNICALL Java_ai_rapids_cudf_Rmm_configureDefaultCudfPinnedPoo { try { cudf::jni::auto_set_device(env); - return cudf::io::config_default_host_memory_resource(cudf::io::host_mr_options{size}); + return cudf::config_default_pinned_memory_resource(cudf::pinned_mr_options{size}); } CATCH_STD(env, false) } From 2b1029908af97b74304169631189dd57f382f072 Mon Sep 17 00:00:00 2001 From: Vyas Ramasubramani Date: Wed, 12 Jun 2024 01:14:31 -0700 Subject: [PATCH 5/9] Apply clang-tidy autofixes (#15894) This changeset is large, but it's not very substantial. It's all the automated fixes produced by clang-tidy using our script. The bulk of the changes are either adding `[[nodiscard]]` to many functions or changing const ref args to pass by value and then move in cases where the parameter is only used to set a value. There are also some places where clang-tidy preferred either more or less namespacing of objects depending on the current namespace. The goal is to enable clang-tidy in CI, which we made progress towards in #9860 but stalled in #10064. This PR contains the first set of changes that will be required for such a check to pass. I've marked this PR as breaking because some of the functions now marked as `[[nodiscard]]` are public APIs, so if consumers were ignoring the return values they will now see warnings, and if they are compiling with warnings as errors then the builds will break. Contributes to #584 Authors: - Vyas Ramasubramani (https://github.com/vyasr) Approvers: - Bradley Dice (https://github.com/bdice) - Nghia Truong (https://github.com/ttnghia) URL: https://github.com/rapidsai/cudf/pull/15894 --- .pre-commit-config.yaml | 8 + cpp/include/cudf/ast/expressions.hpp | 7 +- .../cudf/column/column_device_view.cuh | 10 +- .../cudf/detail/aggregation/aggregation.hpp | 27 +- cpp/include/cudf/detail/contiguous_split.hpp | 2 +- .../cudf/detail/normalizing_iterator.cuh | 8 +- cpp/include/cudf/detail/structs/utilities.hpp | 24 +- .../cudf/detail/utilities/host_vector.hpp | 4 +- .../cudf/detail/utilities/stream_pool.hpp | 2 +- cpp/include/cudf/fixed_point/fixed_point.hpp | 6 +- cpp/include/cudf/interop.hpp | 4 +- cpp/include/cudf/interop/detail/arrow.hpp | 7 +- cpp/include/cudf/io/arrow_io_source.hpp | 8 +- cpp/include/cudf/io/csv.hpp | 22 +- cpp/include/cudf/io/detail/parquet.hpp | 2 +- cpp/include/cudf/io/json.hpp | 42 +- cpp/include/cudf/io/orc.hpp | 26 +- cpp/include/cudf/io/parquet.hpp | 6 +- cpp/include/cudf/io/types.hpp | 5 +- cpp/include/cudf/join.hpp | 33 +- cpp/include/cudf/scalar/scalar.hpp | 19 +- .../cudf/strings/regex/regex_program.hpp | 14 +- cpp/include/cudf/strings/string_view.cuh | 8 +- cpp/include/cudf/table/table.hpp | 2 +- cpp/include/cudf/table/table_view.hpp | 4 +- cpp/include/cudf/utilities/error.hpp | 8 +- cpp/include/cudf/utilities/span.hpp | 24 +- cpp/include/cudf/utilities/thread_pool.hpp | 6 +- cpp/include/cudf/wrappers/dictionary.hpp | 2 +- cpp/include/cudf/wrappers/durations.hpp | 16 +- cpp/include/cudf/wrappers/timestamps.hpp | 16 +- cpp/include/cudf_test/base_fixture.hpp | 2 +- cpp/include/cudf_test/column_wrapper.hpp | 15 +- .../stream_checking_resource_adaptor.hpp | 2 +- cpp/src/binaryop/binaryop.cpp | 2 +- cpp/src/binaryop/compiled/operation.cuh | 8 +- cpp/src/binaryop/compiled/util.cpp | 4 +- cpp/src/copying/pack.cpp | 2 +- cpp/src/datetime/timezone.cpp | 2 +- cpp/src/interop/arrow_utilities.cpp | 2 +- cpp/src/interop/arrow_utilities.hpp | 2 +- cpp/src/interop/detail/arrow_allocator.cpp | 2 +-
cpp/src/interop/from_arrow_host.cu | 4 +- cpp/src/io/avro/avro.cpp | 6 +- cpp/src/io/comp/uncomp.cpp | 8 +- cpp/src/io/functions.cpp | 8 +- cpp/src/io/json/nested_json_gpu.cu | 8 +- cpp/src/io/json/read_json.cu | 2 +- cpp/src/io/orc/orc.hpp | 2 +- cpp/src/io/orc/orc_field_writer.hpp | 6 +- cpp/src/io/orc/reader_impl_chunking.cu | 2 +- cpp/src/io/orc/reader_impl_decode.cu | 2 +- .../io/parquet/compact_protocol_reader.cpp | 2 +- .../io/parquet/compact_protocol_writer.hpp | 4 +- cpp/src/io/parquet/ipc/Schema_generated.h | 416 +++++++++--------- cpp/src/io/parquet/page_string_decode.cu | 10 +- cpp/src/io/parquet/page_string_utils.cuh | 4 +- cpp/src/io/parquet/parquet.hpp | 30 +- cpp/src/io/parquet/parquet_gpu.hpp | 33 +- cpp/src/io/parquet/predicate_pushdown.cpp | 4 +- cpp/src/io/parquet/reader_impl_chunking.cu | 2 +- cpp/src/io/parquet/reader_impl_helpers.cpp | 26 +- cpp/src/io/parquet/reader_impl_preprocess.cu | 8 +- cpp/src/io/statistics/byte_array_view.cuh | 6 +- cpp/src/io/utilities/arrow_io_source.cpp | 6 +- cpp/src/io/utilities/column_buffer.cpp | 20 +- cpp/src/io/utilities/column_buffer.hpp | 21 +- cpp/src/io/utilities/data_casting.cu | 4 +- cpp/src/io/utilities/data_sink.cpp | 8 +- cpp/src/io/utilities/datasource.cpp | 2 +- cpp/src/io/utilities/file_io_utilities.cpp | 8 +- cpp/src/io/utilities/hostdevice_span.hpp | 2 +- cpp/src/io/utilities/hostdevice_vector.hpp | 2 +- cpp/src/io/utilities/output_builder.cuh | 4 +- cpp/src/io/utilities/string_parsing.hpp | 6 +- cpp/src/io/utilities/type_inference.cu | 2 +- cpp/src/jit/cache.cpp | 4 +- cpp/src/jit/parser.cpp | 17 +- cpp/src/jit/parser.hpp | 8 +- cpp/src/reductions/reductions.cpp | 6 +- .../detail/optimized_unbounded_window.cpp | 2 +- cpp/src/strings/regex/regcomp.cpp | 26 +- cpp/src/strings/regex/regex.cuh | 45 +- cpp/src/strings/regex/regex.inl | 7 +- cpp/src/strings/regex/regexec.cpp | 14 +- cpp/src/transform/transform.cpp | 2 +- cpp/src/utilities/stream_pool.cpp | 4 +- .../binop-compiled-fixed_point-test.cpp | 8 +- cpp/tests/bitmask/is_element_valid_tests.cpp | 8 +- cpp/tests/column/column_view_shallow_test.cpp | 3 +- cpp/tests/copying/concatenate_tests.cpp | 79 ++-- cpp/tests/copying/copy_tests.cpp | 5 +- cpp/tests/copying/gather_str_tests.cpp | 27 +- cpp/tests/copying/gather_struct_tests.cpp | 4 +- cpp/tests/copying/get_value_tests.cpp | 12 +- cpp/tests/copying/pack_tests.cpp | 86 ++-- cpp/tests/copying/scatter_list_tests.cpp | 11 +- cpp/tests/copying/scatter_struct_tests.cpp | 9 +- cpp/tests/copying/scatter_tests.cpp | 47 +- cpp/tests/copying/shift_tests.cpp | 57 +-- cpp/tests/copying/slice_tests.cpp | 69 ++- cpp/tests/copying/split_tests.cpp | 123 ++++-- cpp/tests/dictionary/decode_test.cpp | 5 +- cpp/tests/dictionary/encode_test.cpp | 5 +- cpp/tests/dictionary/factories_test.cpp | 6 +- cpp/tests/dictionary/fill_test.cpp | 10 +- cpp/tests/dictionary/gather_test.cpp | 5 +- cpp/tests/dictionary/remove_keys_test.cpp | 14 +- cpp/tests/dictionary/scatter_test.cpp | 19 +- cpp/tests/dictionary/search_test.cpp | 6 +- cpp/tests/dictionary/set_keys_test.cpp | 12 +- cpp/tests/dictionary/slice_test.cpp | 15 +- cpp/tests/groupby/argmax_tests.cpp | 5 +- cpp/tests/groupby/argmin_tests.cpp | 7 +- cpp/tests/groupby/collect_set_tests.cpp | 4 +- cpp/tests/groupby/correlation_tests.cpp | 8 +- cpp/tests/groupby/count_scan_tests.cpp | 4 +- cpp/tests/groupby/count_tests.cpp | 7 +- cpp/tests/groupby/covariance_tests.cpp | 8 +- cpp/tests/groupby/groupby_test_util.cpp | 4 +- cpp/tests/groupby/groups_tests.cpp | 5 +- cpp/tests/groupby/keys_tests.cpp | 8 
+- cpp/tests/groupby/m2_tests.cpp | 4 +- cpp/tests/groupby/max_scan_tests.cpp | 4 +- cpp/tests/groupby/max_tests.cpp | 25 +- cpp/tests/groupby/mean_tests.cpp | 7 +- cpp/tests/groupby/median_tests.cpp | 7 +- cpp/tests/groupby/merge_lists_tests.cpp | 4 +- cpp/tests/groupby/merge_m2_tests.cpp | 6 +- cpp/tests/groupby/merge_sets_tests.cpp | 4 +- cpp/tests/groupby/min_scan_tests.cpp | 4 +- cpp/tests/groupby/min_tests.cpp | 25 +- cpp/tests/groupby/nth_element_tests.cpp | 40 +- cpp/tests/groupby/nunique_tests.cpp | 19 +- cpp/tests/groupby/product_scan_tests.cpp | 2 +- cpp/tests/groupby/product_tests.cpp | 4 +- cpp/tests/groupby/quantile_tests.cpp | 7 +- cpp/tests/groupby/rank_scan_tests.cpp | 12 +- cpp/tests/groupby/replace_nulls_tests.cpp | 10 +- cpp/tests/groupby/shift_tests.cpp | 23 +- cpp/tests/groupby/std_tests.cpp | 12 +- cpp/tests/groupby/sum_of_squares_tests.cpp | 7 +- cpp/tests/groupby/sum_scan_tests.cpp | 4 +- cpp/tests/groupby/sum_tests.cpp | 5 +- cpp/tests/groupby/var_tests.cpp | 12 +- cpp/tests/hashing/md5_test.cpp | 32 +- cpp/tests/hashing/murmurhash3_x86_32_test.cpp | 106 ++++- cpp/tests/hashing/sha1_test.cpp | 8 +- cpp/tests/hashing/sha224_test.cpp | 8 +- cpp/tests/hashing/sha256_test.cpp | 8 +- cpp/tests/hashing/sha384_test.cpp | 8 +- cpp/tests/hashing/sha512_test.cpp | 8 +- cpp/tests/interop/dlpack_test.cpp | 2 +- cpp/tests/interop/from_arrow_device_test.cpp | 14 +- cpp/tests/interop/from_arrow_host_test.cpp | 6 +- cpp/tests/interop/from_arrow_test.cpp | 43 +- cpp/tests/interop/nanoarrow_utils.hpp | 14 +- cpp/tests/interop/to_arrow_device_test.cpp | 26 +- cpp/tests/io/csv_test.cpp | 4 +- cpp/tests/io/json_chunked_reader.cpp | 4 +- .../io/json_quote_normalization_test.cpp | 2 +- cpp/tests/io/json_test.cpp | 4 +- cpp/tests/io/json_tree.cpp | 8 +- cpp/tests/io/orc_chunked_reader_test.cu | 4 +- cpp/tests/io/orc_test.cpp | 8 +- cpp/tests/io/parquet_chunked_writer_test.cpp | 36 +- cpp/tests/io/parquet_reader_test.cpp | 54 ++- cpp/tests/io/parquet_v2_test.cpp | 79 ++-- cpp/tests/io/parquet_writer_test.cpp | 20 +- cpp/tests/join/distinct_join_tests.cpp | 76 ++-- cpp/tests/join/join_tests.cpp | 342 +++++++------- cpp/tests/join/semi_anti_join_tests.cpp | 43 +- cpp/tests/json/json_tests.cpp | 6 +- .../large_strings/large_strings_fixture.cpp | 9 +- cpp/tests/lists/contains_tests.cpp | 2 +- cpp/tests/lists/count_elements_tests.cpp | 10 +- cpp/tests/lists/explode_tests.cpp | 68 +-- cpp/tests/lists/sort_lists_tests.cpp | 8 +- cpp/tests/merge/merge_dictionary_test.cpp | 18 +- cpp/tests/merge/merge_string_test.cpp | 63 ++- .../partitioning/hash_partition_test.cpp | 2 +- cpp/tests/partitioning/round_robin_test.cpp | 73 +-- .../quantiles/percentile_approx_test.cpp | 11 +- cpp/tests/quantiles/quantile_test.cpp | 2 +- cpp/tests/quantiles/quantiles_test.cpp | 12 +- cpp/tests/reductions/collect_ops_tests.cpp | 47 +- cpp/tests/reductions/list_rank_test.cpp | 85 +++- cpp/tests/reductions/reduction_tests.cpp | 131 +++--- cpp/tests/reductions/scan_tests.cpp | 15 +- .../reductions/segmented_reduction_tests.cpp | 69 +-- cpp/tests/reshape/byte_cast_tests.cpp | 16 +- cpp/tests/rolling/collect_ops_test.cpp | 30 +- cpp/tests/rolling/grouped_rolling_test.cpp | 110 +++-- .../rolling/range_rolling_window_test.cpp | 24 +- cpp/tests/round/round_tests.cpp | 5 +- cpp/tests/scalar/scalar_test.cpp | 4 +- cpp/tests/search/search_dictionary_test.cpp | 30 +- cpp/tests/sort/is_sorted_tests.cpp | 8 +- cpp/tests/sort/rank_test.cpp | 91 ++-- cpp/tests/sort/stable_sort_tests.cpp | 8 +- .../distinct_count_tests.cpp | 37 +- 
.../stream_compaction/distinct_tests.cpp | 4 +- .../stream_compaction/drop_nans_tests.cpp | 38 +- .../stream_compaction/drop_nulls_tests.cpp | 67 +-- .../stable_distinct_tests.cpp | 4 +- cpp/tests/stream_compaction/unique_tests.cpp | 72 +-- cpp/tests/streams/interop_test.cpp | 1 + cpp/tests/streams/io/orc_test.cpp | 4 +- cpp/tests/streams/io/parquet_test.cpp | 4 +- cpp/tests/streams/lists_test.cpp | 5 +- cpp/tests/streams/reduction_test.cpp | 16 +- cpp/tests/streams/replace_test.cpp | 9 +- cpp/tests/streams/strings/filter_test.cpp | 4 +- cpp/tests/strings/case_tests.cpp | 50 ++- cpp/tests/strings/chars_types_tests.cpp | 51 ++- .../strings/combine/concatenate_tests.cpp | 11 +- .../strings/combine/join_strings_tests.cpp | 6 +- cpp/tests/strings/contains_tests.cpp | 16 +- cpp/tests/strings/datetime_tests.cpp | 6 +- cpp/tests/strings/extract_tests.cpp | 23 +- cpp/tests/strings/fill_tests.cpp | 6 +- cpp/tests/strings/find_multiple_tests.cpp | 2 +- cpp/tests/strings/find_tests.cpp | 102 +++-- cpp/tests/strings/findall_tests.cpp | 6 +- cpp/tests/strings/fixed_point_tests.cpp | 6 +- cpp/tests/strings/integers_tests.cpp | 24 +- cpp/tests/strings/ipv4_tests.cpp | 7 +- cpp/tests/strings/like_tests.cpp | 7 +- cpp/tests/strings/pad_tests.cpp | 5 +- cpp/tests/strings/replace_regex_tests.cpp | 6 +- cpp/tests/strings/replace_tests.cpp | 12 +- cpp/tests/strings/reverse_tests.cpp | 18 +- cpp/tests/strings/slice_tests.cpp | 8 +- cpp/tests/strings/split_tests.cpp | 42 +- cpp/tests/strings/strip_tests.cpp | 5 +- cpp/tests/strings/translate_tests.cpp | 4 +- cpp/tests/structs/structs_column_tests.cpp | 2 +- cpp/tests/structs/utilities_tests.cpp | 4 +- cpp/tests/table/row_operators_tests.cpp | 8 +- cpp/tests/text/bpe_tests.cpp | 2 +- cpp/tests/text/jaccard_tests.cpp | 15 +- cpp/tests/text/normalize_tests.cpp | 6 +- cpp/tests/text/replace_tests.cpp | 2 +- cpp/tests/text/stemmer_tests.cpp | 2 +- cpp/tests/text/subword_tests.cpp | 2 +- cpp/tests/text/tokenize_tests.cpp | 6 +- cpp/tests/transform/nans_to_null_test.cpp | 4 +- cpp/tests/transform/one_hot_encode_tests.cpp | 9 +- cpp/tests/unary/cast_tests.cpp | 15 +- cpp/tests/unary/math_ops_test.cpp | 3 +- cpp/tests/utilities/column_utilities.cu | 2 +- cpp/tests/utilities/identify_stream_usage.cpp | 2 +- cpp/tests/utilities_tests/logger_tests.cpp | 4 +- cpp/tests/utilities_tests/type_list_tests.cpp | 54 +-- java/src/main/native/include/jni_utils.hpp | 26 +- java/src/main/native/src/ColumnVectorJni.cpp | 14 +- java/src/main/native/src/ColumnViewJni.cpp | 44 +- java/src/main/native/src/RmmJni.cpp | 8 +- java/src/main/native/src/ScalarJni.cpp | 4 +- java/src/main/native/src/TableJni.cpp | 28 +- .../main/native/src/jni_writer_data_sink.hpp | 4 +- 261 files changed, 2911 insertions(+), 2151 deletions(-) diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml index 4cdcac88091..cc08b832e69 100644 --- a/.pre-commit-config.yaml +++ b/.pre-commit-config.yaml @@ -56,12 +56,20 @@ repos: - id: clang-format types_or: [c, c++, cuda] args: ["-fallback-style=none", "-style=file", "-i"] + exclude: | + (?x)^( + ^cpp/src/io/parquet/ipc/Schema_generated.h| + ^cpp/src/io/parquet/ipc/Message_generated.h| + ^cpp/include/cudf_test/cxxopts.hpp| + ) - repo: https://github.com/sirosen/texthooks rev: 0.6.6 hooks: - id: fix-smartquotes exclude: | (?x)^( + ^cpp/src/io/parquet/ipc/Schema_generated.h| + ^cpp/src/io/parquet/ipc/Message_generated.h| ^cpp/include/cudf_test/cxxopts.hpp| ^python/cudf/cudf/tests/data/subword_tokenizer_data/.*| 
^python/cudf/cudf/tests/text/test_text_methods.py diff --git a/cpp/include/cudf/ast/expressions.hpp b/cpp/include/cudf/ast/expressions.hpp index 26916e49012..918271e3e4f 100644 --- a/cpp/include/cudf/ast/expressions.hpp +++ b/cpp/include/cudf/ast/expressions.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2020-2023, NVIDIA CORPORATION. + * Copyright (c) 2020-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -478,7 +478,10 @@ class operation : public expression { * * @return Vector of operands */ - std::vector> get_operands() const { return operands; } + [[nodiscard]] std::vector> get_operands() const + { + return operands; + } /** * @copydoc expression::accept diff --git a/cpp/include/cudf/column/column_device_view.cuh b/cpp/include/cudf/column/column_device_view.cuh index 19722d127cb..787e9c2c479 100644 --- a/cpp/include/cudf/column/column_device_view.cuh +++ b/cpp/include/cudf/column/column_device_view.cuh @@ -442,7 +442,7 @@ class alignas(16) column_device_view : public detail::column_device_view_base { * @return string_view instance representing this element at this index */ template )> - __device__ T element(size_type element_index) const noexcept + __device__ [[nodiscard]] T element(size_type element_index) const noexcept { size_type index = element_index + offset(); // account for this view's _offset char const* d_strings = static_cast(_data); @@ -501,7 +501,7 @@ class alignas(16) column_device_view : public detail::column_device_view_base { * @return dictionary32 instance representing this element at this index */ template )> - __device__ T element(size_type element_index) const noexcept + __device__ [[nodiscard]] T element(size_type element_index) const noexcept { size_type index = element_index + offset(); // account for this view's _offset auto const indices = d_children[0]; @@ -519,7 +519,7 @@ class alignas(16) column_device_view : public detail::column_device_view_base { * @return numeric::fixed_point representing the element at this index */ template ())> - __device__ T element(size_type element_index) const noexcept + __device__ [[nodiscard]] T element(size_type element_index) const noexcept { using namespace numeric; using rep = typename T::rep; @@ -858,7 +858,7 @@ class alignas(16) column_device_view : public detail::column_device_view_base { */ [[nodiscard]] __device__ device_span children() const noexcept { - return device_span(d_children, _num_children); + return {d_children, static_cast(_num_children)}; } /** @@ -1032,7 +1032,7 @@ class alignas(16) mutable_column_device_view : public detail::column_device_view * @return Reference to the element at the specified index */ template ())> - __device__ T& element(size_type element_index) const noexcept + __device__ [[nodiscard]] T& element(size_type element_index) const noexcept { return data()[element_index]; } diff --git a/cpp/include/cudf/detail/aggregation/aggregation.hpp b/cpp/include/cudf/detail/aggregation/aggregation.hpp index 87c0f8ec7f1..edee83783b8 100644 --- a/cpp/include/cudf/detail/aggregation/aggregation.hpp +++ b/cpp/include/cudf/detail/aggregation/aggregation.hpp @@ -24,6 +24,7 @@ #include #include +#include namespace cudf { namespace detail { @@ -510,7 +511,7 @@ class quantile_aggregation final : public groupby_aggregation, public reduce_agg void finalize(aggregation_finalizer& finalizer) const override { finalizer.visit(*this); } private: - size_t hash_impl() const + [[nodiscard]] size_t hash_impl() 
const { return std::hash{}(static_cast(_interpolation)) ^ std::accumulate( @@ -596,7 +597,10 @@ class nunique_aggregation final : public groupby_aggregation, void finalize(aggregation_finalizer& finalizer) const override { finalizer.visit(*this); } private: - size_t hash_impl() const { return std::hash{}(static_cast(_null_handling)); } + [[nodiscard]] size_t hash_impl() const + { + return std::hash{}(static_cast(_null_handling)); + } }; /** @@ -638,7 +642,7 @@ class nth_element_aggregation final : public groupby_aggregation, void finalize(aggregation_finalizer& finalizer) const override { finalizer.visit(*this); } private: - size_t hash_impl() const + [[nodiscard]] size_t hash_impl() const { return std::hash{}(_n) ^ std::hash{}(static_cast(_null_handling)); } @@ -763,7 +767,10 @@ class collect_list_aggregation final : public rolling_aggregation, void finalize(aggregation_finalizer& finalizer) const override { finalizer.visit(*this); } private: - size_t hash_impl() const { return std::hash{}(static_cast(_null_handling)); } + [[nodiscard]] size_t hash_impl() const + { + return std::hash{}(static_cast(_null_handling)); + } }; /** @@ -813,7 +820,7 @@ class collect_set_aggregation final : public rolling_aggregation, void finalize(aggregation_finalizer& finalizer) const override { finalizer.visit(*this); } protected: - size_t hash_impl() const + [[nodiscard]] size_t hash_impl() const { return std::hash{}(static_cast(_null_handling) ^ static_cast(_nulls_equal) ^ static_cast(_nans_equal)); @@ -866,10 +873,10 @@ class lead_lag_aggregation final : public rolling_aggregation { class udf_aggregation final : public rolling_aggregation { public: udf_aggregation(aggregation::Kind type, - std::string const& user_defined_aggregator, + std::string user_defined_aggregator, data_type output_type) : aggregation{type}, - _source{user_defined_aggregator}, + _source{std::move(user_defined_aggregator)}, _operator_name{(type == aggregation::PTX) ? "rolling_udf_ptx" : "rolling_udf_cuda"}, _function_name{"rolling_udf"}, _output_type{output_type} @@ -973,7 +980,7 @@ class merge_sets_aggregation final : public groupby_aggregation, public reduce_a void finalize(aggregation_finalizer& finalizer) const override { finalizer.visit(*this); } protected: - size_t hash_impl() const + [[nodiscard]] size_t hash_impl() const { return std::hash{}(static_cast(_nulls_equal) ^ static_cast(_nans_equal)); } @@ -1046,7 +1053,7 @@ class covariance_aggregation final : public groupby_aggregation { void finalize(aggregation_finalizer& finalizer) const override { finalizer.visit(*this); } protected: - size_t hash_impl() const + [[nodiscard]] size_t hash_impl() const { return std::hash{}(_min_periods) ^ std::hash{}(_ddof); } @@ -1088,7 +1095,7 @@ class correlation_aggregation final : public groupby_aggregation { void finalize(aggregation_finalizer& finalizer) const override { finalizer.visit(*this); } protected: - size_t hash_impl() const + [[nodiscard]] size_t hash_impl() const { return std::hash{}(static_cast(_type)) ^ std::hash{}(_min_periods); } diff --git a/cpp/include/cudf/detail/contiguous_split.hpp b/cpp/include/cudf/detail/contiguous_split.hpp index de00b61cdca..1467ed1aa67 100644 --- a/cpp/include/cudf/detail/contiguous_split.hpp +++ b/cpp/include/cudf/detail/contiguous_split.hpp @@ -104,7 +104,7 @@ class metadata_builder { * * @returns A vector containing the serialized column metadata */ - std::vector build() const; + [[nodiscard]] std::vector build() const; /** * @brief Clear the internal buffer containing all added metadata. 
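A minimal, standalone sketch (not part of the patch) of the `[[nodiscard]]` pattern this changeset applies to accessors such as `metadata_builder::build()` above; the `packed_sizes` class and every name in it are hypothetical illustrations, not cudf APIs.

// Sketch only: shows why ignoring a [[nodiscard]] result now surfaces as a
// compiler diagnostic (and as a build failure when warnings are errors).
#include <cstddef>
#include <utility>
#include <vector>

class packed_sizes {
 public:
  explicit packed_sizes(std::vector<std::size_t> sizes) : sizes_{std::move(sizes)} {}

  // With [[nodiscard]], silently dropping the computed total triggers a
  // -Wunused-result style warning instead of being lost without notice.
  [[nodiscard]] std::size_t total() const
  {
    std::size_t sum = 0;
    for (auto s : sizes_) { sum += s; }
    return sum;
  }

 private:
  std::vector<std::size_t> sizes_;
};

int main()
{
  packed_sizes sizes{{8, 16, 32}};
  // sizes.total();                  // would warn: ignoring a [[nodiscard]] result
  auto const total = sizes.total();  // fine: the result is consumed
  return total == 56 ? 0 : 1;
}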
diff --git a/cpp/include/cudf/detail/normalizing_iterator.cuh b/cpp/include/cudf/detail/normalizing_iterator.cuh index 32df13104e0..308fd188b09 100644 --- a/cpp/include/cudf/detail/normalizing_iterator.cuh +++ b/cpp/include/cudf/detail/normalizing_iterator.cuh @@ -51,7 +51,7 @@ struct alignas(16) base_normalator { */ CUDF_HOST_DEVICE inline Derived& operator++() { - Derived& derived = static_cast(*this); + auto& derived = static_cast(*this); derived.p_ += width_; return derived; } @@ -71,7 +71,7 @@ struct alignas(16) base_normalator { */ CUDF_HOST_DEVICE inline Derived& operator--() { - Derived& derived = static_cast(*this); + auto& derived = static_cast(*this); derived.p_ -= width_; return derived; } @@ -91,7 +91,7 @@ struct alignas(16) base_normalator { */ CUDF_HOST_DEVICE inline Derived& operator+=(difference_type offset) { - Derived& derived = static_cast(*this); + auto& derived = static_cast(*this); derived.p_ += offset * width_; return derived; } @@ -121,7 +121,7 @@ struct alignas(16) base_normalator { */ CUDF_HOST_DEVICE inline Derived& operator-=(difference_type offset) { - Derived& derived = static_cast(*this); + auto& derived = static_cast(*this); derived.p_ -= offset * width_; return derived; } diff --git a/cpp/include/cudf/detail/structs/utilities.hpp b/cpp/include/cudf/detail/structs/utilities.hpp index e736514ac29..beedc009c84 100644 --- a/cpp/include/cudf/detail/structs/utilities.hpp +++ b/cpp/include/cudf/detail/structs/utilities.hpp @@ -25,6 +25,8 @@ #include #include +#include + namespace cudf::structs::detail { enum class column_nullability { @@ -112,12 +114,12 @@ class flattened_table { * @param columns_ Newly allocated columns to back the table_view * @param nullable_data_ Newly generated temporary data that needs to be kept alive */ - flattened_table(table_view const& flattened_columns_, + flattened_table(table_view flattened_columns_, std::vector const& orders_, std::vector const& null_orders_, std::vector>&& columns_, temporary_nullable_data&& nullable_data_) - : _flattened_columns{flattened_columns_}, + : _flattened_columns{std::move(flattened_columns_)}, _orders{orders_}, _null_orders{null_orders_}, _columns{std::move(columns_)}, @@ -170,11 +172,11 @@ class flattened_table { * orders, flattened null precedence, alongside the supporting columns and device_buffers * for the flattened table. */ -[[nodiscard]] std::unique_ptr flatten_nested_columns( +[[nodiscard]] std::unique_ptr flatten_nested_columns( table_view const& input, - std::vector const& column_order, - std::vector const& null_precedence, - column_nullability nullability, + std::vector const& column_order, + std::vector const& null_precedence, + cudf::structs::detail::column_nullability nullability, rmm::cuda_stream_view stream, rmm::device_async_resource_ref mr); @@ -194,11 +196,11 @@ class flattened_table { * @param mr Device memory resource used to allocate new device memory * @return A new column with potentially new null mask */ -[[nodiscard]] std::unique_ptr superimpose_nulls(bitmask_type const* null_mask, - size_type null_count, - std::unique_ptr&& input, - rmm::cuda_stream_view stream, - rmm::device_async_resource_ref mr); +[[nodiscard]] std::unique_ptr superimpose_nulls(bitmask_type const* null_mask, + cudf::size_type null_count, + std::unique_ptr&& input, + rmm::cuda_stream_view stream, + rmm::device_async_resource_ref mr); /** * @brief Push down nulls from the given input column into its children columns, using bitwise AND. 
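A similarly hypothetical sketch (not part of the patch) of the companion pass-by-value-then-move change, as applied above to `udf_aggregation` and `flattened_table`; `named_buffer` and its members are made-up names used only to show the idiom.

// Sketch only: a sink parameter taken by value and moved into the member.
#include <cstddef>
#include <string>
#include <utility>
#include <vector>

class named_buffer {
 public:
  // Taking the arguments by value lets an lvalue caller pay one copy plus a
  // cheap move, and lets an rvalue caller avoid the copy entirely, whereas a
  // `const&` parameter always forces a copy inside the constructor.
  named_buffer(std::string name, std::vector<char> data)
    : name_{std::move(name)}, data_{std::move(data)}
  {
  }

  [[nodiscard]] std::string const& name() const { return name_; }
  [[nodiscard]] std::size_t size() const { return data_.size(); }

 private:
  std::string name_;
  std::vector<char> data_;
};

int main()
{
  std::string name = "chunk0";
  named_buffer a{name, std::vector<char>(128)};      // lvalue: one copy, then a move
  named_buffer b{"chunk1", std::vector<char>(256)};  // rvalues: no extra copies
  return (a.size() + b.size() == 384 && b.name() == "chunk1") ? 0 : 1;
}

Callers that construct the argument inline, as in the second construction, avoid the extra copy the old `const&` signatures always incurred, which is why clang-tidy only rewrites parameters that are used solely to initialize a member.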
diff --git a/cpp/include/cudf/detail/utilities/host_vector.hpp b/cpp/include/cudf/detail/utilities/host_vector.hpp index 6a115177ab5..2d14d0306cd 100644 --- a/cpp/include/cudf/detail/utilities/host_vector.hpp +++ b/cpp/include/cudf/detail/utilities/host_vector.hpp @@ -82,7 +82,7 @@ class rmm_host_allocator { using size_type = std::size_t; ///< The type used for the size of the allocation using difference_type = std::ptrdiff_t; ///< The type of the distance between two pointers - typedef cuda::std::true_type propagate_on_container_move_assignment; + using propagate_on_container_move_assignment = cuda::std::true_type; /** * @brief converts a `rmm_host_allocator` to `rmm_host_allocator` @@ -147,7 +147,7 @@ class rmm_host_allocator { * @return The maximum number of objects that may be allocated * by a single call to \p allocate(). */ - constexpr inline size_type max_size() const + [[nodiscard]] constexpr inline size_type max_size() const { return (std::numeric_limits::max)() / sizeof(T); } diff --git a/cpp/include/cudf/detail/utilities/stream_pool.hpp b/cpp/include/cudf/detail/utilities/stream_pool.hpp index e19cc3ec2f7..64c1d4ae514 100644 --- a/cpp/include/cudf/detail/utilities/stream_pool.hpp +++ b/cpp/include/cudf/detail/utilities/stream_pool.hpp @@ -73,7 +73,7 @@ class cuda_stream_pool { * * @return the number of stream objects in the pool */ - virtual std::size_t get_stream_pool_size() const = 0; + [[nodiscard]] virtual std::size_t get_stream_pool_size() const = 0; }; /** diff --git a/cpp/include/cudf/fixed_point/fixed_point.hpp b/cpp/include/cudf/fixed_point/fixed_point.hpp index e39d75757e8..6c3c3b4da07 100644 --- a/cpp/include/cudf/fixed_point/fixed_point.hpp +++ b/cpp/include/cudf/fixed_point/fixed_point.hpp @@ -291,14 +291,14 @@ class fixed_point { * * @return The underlying value of the `fixed_point` number */ - CUDF_HOST_DEVICE inline rep value() const { return _value; } + CUDF_HOST_DEVICE [[nodiscard]] inline rep value() const { return _value; } /** * @brief Method that returns the scale of the `fixed_point` number * * @return The scale of the `fixed_point` number */ - CUDF_HOST_DEVICE inline scale_type scale() const { return _scale; } + CUDF_HOST_DEVICE [[nodiscard]] inline scale_type scale() const { return _scale; } /** * @brief Explicit conversion operator to `bool` @@ -573,7 +573,7 @@ class fixed_point { * @param scale The `scale` of the returned `fixed_point` number * @return `fixed_point` number with a new `scale` */ - CUDF_HOST_DEVICE inline fixed_point rescaled(scale_type scale) const + CUDF_HOST_DEVICE [[nodiscard]] inline fixed_point rescaled(scale_type scale) const { if (scale == _scale) { return *this; } Rep const value = detail::shift(_value, scale_type{scale - _scale}); diff --git a/cpp/include/cudf/interop.hpp b/cpp/include/cudf/interop.hpp index f3ff0009d5c..56ec62fa6e1 100644 --- a/cpp/include/cudf/interop.hpp +++ b/cpp/include/cudf/interop.hpp @@ -40,6 +40,8 @@ #include +#include + struct DLManagedTensor; struct ArrowDeviceArray; @@ -121,7 +123,7 @@ struct column_metadata { * * @param _name Name of the column */ - column_metadata(std::string const& _name) : name(_name) {} + column_metadata(std::string _name) : name(std::move(_name)) {} column_metadata() = default; }; diff --git a/cpp/include/cudf/interop/detail/arrow.hpp b/cpp/include/cudf/interop/detail/arrow.hpp index 8043ecf5422..906d48f636b 100644 --- a/cpp/include/cudf/interop/detail/arrow.hpp +++ b/cpp/include/cudf/interop/detail/arrow.hpp @@ -24,8 +24,12 @@ #define ARROW_C_DEVICE_DATA_INTERFACE // Device 
type for the allocated memory -typedef int32_t ArrowDeviceType; +using ArrowDeviceType = int32_t; +// The Arrow spec specifies using macros rather than enums here to avoid being +// susceptible to changes in the underlying type chosen by the compiler, but +// clang-tidy doesn't like this. +// NOLINTBEGIN // CPU device, same as using ArrowArray directly #define ARROW_DEVICE_CPU 1 // CUDA GPU Device @@ -34,6 +38,7 @@ typedef int32_t ArrowDeviceType; #define ARROW_DEVICE_CUDA_HOST 3 // CUDA managed/unified memory allocated by cudaMallocManaged #define ARROW_DEVICE_CUDA_MANAGED 13 +// NOLINTEND struct ArrowDeviceArray { struct ArrowArray array; diff --git a/cpp/include/cudf/io/arrow_io_source.hpp b/cpp/include/cudf/io/arrow_io_source.hpp index 5f79f05c5a1..d7a48c34e12 100644 --- a/cpp/include/cudf/io/arrow_io_source.hpp +++ b/cpp/include/cudf/io/arrow_io_source.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2023, NVIDIA CORPORATION. + * Copyright (c) 2023-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -23,6 +23,7 @@ #include #include +#include namespace cudf::io { /** @@ -49,7 +50,10 @@ class arrow_io_source : public datasource { * * @param file The `arrow` object from which the data is read */ - explicit arrow_io_source(std::shared_ptr file) : arrow_file(file) {} + explicit arrow_io_source(std::shared_ptr file) + : arrow_file(std::move(file)) + { + } /** * @brief Returns a buffer with a subset of data from the `arrow` source. diff --git a/cpp/include/cudf/io/csv.hpp b/cpp/include/cudf/io/csv.hpp index a20f75cecd7..68bb7fba00e 100644 --- a/cpp/include/cudf/io/csv.hpp +++ b/cpp/include/cudf/io/csv.hpp @@ -27,6 +27,7 @@ #include #include #include +#include #include #include @@ -431,7 +432,8 @@ class csv_reader_options { * * @return Per-column types */ - std::variant, std::map> const& get_dtypes() const + [[nodiscard]] std::variant, std::map> const& + get_dtypes() const { return _dtypes; } @@ -441,49 +443,49 @@ class csv_reader_options { * * @return Additional values to recognize as boolean true values */ - std::vector const& get_true_values() const { return _true_values; } + [[nodiscard]] std::vector const& get_true_values() const { return _true_values; } /** * @brief Returns additional values to recognize as boolean false values. * * @return Additional values to recognize as boolean false values */ - std::vector const& get_false_values() const { return _false_values; } + [[nodiscard]] std::vector const& get_false_values() const { return _false_values; } /** * @brief Returns additional values to recognize as null values. * * @return Additional values to recognize as null values */ - std::vector const& get_na_values() const { return _na_values; } + [[nodiscard]] std::vector const& get_na_values() const { return _na_values; } /** * @brief Whether to keep the built-in default NA values. * * @return `true` if the built-in default NA values are kept */ - bool is_enabled_keep_default_na() const { return _keep_default_na; } + [[nodiscard]] bool is_enabled_keep_default_na() const { return _keep_default_na; } /** * @brief Whether to disable null filter. * * @return `true` if null filter is enabled */ - bool is_enabled_na_filter() const { return _na_filter; } + [[nodiscard]] bool is_enabled_na_filter() const { return _na_filter; } /** * @brief Whether to parse dates as DD/MM versus MM/DD. 
* * @return True if dates are parsed as DD/MM, false if MM/DD */ - bool is_enabled_dayfirst() const { return _dayfirst; } + [[nodiscard]] bool is_enabled_dayfirst() const { return _dayfirst; } /** * @brief Returns timestamp_type to which all timestamp columns will be cast. * * @return timestamp_type to which all timestamp columns will be cast */ - data_type get_timestamp_type() const { return _timestamp_type; } + [[nodiscard]] data_type get_timestamp_type() const { return _timestamp_type; } /** * @brief Sets compression format of the source. @@ -1399,8 +1401,8 @@ class csv_writer_options { * @param sink The sink used for writer output * @param table Table to be written to output */ - explicit csv_writer_options(sink_info const& sink, table_view const& table) - : _sink(sink), _table(table), _rows_per_chunk(table.num_rows()) + explicit csv_writer_options(sink_info sink, table_view const& table) + : _sink(std::move(sink)), _table(table), _rows_per_chunk(table.num_rows()) { } diff --git a/cpp/include/cudf/io/detail/parquet.hpp b/cpp/include/cudf/io/detail/parquet.hpp index 978216d971e..21c870cb75e 100644 --- a/cpp/include/cudf/io/detail/parquet.hpp +++ b/cpp/include/cudf/io/detail/parquet.hpp @@ -160,7 +160,7 @@ class chunked_reader : private reader { * destructor needs to be defined in a separate source file which can access to that object's * declaration. */ - ~chunked_reader(); + ~chunked_reader() override; /** * @copydoc cudf::io::chunked_parquet_reader::has_next diff --git a/cpp/include/cudf/io/json.hpp b/cpp/include/cudf/io/json.hpp index 65ba8f25577..8de690482f9 100644 --- a/cpp/include/cudf/io/json.hpp +++ b/cpp/include/cudf/io/json.hpp @@ -26,6 +26,7 @@ #include #include +#include #include #include @@ -166,9 +167,9 @@ class json_reader_options { * * @returns Data types of the columns */ - std::variant, - std::map, - std::map> const& + [[nodiscard]] std::variant, + std::map, + std::map> const& get_dtypes() const { return _dtypes; @@ -179,28 +180,28 @@ class json_reader_options { * * @return Compression format of the source */ - compression_type get_compression() const { return _compression; } + [[nodiscard]] compression_type get_compression() const { return _compression; } /** * @brief Returns number of bytes to skip from source start. * * @return Number of bytes to skip from source start */ - size_t get_byte_range_offset() const { return _byte_range_offset; } + [[nodiscard]] size_t get_byte_range_offset() const { return _byte_range_offset; } /** * @brief Returns number of bytes to read. * * @return Number of bytes to read */ - size_t get_byte_range_size() const { return _byte_range_size; } + [[nodiscard]] size_t get_byte_range_size() const { return _byte_range_size; } /** * @brief Returns number of bytes to read with padding. 
* * @return Number of bytes to read with padding */ - size_t get_byte_range_size_with_padding() const + [[nodiscard]] size_t get_byte_range_size_with_padding() const { if (_byte_range_size == 0) { return 0; @@ -214,7 +215,7 @@ class json_reader_options { * * @return Number of bytes to pad */ - size_t get_byte_range_padding() const + [[nodiscard]] size_t get_byte_range_padding() const { auto const num_columns = std::visit([](auto const& dtypes) { return dtypes.size(); }, _dtypes); @@ -236,67 +237,68 @@ class json_reader_options { * * @return Delimiter separating records in JSON lines */ - char get_delimiter() const { return _delimiter; } + [[nodiscard]] char get_delimiter() const { return _delimiter; } /** * @brief Whether to read the file as a json object per line. * * @return `true` if reading the file as a json object per line */ - bool is_enabled_lines() const { return _lines; } + [[nodiscard]] bool is_enabled_lines() const { return _lines; } /** * @brief Whether to parse mixed types as a string column. * * @return `true` if mixed types are parsed as a string column */ - bool is_enabled_mixed_types_as_string() const { return _mixed_types_as_string; } + [[nodiscard]] bool is_enabled_mixed_types_as_string() const { return _mixed_types_as_string; } /** * @brief Whether to prune columns on read, selected based on the @ref set_dtypes option. * * When set as true, if the reader options include @ref set_dtypes, then * the reader will only return those columns which are mentioned in @ref set_dtypes. - * If false, then all columns are returned, independent of the @ref set_dtypes setting. + * If false, then all columns are returned, independent of the @ref set_dtypes + * setting. * * @return True if column pruning is enabled */ - bool is_enabled_prune_columns() const { return _prune_columns; } + [[nodiscard]] bool is_enabled_prune_columns() const { return _prune_columns; } /** * @brief Whether to parse dates as DD/MM versus MM/DD. * * @returns true if dates are parsed as DD/MM, false if MM/DD */ - bool is_enabled_dayfirst() const { return _dayfirst; } + [[nodiscard]] bool is_enabled_dayfirst() const { return _dayfirst; } /** * @brief Whether the reader should keep quotes of string values. * * @returns true if the reader should keep quotes, false otherwise */ - bool is_enabled_keep_quotes() const { return _keep_quotes; } + [[nodiscard]] bool is_enabled_keep_quotes() const { return _keep_quotes; } /** * @brief Whether the reader should normalize single quotes around strings * * @returns true if the reader should normalize single quotes, false otherwise */ - bool is_enabled_normalize_single_quotes() const { return _normalize_single_quotes; } + [[nodiscard]] bool is_enabled_normalize_single_quotes() const { return _normalize_single_quotes; } /** * @brief Whether the reader should normalize unquoted whitespace characters * * @returns true if the reader should normalize whitespace, false otherwise */ - bool is_enabled_normalize_whitespace() const { return _normalize_whitespace; } + [[nodiscard]] bool is_enabled_normalize_whitespace() const { return _normalize_whitespace; } /** * @brief Queries the JSON reader's behavior on invalid JSON lines. * * @returns An enum that specifies the JSON reader's behavior on invalid JSON lines. */ - json_recovery_mode_t recovery_mode() const { return _recovery_mode; } + [[nodiscard]] json_recovery_mode_t recovery_mode() const { return _recovery_mode; } /** * @brief Set data types for columns to be read. 
@@ -717,8 +719,8 @@ class json_writer_options { * @param sink The sink used for writer output * @param table Table to be written to output */ - explicit json_writer_options(sink_info const& sink, table_view const& table) - : _sink(sink), _table(table), _rows_per_chunk(table.num_rows()) + explicit json_writer_options(sink_info sink, table_view table) + : _sink(std::move(sink)), _table(std::move(table)), _rows_per_chunk(table.num_rows()) { } diff --git a/cpp/include/cudf/io/orc.hpp b/cpp/include/cudf/io/orc.hpp index 8140f8897b7..623c1d9fc72 100644 --- a/cpp/include/cudf/io/orc.hpp +++ b/cpp/include/cudf/io/orc.hpp @@ -28,6 +28,7 @@ #include #include #include +#include #include namespace cudf { @@ -125,7 +126,7 @@ class orc_reader_options { * * @return Number of rows to skip from the start */ - int64_t get_skip_rows() const { return _skip_rows; } + [[nodiscard]] int64_t get_skip_rows() const { return _skip_rows; } /** * @brief Returns number of row to read. @@ -133,35 +134,38 @@ class orc_reader_options { * @return Number of rows to read; `nullopt` if the option hasn't been set (in which case the file * is read until the end) */ - std::optional const& get_num_rows() const { return _num_rows; } + [[nodiscard]] std::optional const& get_num_rows() const { return _num_rows; } /** * @brief Whether to use row index to speed-up reading. * * @return `true` if row index is used to speed-up reading */ - bool is_enabled_use_index() const { return _use_index; } + [[nodiscard]] bool is_enabled_use_index() const { return _use_index; } /** * @brief Whether to use numpy-compatible dtypes. * * @return `true` if numpy-compatible dtypes are used */ - bool is_enabled_use_np_dtypes() const { return _use_np_dtypes; } + [[nodiscard]] bool is_enabled_use_np_dtypes() const { return _use_np_dtypes; } /** * @brief Returns timestamp type to which timestamp column will be cast. * * @return Timestamp type to which timestamp column will be cast */ - data_type get_timestamp_type() const { return _timestamp_type; } + [[nodiscard]] data_type get_timestamp_type() const { return _timestamp_type; } /** * @brief Returns fully qualified names of columns that should be read as 128-bit Decimal. 
* * @return Fully qualified names of columns that should be read as 128-bit Decimal */ - std::vector const& get_decimal128_columns() const { return _decimal128_columns; } + [[nodiscard]] std::vector const& get_decimal128_columns() const + { + return _decimal128_columns; + } // Setters @@ -603,8 +607,8 @@ class orc_writer_options { * @param sink The sink used for writer output * @param table Table to be written to output */ - explicit orc_writer_options(sink_info const& sink, table_view const& table) - : _sink(sink), _table(table) + explicit orc_writer_options(sink_info sink, table_view table) + : _sink(std::move(sink)), _table(std::move(table)) { } @@ -676,7 +680,7 @@ class orc_writer_options { * * @return Row index stride */ - auto get_row_index_stride() const + [[nodiscard]] auto get_row_index_stride() const { auto const unaligned_stride = std::min(_row_index_stride, get_stripe_size_rows()); return unaligned_stride - unaligned_stride % 8; @@ -1048,7 +1052,7 @@ class chunked_orc_writer_options { * * @param sink The sink used for writer output */ - chunked_orc_writer_options(sink_info const& sink) : _sink(sink) {} + chunked_orc_writer_options(sink_info sink) : _sink(std::move(sink)) {} public: /** @@ -1107,7 +1111,7 @@ class chunked_orc_writer_options { * * @return Row index stride */ - auto get_row_index_stride() const + [[nodiscard]] auto get_row_index_stride() const { auto const unaligned_stride = std::min(_row_index_stride, get_stripe_size_rows()); return unaligned_stride - unaligned_stride % 8; diff --git a/cpp/include/cudf/io/parquet.hpp b/cpp/include/cudf/io/parquet.hpp index 51eeed5b721..431f14af522 100644 --- a/cpp/include/cudf/io/parquet.hpp +++ b/cpp/include/cudf/io/parquet.hpp @@ -187,7 +187,7 @@ class parquet_reader_options { * * @return Timestamp type used to cast timestamp columns */ - data_type get_timestamp_type() const { return _timestamp_type; } + [[nodiscard]] data_type get_timestamp_type() const { return _timestamp_type; } /** * @brief Sets names of the columns to be read. 
@@ -626,7 +626,7 @@ class parquet_writer_options_base { * * @param sink The sink used for writer output */ - explicit parquet_writer_options_base(sink_info const& sink) : _sink(sink) {} + explicit parquet_writer_options_base(sink_info sink) : _sink(std::move(sink)) {} public: /** @@ -1287,7 +1287,7 @@ class chunked_parquet_writer_options : public parquet_writer_options_base { * * @param sink Sink used for writer output */ - explicit chunked_parquet_writer_options(sink_info const& sink); + explicit chunked_parquet_writer_options(sink_info sink); friend chunked_parquet_writer_options_builder; diff --git a/cpp/include/cudf/io/types.hpp b/cpp/include/cudf/io/types.hpp index 150e997f533..0dab1c606de 100644 --- a/cpp/include/cudf/io/types.hpp +++ b/cpp/include/cudf/io/types.hpp @@ -30,6 +30,7 @@ #include #include #include +#include #include namespace cudf { @@ -247,10 +248,10 @@ struct column_name_info { * @param _is_nullable True if column is nullable * @param _is_binary True if column is binary data */ - column_name_info(std::string const& _name, + column_name_info(std::string _name, std::optional _is_nullable = std::nullopt, std::optional _is_binary = std::nullopt) - : name(_name), is_nullable(_is_nullable), is_binary(_is_binary) + : name(std::move(_name)), is_nullable(_is_nullable), is_binary(_is_binary) { } diff --git a/cpp/include/cudf/join.hpp b/cpp/include/cudf/join.hpp index 825f758adbd..ba485bd6372 100644 --- a/cpp/include/cudf/join.hpp +++ b/cpp/include/cudf/join.hpp @@ -336,8 +336,8 @@ class hash_join { * the result of performing an inner join between two tables with `build` and `probe` * as the join keys . */ - std::pair>, - std::unique_ptr>> + [[nodiscard]] std::pair>, + std::unique_ptr>> inner_join(cudf::table_view const& probe, std::optional output_size = {}, rmm::cuda_stream_view stream = cudf::get_default_stream(), @@ -359,10 +359,10 @@ class hash_join { * * @return A pair of columns [`left_indices`, `right_indices`] that can be used to construct * the result of performing a left join between two tables with `build` and `probe` - * as the join keys . + * as the join keys. */ - std::pair>, - std::unique_ptr>> + [[nodiscard]] std::pair>, + std::unique_ptr>> left_join(cudf::table_view const& probe, std::optional output_size = {}, rmm::cuda_stream_view stream = cudf::get_default_stream(), @@ -386,8 +386,8 @@ class hash_join { * the result of performing a full join between two tables with `build` and `probe` * as the join keys . */ - std::pair>, - std::unique_ptr>> + [[nodiscard]] std::pair>, + std::unique_ptr>> full_join(cudf::table_view const& probe, std::optional output_size = {}, rmm::cuda_stream_view stream = cudf::get_default_stream(), @@ -440,7 +440,7 @@ class hash_join { * @return The exact number of output when performing a full join between two tables with `build` * and `probe` as the join keys . */ - std::size_t full_join_size( + [[nodiscard]] std::size_t full_join_size( cudf::table_view const& probe, rmm::cuda_stream_view stream = cudf::get_default_stream(), rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource()) const; @@ -492,12 +492,12 @@ class distinct_hash_join { * @param stream CUDA stream used for device memory operations and kernel launches * @param mr Device memory resource used to allocate the returned indices' device memory. * - * @return A pair of columns [`build_indices`, `probe_indices`] that can be used to construct - * the result of performing an inner join between two tables with `build` and `probe` - * as the join keys. 
+ * @return A pair of columns [`build_indices`, `probe_indices`] that can be used to + * construct the result of performing an inner join between two tables + * with `build` and `probe` as the join keys. */ - std::pair>, - std::unique_ptr>> + [[nodiscard]] std::pair>, + std::unique_ptr>> inner_join(rmm::cuda_stream_view stream = cudf::get_default_stream(), rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource()) const; @@ -512,10 +512,11 @@ class distinct_hash_join { * @param stream CUDA stream used for device memory operations and kernel launches * @param mr Device memory resource used to allocate the returned table and columns' device * memory. - * @return A `build_indices` column that can be used to construct the result of performing a left - * join between two tables with `build` and `probe` as the join keys. + * @return A `build_indices` column that can be used to construct the result of + * performing a left join between two tables with `build` and `probe` as the join + * keys. */ - std::unique_ptr> left_join( + [[nodiscard]] std::unique_ptr> left_join( rmm::cuda_stream_view stream = cudf::get_default_stream(), rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource()) const; diff --git a/cpp/include/cudf/scalar/scalar.hpp b/cpp/include/cudf/scalar/scalar.hpp index da1d0d743a7..d78907b473a 100644 --- a/cpp/include/cudf/scalar/scalar.hpp +++ b/cpp/include/cudf/scalar/scalar.hpp @@ -187,7 +187,7 @@ class fixed_width_scalar : public scalar { * @param stream CUDA stream used for device memory operations. * @return Value of the scalar */ - T value(rmm::cuda_stream_view stream = cudf::get_default_stream()) const; + [[nodiscard]] T value(rmm::cuda_stream_view stream = cudf::get_default_stream()) const; /** * @brief Returns a raw pointer to the value in device memory. @@ -199,7 +199,7 @@ class fixed_width_scalar : public scalar { * @brief Returns a const raw pointer to the value in device memory. * @return A const raw pointer to the value in device memory */ - T const* data() const; + [[nodiscard]] T const* data() const; protected: rmm::device_scalar _data; ///< device memory containing the value @@ -245,8 +245,8 @@ class numeric_scalar : public detail::fixed_width_scalar { static_assert(is_numeric(), "Unexpected non-numeric type."); public: - numeric_scalar() = delete; - ~numeric_scalar() = default; + numeric_scalar() = delete; + ~numeric_scalar() override = default; /** * @brief Move constructor for numeric_scalar. @@ -393,7 +393,7 @@ class fixed_point_scalar : public scalar { * @param stream CUDA stream used for device memory operations. * @return The value of the scalar */ - rep_type value(rmm::cuda_stream_view stream = cudf::get_default_stream()) const; + [[nodiscard]] rep_type value(rmm::cuda_stream_view stream = cudf::get_default_stream()) const; /** * @brief Get the decimal32, decimal64 or decimal128. @@ -401,7 +401,8 @@ class fixed_point_scalar : public scalar { * @param stream CUDA stream used for device memory operations. * @return The decimal32, decimal64 or decimal128 value */ - T fixed_point_value(rmm::cuda_stream_view stream = cudf::get_default_stream()) const; + [[nodiscard]] T fixed_point_value( + rmm::cuda_stream_view stream = cudf::get_default_stream()) const; /** * @brief Explicit conversion operator to get the value of the scalar on the host. @@ -418,7 +419,7 @@ class fixed_point_scalar : public scalar { * @brief Returns a const raw pointer to the value in device memory. 
* @return a const raw pointer to the value in device memory */ - rep_type const* data() const; + [[nodiscard]] rep_type const* data() const; protected: rmm::device_scalar _data; ///< device memory containing the value @@ -565,8 +566,8 @@ class chrono_scalar : public detail::fixed_width_scalar { static_assert(is_chrono(), "Unexpected non-chrono type"); public: - chrono_scalar() = delete; - ~chrono_scalar() = default; + chrono_scalar() = delete; + ~chrono_scalar() override = default; /** * @brief Move constructor for chrono_scalar. diff --git a/cpp/include/cudf/strings/regex/regex_program.hpp b/cpp/include/cudf/strings/regex/regex_program.hpp index bdf541f455f..95c86ae0f8a 100644 --- a/cpp/include/cudf/strings/regex/regex_program.hpp +++ b/cpp/include/cudf/strings/regex/regex_program.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2022, NVIDIA CORPORATION. + * Copyright (c) 2022-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -74,35 +74,35 @@ struct regex_program { * * @return regex pattern as a string */ - std::string pattern() const; + [[nodiscard]] std::string pattern() const; /** * @brief Return the regex_flags used to create this instance * * @return regex flags setting */ - regex_flags flags() const; + [[nodiscard]] regex_flags flags() const; /** * @brief Return the capture_groups used to create this instance * * @return capture groups setting */ - capture_groups capture() const; + [[nodiscard]] capture_groups capture() const; /** * @brief Return the number of instructions in this instance * * @return Number of instructions */ - int32_t instructions_count() const; + [[nodiscard]] int32_t instructions_count() const; /** * @brief Return the number of capture groups in this instance * * @return Number of groups */ - int32_t groups_count() const; + [[nodiscard]] int32_t groups_count() const; /** * @brief Return the size of the working memory for the regex execution @@ -110,7 +110,7 @@ struct regex_program { * @param num_strings Number of strings for computation * @return Size of the working memory in bytes */ - std::size_t compute_working_memory_size(int32_t num_strings) const; + [[nodiscard]] std::size_t compute_working_memory_size(int32_t num_strings) const; ~regex_program(); diff --git a/cpp/include/cudf/strings/string_view.cuh b/cpp/include/cudf/strings/string_view.cuh index 74df1ea1887..93cc787683b 100644 --- a/cpp/include/cudf/strings/string_view.cuh +++ b/cpp/include/cudf/strings/string_view.cuh @@ -1,5 +1,5 @@ /* - * Copyright (c) 2019-2023, NVIDIA CORPORATION. + * Copyright (c) 2019-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. 
@@ -110,7 +110,7 @@ static __constant__ char max_string_sentinel[5]{"\xF7\xBF\xBF\xBF"}; * * @return An empty string */ -CUDF_HOST_DEVICE inline string_view string_view::min() { return string_view(); } +CUDF_HOST_DEVICE inline string_view string_view::min() { return {}; } /** * @brief Return maximum value associated with the string type @@ -130,7 +130,7 @@ CUDF_HOST_DEVICE inline string_view string_view::max() CUDF_CUDA_TRY( cudaGetSymbolAddress((void**)&psentinel, cudf::strings::detail::max_string_sentinel)); #endif - return string_view(psentinel, 4); + return {psentinel, 4}; } __device__ inline size_type string_view::length() const @@ -439,7 +439,7 @@ __device__ inline string_view string_view::substr(size_type pos, size_type count auto const itr = begin() + pos; auto const spos = itr.byte_offset(); auto const epos = count >= 0 ? (itr + count).byte_offset() : size_bytes(); - return string_view(data() + spos, epos - spos); + return {data() + spos, epos - spos}; } __device__ inline size_type string_view::character_offset(size_type bytepos) const diff --git a/cpp/include/cudf/table/table.hpp b/cpp/include/cudf/table/table.hpp index 8efe6eb8c72..c4f14af53fb 100644 --- a/cpp/include/cudf/table/table.hpp +++ b/cpp/include/cudf/table/table.hpp @@ -144,7 +144,7 @@ class table { */ template - table_view select(InputIterator begin, InputIterator end) const + [[nodiscard]] table_view select(InputIterator begin, InputIterator end) const { std::vector columns(std::distance(begin, end)); std::transform( diff --git a/cpp/include/cudf/table/table_view.hpp b/cpp/include/cudf/table/table_view.hpp index ad12b1eef4e..a71e0558dec 100644 --- a/cpp/include/cudf/table/table_view.hpp +++ b/cpp/include/cudf/table/table_view.hpp @@ -123,7 +123,7 @@ class table_view_base { * @param column_index The index of the desired column * @return A reference to the desired column */ - ColumnView const& column(size_type column_index) const; + [[nodiscard]] ColumnView const& column(size_type column_index) const; /** * @brief Returns the number of columns @@ -224,7 +224,7 @@ class table_view : public detail::table_view_base { * specified by the elements of `column_indices` */ template - table_view select(InputIterator begin, InputIterator end) const + [[nodiscard]] table_view select(InputIterator begin, InputIterator end) const { std::vector columns(std::distance(begin, end)); std::transform(begin, end, columns.begin(), [this](auto index) { return this->column(index); }); diff --git a/cpp/include/cudf/utilities/error.hpp b/cpp/include/cudf/utilities/error.hpp index 719d44a9ab3..f019f516b84 100644 --- a/cpp/include/cudf/utilities/error.hpp +++ b/cpp/include/cudf/utilities/error.hpp @@ -48,7 +48,7 @@ struct stacktrace_recorder { * * @return The pointer to a null-terminated string storing the output stacktrace */ - char const* stacktrace() const { return _stacktrace.c_str(); } + [[nodiscard]] char const* stacktrace() const { return _stacktrace.c_str(); } protected: std::string const _stacktrace; //!< The whole stacktrace stored as one string. @@ -78,7 +78,7 @@ struct logic_error : public std::logic_error, public stacktrace_recorder { // TODO Add an error code member? 
This would be useful for translating an // exception to an error code in a pure-C API - ~logic_error() + ~logic_error() override { // Needed so that the first instance of the implicit destructor for any TU isn't 'constructed' // from a host+device function marking the implicit version also as host+device @@ -106,7 +106,7 @@ struct cuda_error : public std::runtime_error, public stacktrace_recorder { * * @return CUDA error code */ - cudaError_t error_code() const { return _cudaError; } + [[nodiscard]] cudaError_t error_code() const { return _cudaError; } protected: cudaError_t _cudaError; //!< CUDA error code @@ -237,7 +237,7 @@ inline void throw_cuda_error(cudaError_t error, char const* file, unsigned int l // Calls cudaGetLastError to clear the error status. It is nearly certain that a fatal error // occurred if it still returns the same error after a cleanup. cudaGetLastError(); - auto const last = cudaFree(0); + auto const last = cudaFree(nullptr); auto const msg = std::string{"CUDA error encountered at: " + std::string{file} + ":" + std::to_string(line) + ": " + std::to_string(error) + " " + cudaGetErrorName(error) + " " + cudaGetErrorString(error)}; diff --git a/cpp/include/cudf/utilities/span.hpp b/cpp/include/cudf/utilities/span.hpp index 47e92d61a9f..3b35e60e034 100644 --- a/cpp/include/cudf/utilities/span.hpp +++ b/cpp/include/cudf/utilities/span.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2020-2023, NVIDIA CORPORATION. + * Copyright (c) 2020-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -28,6 +28,7 @@ #include #include #include +#include namespace cudf { /** @@ -90,7 +91,7 @@ class span_base { * * @return Reference to the first element in the span */ - constexpr reference front() const { return _data[0]; } + [[nodiscard]] constexpr reference front() const { return _data[0]; } // not noexcept due to undefined behavior when size = 0 /** * @brief Returns a reference to the last element in the span. @@ -99,7 +100,7 @@ class span_base { * * @return Reference to the last element in the span */ - constexpr reference back() const { return _data[_size - 1]; } + [[nodiscard]] constexpr reference back() const { return _data[_size - 1]; } // not noexcept due to undefined behavior when idx < 0 || idx >= size /** * @brief Returns a reference to the idx-th element of the sequence. @@ -119,7 +120,7 @@ class span_base { * * @return An iterator to the first element of the span */ - constexpr iterator begin() const noexcept { return _data; } + [[nodiscard]] constexpr iterator begin() const noexcept { return _data; } /** * @brief Returns an iterator to the element following the last element of the span. * @@ -127,13 +128,13 @@ class span_base { * * @return An iterator to the element following the last element of the span */ - constexpr iterator end() const noexcept { return _data + _size; } + [[nodiscard]] constexpr iterator end() const noexcept { return _data + _size; } /** * @brief Returns a pointer to the beginning of the sequence. * * @return A pointer to the first element of the span */ - constexpr pointer data() const noexcept { return _data; } + [[nodiscard]] constexpr pointer data() const noexcept { return _data; } /** * @brief Returns the number of elements in the span. @@ -160,7 +161,10 @@ class span_base { * @param count Number of elements from the beginning of this span to put in the subspan. 
* @return A subspan of the first N elements of the sequence */ - constexpr Derived first(size_type count) const noexcept { return Derived(_data, count); } + [[nodiscard]] constexpr Derived first(size_type count) const noexcept + { + return Derived(_data, count); + } /** * @brief Obtains a subspan consisting of the last N elements of the sequence @@ -168,7 +172,7 @@ class span_base { * @param count Number of elements from the end of this span to put in the subspan * @return A subspan of the last N elements of the sequence */ - constexpr Derived last(size_type count) const noexcept + [[nodiscard]] constexpr Derived last(size_type count) const noexcept { return Derived(_data + _size - count, count); } @@ -180,7 +184,7 @@ class span_base { * @param count The number of elements in the subspan * @return A subspan of the sequence, of requested count and offset */ - constexpr Derived subspan(size_type offset, size_type count) const noexcept + [[nodiscard]] constexpr Derived subspan(size_type offset, size_type count) const noexcept { return Derived(_data + offset, count); } @@ -365,7 +369,7 @@ class base_2dspan { * @param data Pointer to the data * @param size Size of the 2D span as pair */ - base_2dspan(T* data, size_type size) noexcept : _data{data}, _size{size} {} + base_2dspan(T* data, size_type size) noexcept : _data{data}, _size{std::move(size)} {} /** * @brief Returns a pointer to the beginning of the sequence. diff --git a/cpp/include/cudf/utilities/thread_pool.hpp b/cpp/include/cudf/utilities/thread_pool.hpp index 74a2531710b..c8c3eb097c4 100644 --- a/cpp/include/cudf/utilities/thread_pool.hpp +++ b/cpp/include/cudf/utilities/thread_pool.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2021-2023, NVIDIA CORPORATION. + * Copyright (c) 2021-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -201,8 +201,8 @@ class thread_pool { running = false; destroy_threads(); thread_count = _thread_count ? _thread_count : std::thread::hardware_concurrency(); - threads.reset(new std::thread[thread_count]); - paused = was_paused; + threads = std::make_unique(thread_count); + paused = was_paused; create_threads(); running = true; } diff --git a/cpp/include/cudf/wrappers/dictionary.hpp b/cpp/include/cudf/wrappers/dictionary.hpp index 37264c5a33c..95f4ac00a53 100644 --- a/cpp/include/cudf/wrappers/dictionary.hpp +++ b/cpp/include/cudf/wrappers/dictionary.hpp @@ -87,7 +87,7 @@ struct dictionary_wrapper { * * @return The value of this dictionary wrapper */ - CUDF_HOST_DEVICE inline value_type value() const { return _value; } + CUDF_HOST_DEVICE [[nodiscard]] inline value_type value() const { return _value; } /** * @brief Returns the maximum value of the value type. diff --git a/cpp/include/cudf/wrappers/durations.hpp b/cpp/include/cudf/wrappers/durations.hpp index 62aa22c2788..840dba4f4ba 100644 --- a/cpp/include/cudf/wrappers/durations.hpp +++ b/cpp/include/cudf/wrappers/durations.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2020-2022, NVIDIA CORPORATION. + * Copyright (c) 2020-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. 
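The durations.hpp hunk that follows (and the matching timestamps.hpp hunk further down) drops the empty "" message argument from each static_assert, which C++17 permits. A small stand-alone illustration, using a local std::chrono alias rather than cudf's duration types:

// Since C++17, static_assert accepts a bare condition; the empty-string
// message form is redundant. Both assertions below check the same thing.
#include <chrono>
#include <cstdint>

using duration_s = std::chrono::duration<int64_t>;  // local stand-in, not cudf's alias

static_assert(sizeof(duration_s) == sizeof(duration_s::rep), "");  // pre-C++17 spelling
static_assert(sizeof(duration_s) == sizeof(duration_s::rep));      // C++17 spelling

int main() { return 0; }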
@@ -56,13 +56,13 @@ using duration_us = cuda::std::chrono::duration; -static_assert(sizeof(duration_D) == sizeof(typename duration_D::rep), ""); -static_assert(sizeof(duration_h) == sizeof(typename duration_h::rep), ""); -static_assert(sizeof(duration_m) == sizeof(typename duration_m::rep), ""); -static_assert(sizeof(duration_s) == sizeof(typename duration_s::rep), ""); -static_assert(sizeof(duration_ms) == sizeof(typename duration_ms::rep), ""); -static_assert(sizeof(duration_us) == sizeof(typename duration_us::rep), ""); -static_assert(sizeof(duration_ns) == sizeof(typename duration_ns::rep), ""); +static_assert(sizeof(duration_D) == sizeof(typename duration_D::rep)); +static_assert(sizeof(duration_h) == sizeof(typename duration_h::rep)); +static_assert(sizeof(duration_m) == sizeof(typename duration_m::rep)); +static_assert(sizeof(duration_s) == sizeof(typename duration_s::rep)); +static_assert(sizeof(duration_ms) == sizeof(typename duration_ms::rep)); +static_assert(sizeof(duration_us) == sizeof(typename duration_us::rep)); +static_assert(sizeof(duration_ns) == sizeof(typename duration_ns::rep)); /** @} */ // end of group } // namespace cudf diff --git a/cpp/include/cudf/wrappers/timestamps.hpp b/cpp/include/cudf/wrappers/timestamps.hpp index 0341ac6ede4..5194a3e8f96 100644 --- a/cpp/include/cudf/wrappers/timestamps.hpp +++ b/cpp/include/cudf/wrappers/timestamps.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2019-2022, NVIDIA CORPORATION. + * Copyright (c) 2019-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -73,13 +73,13 @@ using timestamp_us = detail::timestamp; */ using timestamp_ns = detail::timestamp; -static_assert(sizeof(timestamp_D) == sizeof(typename timestamp_D::rep), ""); -static_assert(sizeof(timestamp_h) == sizeof(typename timestamp_h::rep), ""); -static_assert(sizeof(timestamp_m) == sizeof(typename timestamp_m::rep), ""); -static_assert(sizeof(timestamp_s) == sizeof(typename timestamp_s::rep), ""); -static_assert(sizeof(timestamp_ms) == sizeof(typename timestamp_ms::rep), ""); -static_assert(sizeof(timestamp_us) == sizeof(typename timestamp_us::rep), ""); -static_assert(sizeof(timestamp_ns) == sizeof(typename timestamp_ns::rep), ""); +static_assert(sizeof(timestamp_D) == sizeof(typename timestamp_D::rep)); +static_assert(sizeof(timestamp_h) == sizeof(typename timestamp_h::rep)); +static_assert(sizeof(timestamp_m) == sizeof(typename timestamp_m::rep)); +static_assert(sizeof(timestamp_s) == sizeof(typename timestamp_s::rep)); +static_assert(sizeof(timestamp_ms) == sizeof(typename timestamp_ms::rep)); +static_assert(sizeof(timestamp_us) == sizeof(typename timestamp_us::rep)); +static_assert(sizeof(timestamp_ns) == sizeof(typename timestamp_ns::rep)); /** @} */ // end of group } // namespace cudf diff --git a/cpp/include/cudf_test/base_fixture.hpp b/cpp/include/cudf_test/base_fixture.hpp index 18f75bbc842..0e35ff64af4 100644 --- a/cpp/include/cudf_test/base_fixture.hpp +++ b/cpp/include/cudf_test/base_fixture.hpp @@ -66,7 +66,7 @@ class BaseFixtureWithParam : public ::testing::TestWithParam { * all tests inheriting from this fixture * @return pointer to memory resource */ - rmm::device_async_resource_ref mr() const { return _mr; } + [[nodiscard]] rmm::device_async_resource_ref mr() const { return _mr; } }; /** diff --git a/cpp/include/cudf_test/column_wrapper.hpp b/cpp/include/cudf_test/column_wrapper.hpp index dc873658abf..47d17988775 100644 --- 
a/cpp/include/cudf_test/column_wrapper.hpp +++ b/cpp/include/cudf_test/column_wrapper.hpp @@ -1121,14 +1121,20 @@ class dictionary_column_wrapper : public detail::column_wrapper { * * @return column_view to keys column */ - column_view keys() const { return cudf::dictionary_column_view{wrapped->view()}.keys(); } + [[nodiscard]] column_view keys() const + { + return cudf::dictionary_column_view{wrapped->view()}.keys(); + } /** * @brief Access indices column view * * @return column_view to indices column */ - column_view indices() const { return cudf::dictionary_column_view{wrapped->view()}.indices(); } + [[nodiscard]] column_view indices() const + { + return cudf::dictionary_column_view{wrapped->view()}.indices(); + } /** * @brief Default constructor initializes an empty dictionary column of strings @@ -1792,7 +1798,10 @@ class lists_column_wrapper : public detail::column_wrapper { return {std::move(cols), std::move(stubs)}; } - column_view get_view() const { return root ? lists_column_view(*wrapped).child() : *wrapped; } + [[nodiscard]] column_view get_view() const + { + return root ? lists_column_view(*wrapped).child() : *wrapped; + } int depth = 0; bool root = false; diff --git a/cpp/include/cudf_test/stream_checking_resource_adaptor.hpp b/cpp/include/cudf_test/stream_checking_resource_adaptor.hpp index cafde6ca7d5..5a077e86a0f 100644 --- a/cpp/include/cudf_test/stream_checking_resource_adaptor.hpp +++ b/cpp/include/cudf_test/stream_checking_resource_adaptor.hpp @@ -110,7 +110,7 @@ class stream_checking_resource_adaptor final : public rmm::mr::device_memory_res * @param other The other resource to compare to * @return Whether or not the two resources are equivalent */ - bool do_is_equal(device_memory_resource const& other) const noexcept override + [[nodiscard]] bool do_is_equal(device_memory_resource const& other) const noexcept override { if (this == &other) { return true; } auto cast = dynamic_cast const*>(&other); diff --git a/cpp/src/binaryop/binaryop.cpp b/cpp/src/binaryop/binaryop.cpp index ac31f9045fe..8ac1491547d 100644 --- a/cpp/src/binaryop/binaryop.cpp +++ b/cpp/src/binaryop/binaryop.cpp @@ -153,7 +153,7 @@ void binary_operation(mutable_column_view& out, cudf::jit::get_program_cache(*binaryop_jit_kernel_cu_jit) .get_kernel(kernel_name, {}, {{"binaryop/jit/operation-udf.hpp", cuda_source}}, {"-arch=sm_."}) - ->configure_1d_max_occupancy(0, 0, 0, stream.value()) + ->configure_1d_max_occupancy(0, 0, nullptr, stream.value()) ->launch(out.size(), cudf::jit::get_data_ptr(out), cudf::jit::get_data_ptr(lhs), diff --git a/cpp/src/binaryop/compiled/operation.cuh b/cpp/src/binaryop/compiled/operation.cuh index 43b4bd232c4..57113785a29 100644 --- a/cpp/src/binaryop/compiled/operation.cuh +++ b/cpp/src/binaryop/compiled/operation.cuh @@ -173,8 +173,8 @@ struct PMod { __device__ inline auto operator()(TypeLhs x, TypeRhs y) { using common_t = std::common_type_t; - common_t xconv = static_cast(x); - common_t yconv = static_cast(y); + auto xconv = static_cast(x); + auto yconv = static_cast(y); auto rem = xconv % yconv; if constexpr (std::is_signed_v) if (rem < 0) rem = (rem + yconv) % yconv; @@ -188,8 +188,8 @@ struct PMod { __device__ inline auto operator()(TypeLhs x, TypeRhs y) { using common_t = std::common_type_t; - common_t xconv = static_cast(x); - common_t yconv = static_cast(y); + auto xconv = static_cast(x); + auto yconv = static_cast(y); auto rem = std::fmod(xconv, yconv); if (rem < 0) rem = std::fmod(rem + yconv, yconv); return rem; diff --git a/cpp/src/binaryop/compiled/util.cpp 
b/cpp/src/binaryop/compiled/util.cpp index 02f4e480ecb..2b6a4f58895 100644 --- a/cpp/src/binaryop/compiled/util.cpp +++ b/cpp/src/binaryop/compiled/util.cpp @@ -123,7 +123,7 @@ struct is_supported_operation_functor { template struct nested_support_functor { template - inline constexpr bool call(data_type out_type) const + [[nodiscard]] inline constexpr bool call(data_type out_type) const { return is_binary_operation_supported{}.template operator()( out_type); @@ -163,7 +163,7 @@ struct is_supported_operation_functor { }; template - inline constexpr bool bool_op(data_type out) const + [[nodiscard]] inline constexpr bool bool_op(data_type out) const { return out.id() == type_id::BOOL8 and is_binary_operation_supported{}.template operator()(); diff --git a/cpp/src/copying/pack.cpp b/cpp/src/copying/pack.cpp index b0208a58896..819ad593c0a 100644 --- a/cpp/src/copying/pack.cpp +++ b/cpp/src/copying/pack.cpp @@ -181,7 +181,7 @@ class metadata_builder_impl { col_type, col_size, col_null_count, data_offset, null_mask_offset, num_children); } - std::vector build() const + [[nodiscard]] std::vector build() const { auto output = std::vector(metadata.size() * sizeof(detail::serialized_column)); std::memcpy(output.data(), metadata.data(), output.size()); diff --git a/cpp/src/datetime/timezone.cpp b/cpp/src/datetime/timezone.cpp index a3471485293..1b0d201501b 100644 --- a/cpp/src/datetime/timezone.cpp +++ b/cpp/src/datetime/timezone.cpp @@ -221,7 +221,7 @@ class posix_parser { /** * @brief Returns the remaining number of characters in the input. */ - auto remaining_char_cnt() const { return end - cur; } + [[nodiscard]] auto remaining_char_cnt() const { return end - cur; } /** * @brief Returns the next character in the input. diff --git a/cpp/src/interop/arrow_utilities.cpp b/cpp/src/interop/arrow_utilities.cpp index 05beecfbf9b..dd9e9600a87 100644 --- a/cpp/src/interop/arrow_utilities.cpp +++ b/cpp/src/interop/arrow_utilities.cpp @@ -23,7 +23,7 @@ namespace cudf { namespace detail { -data_type arrow_to_cudf_type(const ArrowSchemaView* arrow_view) +data_type arrow_to_cudf_type(ArrowSchemaView const* arrow_view) { switch (arrow_view->type) { case NANOARROW_TYPE_NA: return data_type(type_id::EMPTY); diff --git a/cpp/src/interop/arrow_utilities.hpp b/cpp/src/interop/arrow_utilities.hpp index defddb4dc42..4e2628ab689 100644 --- a/cpp/src/interop/arrow_utilities.hpp +++ b/cpp/src/interop/arrow_utilities.hpp @@ -37,7 +37,7 @@ static constexpr int fixed_width_data_buffer_idx = 1; * @param arrow_view SchemaView to pull the logical and storage types from * @return Column type id */ -data_type arrow_to_cudf_type(const ArrowSchemaView* arrow_view); +data_type arrow_to_cudf_type(ArrowSchemaView const* arrow_view); /** * @brief Map cudf column type id to ArrowType id diff --git a/cpp/src/interop/detail/arrow_allocator.cpp b/cpp/src/interop/detail/arrow_allocator.cpp index 3e6a337457a..2a19a5360fe 100644 --- a/cpp/src/interop/detail/arrow_allocator.cpp +++ b/cpp/src/interop/detail/arrow_allocator.cpp @@ -38,7 +38,7 @@ T enable_hugepage(T&& buf) } #ifdef MADV_HUGEPAGE - const auto pagesize = sysconf(_SC_PAGESIZE); + auto const pagesize = sysconf(_SC_PAGESIZE); void* addr = const_cast(buf->data()); if (addr == nullptr) { return std::move(buf); } auto length{static_cast(buf->size())}; diff --git a/cpp/src/interop/from_arrow_host.cu b/cpp/src/interop/from_arrow_host.cu index 36bb35d9419..854a1d68fdc 100644 --- a/cpp/src/interop/from_arrow_host.cu +++ b/cpp/src/interop/from_arrow_host.cu @@ -140,7 +140,7 @@ std::unique_ptr 
dispatch_copy_from_arrow_host::operator()(ArrowSch bool skip_mask) { auto data_buffer = input->buffers[fixed_width_data_buffer_idx]; - const auto buffer_length = bitmask_allocation_size_bytes(input->length + input->offset); + auto const buffer_length = bitmask_allocation_size_bytes(input->length + input->offset); auto data = rmm::device_buffer(buffer_length, stream, mr); CUDF_CUDA_TRY(cudaMemcpyAsync(data.data(), @@ -322,7 +322,7 @@ template <> std::unique_ptr dispatch_copy_from_arrow_host::operator()( ArrowSchemaView* schema, ArrowArray const* input, data_type type, bool skip_mask) { - const void* offset_buffers[2] = {nullptr, input->buffers[fixed_width_data_buffer_idx]}; + void const* offset_buffers[2] = {nullptr, input->buffers[fixed_width_data_buffer_idx]}; ArrowArray offsets_array = { .length = input->offset + input->length + 1, .null_count = 0, diff --git a/cpp/src/io/avro/avro.cpp b/cpp/src/io/avro/avro.cpp index 221cdf93042..2041f03cd81 100644 --- a/cpp/src/io/avro/avro.cpp +++ b/cpp/src/io/avro/avro.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2019-2023, NVIDIA CORPORATION. + * Copyright (c) 2019-2024, NVIDIA CORPORATION. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -485,8 +485,8 @@ std::string schema_parser::get_str() char const* cur = start; while (cur < m_end && *cur++ != '"') ; - int32_t len = static_cast(cur - start - 1); - m_cur = cur; + auto len = static_cast(cur - start - 1); + m_cur = cur; return s.assign(start, std::max(len, 0)); } diff --git a/cpp/src/io/comp/uncomp.cpp b/cpp/src/io/comp/uncomp.cpp index 3e5d966282d..ab516dd585d 100644 --- a/cpp/src/io/comp/uncomp.cpp +++ b/cpp/src/io/comp/uncomp.cpp @@ -305,7 +305,7 @@ std::vector decompress(compression_type compression, host_spannum_entries; i++) { - zip_cdfh_s const* cdfh = reinterpret_cast( + auto const* cdfh = reinterpret_cast( reinterpret_cast(za.cdfh) + cdfh_ofs); int cdfh_len = sizeof(zip_cdfh_s) + cdfh->fname_len + cdfh->extra_len + cdfh->comment_len; if (cdfh_ofs + cdfh_len > za.eocd->cdir_size || cdfh->sig != 0x0201'4b50) { @@ -314,8 +314,8 @@ std::vector decompress(compression_type compression, host_spancomp_method == 8 && cdfh->comp_size > 0 && cdfh->uncomp_size > 0) { - size_t lfh_ofs = cdfh->hdr_ofs; - zip_lfh_s const* lfh = reinterpret_cast(raw + lfh_ofs); + size_t lfh_ofs = cdfh->hdr_ofs; + auto const* lfh = reinterpret_cast(raw + lfh_ofs); if (lfh_ofs + sizeof(zip_lfh_s) <= src.size() && lfh->sig == 0x0403'4b50 && lfh_ofs + sizeof(zip_lfh_s) + lfh->fname_len + lfh->extra_len <= src.size()) { if (lfh->comp_method == 8 && lfh->comp_size > 0 && lfh->uncomp_size > 0) { @@ -340,7 +340,7 @@ std::vector decompress(compression_type compression, host_span 4) { - bz2_file_header_s const* fhdr = reinterpret_cast(raw); + auto const* fhdr = reinterpret_cast(raw); // Check for BZIP2 file signature "BZh1" to "BZh9" if (fhdr->sig[0] == 'B' && fhdr->sig[1] == 'Z' && fhdr->sig[2] == 'h' && fhdr->blksz >= '1' && fhdr->blksz <= '9') { diff --git a/cpp/src/io/functions.cpp b/cpp/src/io/functions.cpp index 1ed8ee5ce06..5daa55d4552 100644 --- a/cpp/src/io/functions.cpp +++ b/cpp/src/io/functions.cpp @@ -306,14 +306,14 @@ raw_orc_statistics read_raw_orc_statistics(source_info const& src_info, // Get file-level statistics, statistics of each column of file for (auto const& stats : metadata.ff.statistics) { - result.file_stats.push_back(std::string(stats.cbegin(), stats.cend())); + result.file_stats.emplace_back(stats.cbegin(), 
stats.cend()); } // Get stripe-level statistics for (auto const& stripes_stats : metadata.md.stripeStats) { result.stripes_stats.emplace_back(); for (auto const& stats : stripes_stats.colStats) { - result.stripes_stats.back().push_back(std::string(stats.cbegin(), stats.cend())); + result.stripes_stats.back().emplace_back(stats.cbegin(), stats.cend()); } } @@ -1026,8 +1026,8 @@ parquet_writer_options_builder& parquet_writer_options_builder::column_chunks_fi return *this; } -chunked_parquet_writer_options::chunked_parquet_writer_options(sink_info const& sink) - : parquet_writer_options_base(sink) +chunked_parquet_writer_options::chunked_parquet_writer_options(sink_info sink) + : parquet_writer_options_base(std::move(sink)) { } diff --git a/cpp/src/io/json/nested_json_gpu.cu b/cpp/src/io/json/nested_json_gpu.cu index b243e4ba006..031edfde4f6 100644 --- a/cpp/src/io/json/nested_json_gpu.cu +++ b/cpp/src/io/json/nested_json_gpu.cu @@ -245,7 +245,7 @@ struct TransduceToken { RelativeOffsetT const relative_offset, SymbolT const read_symbol) const { - const bool is_end_of_invalid_line = + bool const is_end_of_invalid_line = (state_id == static_cast(TT_INV) && match_id == static_cast(dfa_symbol_group_id::DELIMITER)); @@ -265,15 +265,15 @@ struct TransduceToken { // Number of tokens emitted on invalid lines constexpr int32_t num_inv_tokens = 2; - const bool is_delimiter = match_id == static_cast(dfa_symbol_group_id::DELIMITER); + bool const is_delimiter = match_id == static_cast(dfa_symbol_group_id::DELIMITER); // If state is either invalid or we're entering an invalid state, we discard tokens - const bool is_part_of_invalid_line = + bool const is_part_of_invalid_line = (match_id != static_cast(dfa_symbol_group_id::ERROR) && state_id == static_cast(TT_VLD)); // Indicates whether we transition from an invalid line to a potentially valid line - const bool is_end_of_invalid_line = (state_id == static_cast(TT_INV) && is_delimiter); + bool const is_end_of_invalid_line = (state_id == static_cast(TT_INV) && is_delimiter); int32_t const emit_count = is_end_of_invalid_line ? num_inv_tokens : (is_part_of_invalid_line && !is_delimiter ? 1 : 0); diff --git a/cpp/src/io/json/read_json.cu b/cpp/src/io/json/read_json.cu index df5c7bc21e1..e999be8f83a 100644 --- a/cpp/src/io/json/read_json.cu +++ b/cpp/src/io/json/read_json.cu @@ -85,7 +85,7 @@ device_span ingest_raw_input(device_span buffer, sources.end(), prefsum_source_sizes.begin(), std::plus{}, - [](const std::unique_ptr& s) { return s->size(); }); + [](std::unique_ptr const& s) { return s->size(); }); auto upper = std::upper_bound(prefsum_source_sizes.begin(), prefsum_source_sizes.end(), range_offset); size_t start_source = std::distance(prefsum_source_sizes.begin(), upper); diff --git a/cpp/src/io/orc/orc.hpp b/cpp/src/io/orc/orc.hpp index fd55cbb6846..e1403acd455 100644 --- a/cpp/src/io/orc/orc.hpp +++ b/cpp/src/io/orc/orc.hpp @@ -511,7 +511,7 @@ class ProtobufWriter { TypeKind kind, ColStatsBlob const* stats); - std::size_t size() const { return m_buff.size(); } + [[nodiscard]] std::size_t size() const { return m_buff.size(); } uint8_t const* data() { return m_buff.data(); } std::vector& buffer() { return m_buff; } diff --git a/cpp/src/io/orc/orc_field_writer.hpp b/cpp/src/io/orc/orc_field_writer.hpp index 4862562d526..731e9d7687e 100644 --- a/cpp/src/io/orc/orc_field_writer.hpp +++ b/cpp/src/io/orc/orc_field_writer.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2020-2023, NVIDIA CORPORATION. + * Copyright (c) 2020-2024, NVIDIA CORPORATION. 
* * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -31,10 +31,10 @@ namespace io { namespace orc { struct ProtobufWriter::ProtobufFieldWriter { - int struct_size; + int struct_size{0}; ProtobufWriter* p; - ProtobufFieldWriter(ProtobufWriter* pbw) : struct_size(0), p(pbw) {} + ProtobufFieldWriter(ProtobufWriter* pbw) : p(pbw) {} /** * @brief Function to write a unsigned integer to the internal buffer diff --git a/cpp/src/io/orc/reader_impl_chunking.cu b/cpp/src/io/orc/reader_impl_chunking.cu index 43301826003..01ee5ad177d 100644 --- a/cpp/src/io/orc/reader_impl_chunking.cu +++ b/cpp/src/io/orc/reader_impl_chunking.cu @@ -537,7 +537,7 @@ void reader_impl::load_next_stripe_data(read_mode mode) _file_itm_data.selected_stripes.begin() + stripe_start, _file_itm_data.selected_stripes.begin() + stripe_start + stripe_count, std::size_t{0}, - [](std::size_t count, const auto& stripe) { return count + stripe.stripe_info->numberOfRows; }); + [](std::size_t count, auto const& stripe) { return count + stripe.stripe_info->numberOfRows; }); // Decoding range needs to be reset to start from the first position in `decode_stripe_ranges`. _chunk_read_data.curr_decode_stripe_range = 0; diff --git a/cpp/src/io/orc/reader_impl_decode.cu b/cpp/src/io/orc/reader_impl_decode.cu index da9fb802a0a..72eb41b1360 100644 --- a/cpp/src/io/orc/reader_impl_decode.cu +++ b/cpp/src/io/orc/reader_impl_decode.cu @@ -810,7 +810,7 @@ void reader_impl::decompress_and_decode_stripes(read_mode mode) cudf::detail::hostdevice_2dvector(stripe_count, num_lvl_columns, _stream); memset(chunks.base_host_ptr(), 0, chunks.size_bytes()); - const bool use_index = + bool const use_index = _options.use_index && // Do stripes have row group index _metadata.is_row_grp_idx_present() && diff --git a/cpp/src/io/parquet/compact_protocol_reader.cpp b/cpp/src/io/parquet/compact_protocol_reader.cpp index c9212334a96..192833507b0 100644 --- a/cpp/src/io/parquet/compact_protocol_reader.cpp +++ b/cpp/src/io/parquet/compact_protocol_reader.cpp @@ -42,7 +42,7 @@ class parquet_field { public: virtual ~parquet_field() = default; - int field() const { return _field_val; } + [[nodiscard]] int field() const { return _field_val; } }; std::string field_type_string(FieldType type) diff --git a/cpp/src/io/parquet/compact_protocol_writer.hpp b/cpp/src/io/parquet/compact_protocol_writer.hpp index c2e6178acbf..d4778b1ea15 100644 --- a/cpp/src/io/parquet/compact_protocol_writer.hpp +++ b/cpp/src/io/parquet/compact_protocol_writer.hpp @@ -64,11 +64,11 @@ class CompactProtocolWriter { class CompactProtocolFieldWriter { CompactProtocolWriter& writer; size_t struct_start_pos; - int current_field_value; + int current_field_value{0}; public: CompactProtocolFieldWriter(CompactProtocolWriter& caller) - : writer(caller), struct_start_pos(writer.m_buf.size()), current_field_value(0) + : writer(caller), struct_start_pos(writer.m_buf.size()) { } diff --git a/cpp/src/io/parquet/ipc/Schema_generated.h b/cpp/src/io/parquet/ipc/Schema_generated.h index 27141b4af31..c091204417a 100644 --- a/cpp/src/io/parquet/ipc/Schema_generated.h +++ b/cpp/src/io/parquet/ipc/Schema_generated.h @@ -139,13 +139,13 @@ inline const MetadataVersion (&EnumValuesMetadataVersion())[5] return values; } -inline const char* const* EnumNamesMetadataVersion() +inline char const* const* EnumNamesMetadataVersion() { - static const char* const names[6] = {"V1", "V2", "V3", "V4", "V5", nullptr}; + static char const* const names[6] = 
{"V1", "V2", "V3", "V4", "V5", nullptr}; return names; } -inline const char* EnumNameMetadataVersion(MetadataVersion e) +inline char const* EnumNameMetadataVersion(MetadataVersion e) { if (::flatbuffers::IsOutRange(e, MetadataVersion_V1, MetadataVersion_V5)) return ""; const size_t index = static_cast(e); @@ -190,14 +190,14 @@ inline const Feature (&EnumValuesFeature())[3] return values; } -inline const char* const* EnumNamesFeature() +inline char const* const* EnumNamesFeature() { - static const char* const names[4] = { + static char const* const names[4] = { "UNUSED", "DICTIONARY_REPLACEMENT", "COMPRESSED_BODY", nullptr}; return names; } -inline const char* EnumNameFeature(Feature e) +inline char const* EnumNameFeature(Feature e) { if (::flatbuffers::IsOutRange(e, Feature_UNUSED, Feature_COMPRESSED_BODY)) return ""; const size_t index = static_cast(e); @@ -217,13 +217,13 @@ inline const UnionMode (&EnumValuesUnionMode())[2] return values; } -inline const char* const* EnumNamesUnionMode() +inline char const* const* EnumNamesUnionMode() { - static const char* const names[3] = {"Sparse", "Dense", nullptr}; + static char const* const names[3] = {"Sparse", "Dense", nullptr}; return names; } -inline const char* EnumNameUnionMode(UnionMode e) +inline char const* EnumNameUnionMode(UnionMode e) { if (::flatbuffers::IsOutRange(e, UnionMode_Sparse, UnionMode_Dense)) return ""; const size_t index = static_cast(e); @@ -244,13 +244,13 @@ inline const Precision (&EnumValuesPrecision())[3] return values; } -inline const char* const* EnumNamesPrecision() +inline char const* const* EnumNamesPrecision() { - static const char* const names[4] = {"HALF", "SINGLE", "DOUBLE", nullptr}; + static char const* const names[4] = {"HALF", "SINGLE", "DOUBLE", nullptr}; return names; } -inline const char* EnumNamePrecision(Precision e) +inline char const* EnumNamePrecision(Precision e) { if (::flatbuffers::IsOutRange(e, Precision_HALF, Precision_DOUBLE)) return ""; const size_t index = static_cast(e); @@ -270,13 +270,13 @@ inline const DateUnit (&EnumValuesDateUnit())[2] return values; } -inline const char* const* EnumNamesDateUnit() +inline char const* const* EnumNamesDateUnit() { - static const char* const names[3] = {"DAY", "MILLISECOND", nullptr}; + static char const* const names[3] = {"DAY", "MILLISECOND", nullptr}; return names; } -inline const char* EnumNameDateUnit(DateUnit e) +inline char const* EnumNameDateUnit(DateUnit e) { if (::flatbuffers::IsOutRange(e, DateUnit_DAY, DateUnit_MILLISECOND)) return ""; const size_t index = static_cast(e); @@ -299,14 +299,14 @@ inline const TimeUnit (&EnumValuesTimeUnit())[4] return values; } -inline const char* const* EnumNamesTimeUnit() +inline char const* const* EnumNamesTimeUnit() { - static const char* const names[5] = { + static char const* const names[5] = { "SECOND", "MILLISECOND", "MICROSECOND", "NANOSECOND", nullptr}; return names; } -inline const char* EnumNameTimeUnit(TimeUnit e) +inline char const* EnumNameTimeUnit(TimeUnit e) { if (::flatbuffers::IsOutRange(e, TimeUnit_SECOND, TimeUnit_NANOSECOND)) return ""; const size_t index = static_cast(e); @@ -328,13 +328,13 @@ inline const IntervalUnit (&EnumValuesIntervalUnit())[3] return values; } -inline const char* const* EnumNamesIntervalUnit() +inline char const* const* EnumNamesIntervalUnit() { - static const char* const names[4] = {"YEAR_MONTH", "DAY_TIME", "MONTH_DAY_NANO", nullptr}; + static char const* const names[4] = {"YEAR_MONTH", "DAY_TIME", "MONTH_DAY_NANO", nullptr}; return names; } -inline const char* 
EnumNameIntervalUnit(IntervalUnit e) +inline char const* EnumNameIntervalUnit(IntervalUnit e) { if (::flatbuffers::IsOutRange(e, IntervalUnit_YEAR_MONTH, IntervalUnit_MONTH_DAY_NANO)) return ""; const size_t index = static_cast(e); @@ -389,9 +389,9 @@ inline const Type (&EnumValuesType())[27] return values; } -inline const char* const* EnumNamesType() +inline char const* const* EnumNamesType() { - static const char* const names[28] = { + static char const* const names[28] = { "NONE", "Null", "Int", "FloatingPoint", "Binary", "Utf8", "Bool", "Decimal", "Date", "Time", "Timestamp", "Interval", @@ -402,7 +402,7 @@ inline const char* const* EnumNamesType() return names; } -inline const char* EnumNameType(Type e) +inline char const* EnumNameType(Type e) { if (::flatbuffers::IsOutRange(e, Type_NONE, Type_LargeListView)) return ""; const size_t index = static_cast(e); @@ -544,10 +544,10 @@ struct TypeTraits { static const Type enum_value = Type_LargeListView; }; -bool VerifyType(::flatbuffers::Verifier& verifier, const void* obj, Type type); +bool VerifyType(::flatbuffers::Verifier& verifier, void const* obj, Type type); bool VerifyTypeVector(::flatbuffers::Verifier& verifier, - const ::flatbuffers::Vector<::flatbuffers::Offset>* values, - const ::flatbuffers::Vector* types); + ::flatbuffers::Vector<::flatbuffers::Offset> const* values, + ::flatbuffers::Vector const* types); /// ---------------------------------------------------------------------- /// Dictionary encoding metadata @@ -566,13 +566,13 @@ inline const DictionaryKind (&EnumValuesDictionaryKind())[1] return values; } -inline const char* const* EnumNamesDictionaryKind() +inline char const* const* EnumNamesDictionaryKind() { - static const char* const names[2] = {"DenseArray", nullptr}; + static char const* const names[2] = {"DenseArray", nullptr}; return names; } -inline const char* EnumNameDictionaryKind(DictionaryKind e) +inline char const* EnumNameDictionaryKind(DictionaryKind e) { if (::flatbuffers::IsOutRange(e, DictionaryKind_DenseArray, DictionaryKind_DenseArray)) return ""; const size_t index = static_cast(e); @@ -594,13 +594,13 @@ inline const Endianness (&EnumValuesEndianness())[2] return values; } -inline const char* const* EnumNamesEndianness() +inline char const* const* EnumNamesEndianness() { - static const char* const names[3] = {"Little", "Big", nullptr}; + static char const* const names[3] = {"Little", "Big", nullptr}; return names; } -inline const char* EnumNameEndianness(Endianness e) +inline char const* EnumNameEndianness(Endianness e) { if (::flatbuffers::IsOutRange(e, Endianness_Little, Endianness_Big)) return ""; const size_t index = static_cast(e); @@ -652,7 +652,7 @@ struct NullBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -685,7 +685,7 @@ struct Struct_Builder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -715,7 +715,7 @@ struct ListBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -747,7 +747,7 @@ struct LargeListBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -780,7 +780,7 @@ struct 
ListViewBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -812,7 +812,7 @@ struct LargeListViewBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -851,7 +851,7 @@ struct FixedSizeListBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -916,7 +916,7 @@ struct MapBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -941,9 +941,9 @@ struct Union FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { { return static_cast(GetField(VT_MODE, 0)); } - const ::flatbuffers::Vector* typeIds() const + ::flatbuffers::Vector const* typeIds() const { - return GetPointer*>(VT_TYPEIDS); + return GetPointer<::flatbuffers::Vector const*>(VT_TYPEIDS); } bool Verify(::flatbuffers::Verifier& verifier) const { @@ -971,7 +971,7 @@ struct UnionBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -991,7 +991,7 @@ inline ::flatbuffers::Offset CreateUnion( inline ::flatbuffers::Offset CreateUnionDirect( ::flatbuffers::FlatBufferBuilder& _fbb, cudf::io::parquet::flatbuf::UnionMode mode = cudf::io::parquet::flatbuf::UnionMode_Sparse, - const std::vector* typeIds = nullptr) + std::vector const* typeIds = nullptr) { auto typeIds__ = typeIds ? _fbb.CreateVector(*typeIds) : 0; return cudf::io::parquet::flatbuf::CreateUnion(_fbb, mode, typeIds__); @@ -1027,7 +1027,7 @@ struct IntBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -1071,7 +1071,7 @@ struct FloatingPointBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -1105,7 +1105,7 @@ struct Utf8Builder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -1136,7 +1136,7 @@ struct BinaryBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -1168,7 +1168,7 @@ struct LargeUtf8Builder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -1200,7 +1200,7 @@ struct LargeBinaryBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -1237,7 +1237,7 @@ struct Utf8ViewBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -1274,7 +1274,7 @@ struct BinaryViewBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); 
auto o = ::flatbuffers::Offset(end); return o; } @@ -1312,7 +1312,7 @@ struct FixedSizeBinaryBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -1344,7 +1344,7 @@ struct BoolBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -1379,7 +1379,7 @@ struct RunEndEncodedBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -1437,7 +1437,7 @@ struct DecimalBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -1489,7 +1489,7 @@ struct DateBuilder { } ::flatbuffers::Offset Finish() { - const auto end = fbb_.EndTable(start_); + auto const end = fbb_.EndTable(start_); auto o = ::flatbuffers::Offset(end); return o; } @@ -1548,7 +1548,7 @@ struct TimeBuilder { } ::flatbuffers::Offset
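The Schema_generated.h hunks above rewrite `const char*` as `char const*` and `const auto` as `auto const`. A brief stand-alone check, not cudf code, confirming that the two spellings name identical types, so the rewrite is purely stylistic:

// Minimal sketch: "east const" changes only the spelling of a declaration;
// the assertions below verify at compile time that the types are the same.
#include <type_traits>

int main()
{
  static_assert(std::is_same_v<const char* const*, char const* const*>);
  static_assert(std::is_same_v<const int&, int const&>);

  const auto x = 42;  // deduces the same type...
  auto const y = 42;  // ...as this declaration
  static_assert(std::is_same_v<decltype(x), decltype(y)>);
  return x == y ? 0 : 1;
}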