Row-group-level partitioning for Parquet #9849

Closed. Wants to merge 11 commits.
48 changes: 48 additions & 0 deletions cpp/include/cudf/io/parquet.hpp
@@ -405,6 +405,8 @@ class parquet_writer_options {
size_t _row_group_size_bytes = default_row_group_size_bytes;
// Maximum number of rows in row group (unless smaller than a single page)
size_type _row_group_size_rows = default_row_group_size_rows;
// Number of rows in each row group
std::vector<size_type> _row_group_sizes;

/**
* @brief Constructor from sink and table.
@@ -489,6 +491,11 @@ class parquet_writer_options {
*/
auto get_row_group_size_rows() const { return _row_group_size_rows; }

/**
* @brief Returns the number of rows in each row group.
*/
auto get_row_group_sizes() const { return _row_group_sizes; }

/**
* @brief Sets metadata.
*
@@ -549,6 +556,11 @@ class parquet_writer_options {
"The maximum row group size cannot be smaller than the page size, which is 5000 rows.");
_row_group_size_rows = size_rows;
}

/**
* @brief Sets the number of rows in each row group.
*
* @param sizes_rows Number of rows in each row group
*/
void set_row_group_sizes(std::vector<size_type> sizes_rows) { _row_group_sizes = std::move(sizes_rows); }
};

class parquet_writer_options_builder {
@@ -645,6 +657,18 @@ class parquet_writer_options_builder {
return *this;
}

/**
* @brief Sets the number of rows in each output row group.
*
* @param val number of rows in each row group
* @return this for chaining.
*/
parquet_writer_options_builder& row_group_sizes(std::vector<size_type> val)
{
options.set_row_group_sizes(std::move(val));
return *this;
}

/**
* @brief Sets whether int96 timestamps are written or not in parquet_writer_options.
*
@@ -727,6 +751,8 @@ class chunked_parquet_writer_options {
size_t _row_group_size_bytes = default_row_group_size_bytes;
// Maximum number of rows in row group (unless smaller than a single page)
size_type _row_group_size_rows = default_row_group_size_rows;
// Number of rows in each row group
std::vector<size_type> _row_group_sizes;

/**
* @brief Constructor from sink.
@@ -780,6 +806,11 @@ class chunked_parquet_writer_options {
*/
auto get_row_group_size_rows() const { return _row_group_size_rows; }

/**
* @brief Returns the number of rows in each row group.
*/
auto get_row_group_sizes() const { return _row_group_sizes; }

/**
* @brief Sets metadata.
*
@@ -831,6 +862,11 @@ class chunked_parquet_writer_options {
_row_group_size_rows = size_rows;
}

/**
* @brief Sets the number of rows in each row group.
*
* @param sizes_rows Number of rows in each row group
*/
void set_row_group_sizes(std::vector<size_type> sizes_rows) { _row_group_sizes = std::move(sizes_rows); }

/**
* @brief creates builder to build chunked_parquet_writer_options.
*
@@ -934,6 +970,18 @@ class chunked_parquet_writer_options_builder {
return *this;
}

/**
* @brief Sets the number of rows in each output row group.
*
* @param val number of rows in each row group
* @return this for chaining.
*/
chunked_parquet_writer_options_builder& row_group_sizes(std::vector<size_type> val)
{
options.set_row_group_sizes(std::move(val));
return *this;
}

/**
* @brief move chunked_parquet_writer_options member once it's built.
*/
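For context, a minimal usage sketch of the new builder option (the file name, table, and row-group split below are illustrative only, not taken from this PR):

#include <cudf/io/parquet.hpp>
#include <cudf/table/table_view.hpp>

#include <vector>

// Hypothetical example: write a 10000-row table as three row groups of
// 2000, 3000, and 5000 rows rather than uniformly sized groups.
void write_with_row_groups(cudf::table_view const& table)
{
  auto sink = cudf::io::sink_info{"partitioned.parquet"};
  auto opts = cudf::io::parquet_writer_options::builder(sink, table)
                .row_group_sizes(std::vector<cudf::size_type>{2000, 3000, 5000})
                .build();
  cudf::io::write_parquet(opts);
}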
30 changes: 18 additions & 12 deletions cpp/src/io/parquet/chunk_dict.cu
@@ -95,16 +95,18 @@ struct map_find_fn {
template <int block_size>
__global__ void __launch_bounds__(block_size, 1)
populate_chunk_hash_maps_kernel(cudf::detail::device_2dspan<EncColumnChunk> chunks,
cudf::detail::device_2dspan<PageFragment> fragments,
size_type num_rows)
{
auto col_idx = blockIdx.y;
auto block_x = blockIdx.x;
auto t = threadIdx.x;

auto start_row =
block_x *
max_page_fragment_size; // This is fragment size. all chunks are multiple of these many rows.
size_type end_row = min(start_row + max_page_fragment_size, num_rows);
auto start_row = 0;
for (auto i = 0; i < block_x; i++) {
start_row += fragments[0][i].num_rows;
}
Comment on lines +105 to +108
Contributor:

Perhaps these offsets should be pre-computed with a scan and then passed into the kernel? I'm not sure how many row groups we expect. The difference between 10 and 1M would indicate whether this should be a host or device computation.

If we shouldn't use a scan and pass in the precomputed offsets, then this could use std::accumulate. Might look something like this snippet (untested):

Suggested change
-  auto start_row = 0;
-  for (auto i = 0; i < block_x; i++) {
-    start_row += fragments[0][i].num_rows;
-  }
+  auto row_counter = thrust::transform_iterator(fragments[0], [] __device__(auto const& page) { return page.num_rows; });
+  auto start_row   = std::accumulate(row_counter[0], row_counter[block_x], 0);

(Note: page might not be the right name for the function argument, I am just guessing from device_2dspan<PageFragment>)

Contributor:

Do you mean like this:

size_type start_row = frag.start_row;

Contributor:

@devavret Looks about right! I'm just trying to avoid a loop on each thread when we could use a single-pass scan ahead of time. I see you've worked on this in #9810. That logic should be used here. Does #9810 need to be merged first?

Contributor:

> Does #9810 need to be merged first?

Actually, that's what I was wondering just now. #9810 is close to completion and if it is merged first, then there will be many merge issues with this PR. I'm fine with merging #9810 later or taking over this one if it remains unmerged due to merge issues.

cc @quasiben @vuule

Contributor:

@devavret do you have an ETA for addressing current comments on #9810?

Contributor:

My 2 cents:
Let's aim to merge this first so Caleb has a chance to get the PR as close to the finish line as possible. If #9810 already addresses some comments here, maybe those pieces can be applied to this PR (which also reduces merge conflicts).

I'm not sure what the best approach is; I'm inclined to leave the decision up to @devavret and @calebwin.

Contributor (Author):

Thanks @bdice @hyperbolic2346 @devavret @vuule for reviews and comments. I just ran into a subtle CUDA bug in this PR when I was in the middle of writing a benchmark. I looked through #9810 and it looks like there are changes in the CUDA code that may handle edge cases I didn't consider here.

So I'm going to go ahead and try to merge #9810 into this and make appropriate changes. I will see if that resolves the issue I came across when benchmarking. I will then try to address other reviews here.

Should I convert this PR to draft in the meantime?

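For reference, the scan-based pre-pass discussed in this thread might look like the sketch below. It is untested, and frag_ptr/num_fragments are assumed stand-ins for the device storage behind fragments[0]; the kernel would then read its offset as frag_start_rows[block_x] instead of looping:

#include <cudf/types.hpp>
#include <rmm/cuda_stream_view.hpp>
#include <rmm/device_uvector.hpp>
#include <rmm/exec_policy.hpp>
#include <thrust/iterator/transform_iterator.h>
#include <thrust/scan.h>

// Sketch: compute each fragment's starting row once with an exclusive scan,
// so every thread block can look up its offset in O(1).
rmm::device_uvector<cudf::size_type> compute_frag_start_rows(
  PageFragment const* frag_ptr,   // assumed: device pointer to fragments[0]
  cudf::size_type num_fragments,  // assumed: fragments.size().second
  rmm::cuda_stream_view stream)
{
  rmm::device_uvector<cudf::size_type> frag_start_rows(num_fragments, stream);
  auto row_counts = thrust::make_transform_iterator(
    frag_ptr, [] __device__(PageFragment const& f) { return f.num_rows; });
  thrust::exclusive_scan(rmm::exec_policy(stream),
                         row_counts,
                         row_counts + num_fragments,
                         frag_start_rows.begin());
  return frag_start_rows;
}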
size_type end_row = min(start_row + fragments[0][block_x].num_rows, num_rows);

__shared__ EncColumnChunk* s_chunk;
__shared__ parquet_column_device_view s_col;
@@ -245,14 +247,18 @@ __global__ void __launch_bounds__(block_size, 1)
template <int block_size>
__global__ void __launch_bounds__(block_size, 1)
get_dictionary_indices_kernel(cudf::detail::device_2dspan<EncColumnChunk> chunks,
cudf::detail::device_2dspan<PageFragment> fragments,
size_type num_rows)
{
auto col_idx = blockIdx.y;
auto block_x = blockIdx.x;
auto t = threadIdx.x;

size_type start_row = block_x * max_page_fragment_size;
size_type end_row = min(start_row + max_page_fragment_size, num_rows);
auto start_row = 0;
for (auto i = 0; i < block_x; i++) {
start_row += fragments[0][i].num_rows;
}
Comment on lines +257 to +260
Contributor:

Same as previous comment.

size_type end_row = min(start_row + fragments[0][block_x].num_rows, num_rows);

__shared__ EncColumnChunk s_chunk;
__shared__ parquet_column_device_view s_col;
@@ -335,16 +341,16 @@ void initialize_chunk_hash_maps(device_span<EncColumnChunk> chunks, rmm::cuda_st
}

void populate_chunk_hash_maps(cudf::detail::device_2dspan<EncColumnChunk> chunks,
cudf::detail::device_2dspan<PageFragment> fragments,
size_type num_rows,
rmm::cuda_stream_view stream)
{
constexpr int block_size = 256;
auto const grid_x = cudf::detail::grid_1d(num_rows, max_page_fragment_size);
auto const num_columns = chunks.size().second;
dim3 const dim_grid(grid_x.num_blocks, num_columns);
dim3 const dim_grid(fragments.size().second, num_columns);

populate_chunk_hash_maps_kernel<block_size>
<<<dim_grid, block_size, 0, stream.value()>>>(chunks, num_rows);
<<<dim_grid, block_size, 0, stream.value()>>>(chunks, fragments, num_rows);
}

void collect_map_entries(device_span<EncColumnChunk> chunks, rmm::cuda_stream_view stream)
@@ -354,16 +360,16 @@ void collect_map_entries(device_span<EncColumnChunk> chunks, rmm::cuda_stream_vi
}

void get_dictionary_indices(cudf::detail::device_2dspan<EncColumnChunk> chunks,
cudf::detail::device_2dspan<PageFragment> fragments,
size_type num_rows,
rmm::cuda_stream_view stream)
{
constexpr int block_size = 256;
auto const grid_x = cudf::detail::grid_1d(num_rows, max_page_fragment_size);
auto const num_columns = chunks.size().second;
dim3 const dim_grid(grid_x.num_blocks, num_columns);
dim3 const dim_grid(fragments.size().second, num_columns);

get_dictionary_indices_kernel<block_size>
<<<dim_grid, block_size, 0, stream.value()>>>(chunks, num_rows);
<<<dim_grid, block_size, 0, stream.value()>>>(chunks, fragments, num_rows);
}
} // namespace gpu
} // namespace parquet
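To make the new launch geometry concrete: with user-specified row groups of, say, 2000, 3000, and 5000 rows and a four-column table, these launches now use a 3 x 4 grid, one block per (fragment, column) pair, instead of deriving the x-dimension from num_rows and the fixed max_page_fragment_size. An illustrative sketch (the counts are made up):

// Three user-sized fragments, four columns (illustrative values only).
auto const num_fragments = fragments.size().second;  // 3 row groups
auto const num_columns   = chunks.size().second;     // 4 columns
dim3 const dim_grid(num_fragments, num_columns);     // 3 x 4 thread blocks
populate_chunk_hash_maps_kernel<block_size>
  <<<dim_grid, block_size, 0, stream.value()>>>(chunks, fragments, num_rows);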
12 changes: 8 additions & 4 deletions cpp/src/io/parquet/page_enc.cu
@@ -112,7 +112,7 @@ template <int block_size>
__global__ void __launch_bounds__(block_size)
gpuInitPageFragments(device_2dspan<PageFragment> frag,
device_span<parquet_column_device_view const> col_desc,
uint32_t fragment_size,
int32_t fragment_size,
uint32_t max_num_rows)
{
__shared__ __align__(16) frag_init_state_s state_g;
@@ -130,7 +130,11 @@ __global__ void __launch_bounds__(block_size)
if (!t) {
// frag.num_rows = fragment_size except for the last page fragment which can be smaller.
// num_rows is fixed but fragment size could be larger if the data is strings or nested.
s->frag.num_rows = min(fragment_size, max_num_rows - min(start_row, max_num_rows));
if (fragment_size != -1) {
s->frag.num_rows = min(fragment_size, max_num_rows - min(start_row, max_num_rows));
} else {
s->frag.num_rows = frag[blockIdx.x][blockIdx.y].num_rows;
}
Comment on lines +133 to +137
Contributor:

Suggested change
-  if (fragment_size != -1) {
-    s->frag.num_rows = min(fragment_size, max_num_rows - min(start_row, max_num_rows));
-  } else {
-    s->frag.num_rows = frag[blockIdx.x][blockIdx.y].num_rows;
-  }
+  s->frag.num_rows = fragment_size != -1
+                       ? min(fragment_size, max_num_rows - min(start_row, max_num_rows))
+                       : frag[blockIdx.x][blockIdx.y].num_rows;

s->frag.num_dict_vals = 0;
s->frag.fragment_data_size = 0;
s->frag.dict_data_size = 0;
@@ -1938,13 +1942,13 @@ dremel_data get_dremel_data(column_view h_col,
*
* @param[in,out] frag Fragment array [column_id][fragment_id]
* @param[in] col_desc Column description array [column_id]
* @param[in] num_fragments Number of fragments per column
* @param[in] fragment_size Number of rows per fragment, or -1 if fragment sizes are already specified
* @param[in] num_columns Number of columns
* @param[in] stream CUDA stream to use, default 0
*/
void InitPageFragments(device_2dspan<PageFragment> frag,
device_span<parquet_column_device_view const> col_desc,
uint32_t fragment_size,
int32_t fragment_size,
hyperbolic2346 marked this conversation as resolved.
uint32_t num_rows,
rmm::cuda_stream_view stream)
{
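To make the -1 sentinel concrete: when per-row-group sizes are in effect, the host side is expected to pre-fill each fragment's num_rows before the launch, so the kernel's else branch simply keeps those values. A sketch of that pre-fill, with hypothetical names (h_frags, row_group_sizes) and the host-to-device copy elided:

// Sketch: seed fragment row counts from the user-specified row-group sizes,
// then launch with fragment_size == -1 so gpuInitPageFragments keeps the
// pre-filled num_rows instead of deriving it from a fixed fragment size.
std::vector<PageFragment> h_frags(row_group_sizes.size());
for (std::size_t i = 0; i < row_group_sizes.size(); ++i) {
  h_frags[i].num_rows = row_group_sizes[i];
}
// ... copy h_frags into the device-side `frag` array for each column ...
InitPageFragments(frag, col_desc, /*fragment_size=*/-1, num_rows, stream);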
6 changes: 4 additions & 2 deletions cpp/src/io/parquet/parquet_gpu.hpp
@@ -463,13 +463,13 @@ dremel_data get_dremel_data(column_view h_col,
* @param[in] col_desc Column description array [column_id]
* @param[in] num_fragments Number of fragments per column
* @param[in] num_columns Number of columns
* @param[in] fragment_size Number of rows per fragment
* @param[in] fragment_size Number of rows per fragment, or -1 if fragment sizes are already specified
* @param[in] num_rows Number of rows per column
* @param[in] stream CUDA stream to use
*/
void InitPageFragments(cudf::detail::device_2dspan<PageFragment> frag,
device_span<parquet_column_device_view const> col_desc,
uint32_t fragment_size,
int32_t fragment_size,
uint32_t num_rows,
rmm::cuda_stream_view stream);

@@ -502,6 +502,7 @@ void initialize_chunk_hash_maps(device_span<EncColumnChunk> chunks, rmm::cuda_st
* @param stream CUDA stream to use
*/
void populate_chunk_hash_maps(cudf::detail::device_2dspan<EncColumnChunk> chunks,
cudf::detail::device_2dspan<PageFragment> fragments,
size_type num_rows,
rmm::cuda_stream_view stream);

@@ -527,6 +528,7 @@ void collect_map_entries(device_span<EncColumnChunk> chunks, rmm::cuda_stream_vi
* @param stream CUDA stream to use
*/
void get_dictionary_indices(cudf::detail::device_2dspan<EncColumnChunk> chunks,
cudf::detail::device_2dspan<PageFragment> fragments,
size_type num_rows,
rmm::cuda_stream_view stream);
