Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

avoid copying listarray in unset exec #7002

Closed
wants to merge 4 commits into from
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
205 changes: 147 additions & 58 deletions datafusion/core/src/physical_plan/unnest.rs
Original file line number Diff line number Diff line change
Expand Up @@ -18,8 +18,8 @@
//! Defines the unnest column plan for unnesting values in a column that contains a list
//! type, conceptually is like joining each row with all the values in the list column.
use arrow::array::{
new_null_array, Array, ArrayAccessor, ArrayRef, ArrowPrimitiveType,
FixedSizeListArray, Int32Array, LargeListArray, ListArray, PrimitiveArray,
Array, ArrayAccessor, ArrayRef, ArrowPrimitiveType, FixedSizeListArray, Int32Array,
LargeListArray, ListArray, PrimitiveArray,
};
use arrow::compute::kernels;
use arrow::datatypes::{
Expand Down Expand Up @@ -236,21 +236,21 @@ fn build_batch(
match list_array.data_type() {
DataType::List(_) => {
let list_array = list_array.as_any().downcast_ref::<ListArray>().unwrap();
unnest_batch(batch, schema, column, &list_array)
unnest_batch(batch, schema, column, &list_array, list_array.values())
Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

.values seems to not have a common trait so it needs to be passed down here where we have the concrete types

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Yes, this makes sense

}
DataType::LargeList(_) => {
let list_array = list_array
.as_any()
.downcast_ref::<LargeListArray>()
.unwrap();
unnest_batch(batch, schema, column, &list_array)
unnest_batch(batch, schema, column, &list_array, list_array.values())
}
DataType::FixedSizeList(_, _) => {
let list_array = list_array
.as_any()
.downcast_ref::<FixedSizeListArray>()
.unwrap();
unnest_batch(batch, schema, column, list_array)
unnest_batch(batch, schema, column, list_array, list_array.values())
}
_ => Err(DataFusionError::Execution(format!(
"Invalid unnest column {column}"
Expand All @@ -263,43 +263,27 @@ fn unnest_batch<T>(
schema: &SchemaRef,
column: &Column,
list_array: &T,
list_array_values: &Arc<dyn Array>,
) -> Result<RecordBatch>
where
T: ArrayAccessor<Item = ArrayRef>,
{
// Create an array with the unnested values of the list array, given the list
// array:
//
// [1], null, [2, 3, 4], null, [5, 6]
//
// the result array is:
//
// 1, null, 2, 3, 4, null, 5, 6
//
let unnested_array = unnest_array(list_array)?;

// Create an array with the lengths of each list value in the nested array.
// Given the nested array:
//
// [1], null, [2, 3, 4], null, [5, 6]
//
// the result array is:
//
// 1, null, 3, null, 2
//
// Depending on the list type the result may be Int32Array or Int64Array.
let list_lengths = list_lengths(list_array)?;

// Create the indices for the take kernel and then use those indices to create
// the unnested record batch.
match list_lengths.data_type() {
DataType::Int32 => {
let list_lengths = as_primitive_array::<Int32Type>(&list_lengths)?;
let unnested_array =
unnest_array(list_array, list_array_values, list_lengths)?;
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I am still struggling to understand the need to call unnest_array and why the take indexes can't be calculated directly against the original values array.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Can you clarify which take indices you mean?
The ones that were already on main were used to expand the rest of the columns (their values and not the one that is unnested).

So unnest_array is simply needed as we need to change that column (physically unnest it).
The take indices for the rest of the columns could be calculated based on the values array, it was perhaps prettier to have this intermediate state initially. I can try and get rid of list_sizes all together.

let indices = create_take_indices(list_lengths, unnested_array.len());
batch_from_indices(batch, schema, column.index(), &unnested_array, &indices)
}
DataType::Int64 => {
let list_lengths = as_primitive_array::<Int64Type>(&list_lengths)?;
let unnested_array =
unnest_array(list_array, list_array_values, list_lengths)?;
let indices = create_take_indices(list_lengths, unnested_array.len());
batch_from_indices(batch, schema, column.index(), &unnested_array, &indices)
}
Expand Down Expand Up @@ -357,14 +341,67 @@ where
builder.finish()
}

/// Creates take indices for unnesting the values of a [`FixedSizeListArray`].
///
/// In a `FixedSizeListArray` the underlying values array always holds
/// `value_length` slots per row, even for null rows, so the indices for row
/// `r` start at `r * value_length`. A null row contributes a single null
/// index so the unnested column keeps one null entry for it.
fn create_fixed_size_unnest_take_indices<T>(
    list_lengths: &PrimitiveArray<T>,
    value_length: usize,
) -> PrimitiveArray<T>
where
    T: ArrowPrimitiveType,
{
    // Each non-null row yields `value_length` indices and each null row
    // yields exactly one null entry, so reserve room for both up front.
    let non_null_rows = list_lengths.len() - list_lengths.null_count();
    let capacity = non_null_rows * value_length + list_lengths.null_count();
    let mut builder = PrimitiveArray::<T>::builder(capacity);

    for row in 0..list_lengths.len() {
        if list_lengths.is_null(row) {
            builder.append_null();
        } else {
            let fixed_length_offset = row * value_length;
            // The indices are non-negative integers, so `from_usize` cannot fail.
            (fixed_length_offset..fixed_length_offset + value_length).for_each(|r| {
                let index = T::Native::from_usize(r).unwrap();
                builder.append_value(index);
            });
        }
    }

    builder.finish()
}

/// Creates take indices for unnesting the values of a [`ListArray`] /
/// [`LargeListArray`], whose values array omits null rows entirely.
///
/// Consecutive non-null rows map to consecutive positions in the values
/// array; a null row emits a single null index so the unnested column keeps
/// one null entry for it.
fn create_unnest_take_indices<T>(
    list_lengths: &PrimitiveArray<T>,
    capacity: usize,
) -> PrimitiveArray<T>
where
    T: ArrowPrimitiveType,
{
    let mut builder = PrimitiveArray::<T>::builder(capacity);
    let mut next_value = 0_usize;

    for row in 0..list_lengths.len() {
        if list_lengths.is_null(row) {
            builder.append_null();
            continue;
        }
        // Lengths are non-negative, so the usize conversion cannot fail.
        let run = list_lengths.value(row).to_usize().unwrap();
        for offset in next_value..next_value + run {
            // Indices are non-negative integers, so `from_usize` cannot fail.
            builder.append_value(T::Native::from_usize(offset).unwrap());
        }
        next_value += run;
    }

    builder.finish()
}

/// Create the final batch given the unnested column array and a `indices` array
/// that is used by the take kernel to copy values.
///
/// For example if we have the following `RecordBatch`:
///
/// ```ignore
/// c1: [1], null, [2, 3, 4], null, [5, 6]
/// c2: 'a', 'b', 'c', null, 'd'
/// c2: 'a', 'b', 'c', null, 'd'
/// ```
///
/// then the `unnested_array` contains the unnest column that will replace `c1` in
Expand Down Expand Up @@ -425,43 +462,61 @@ where
/// ```ignore
/// 1, null, 2, 3, 4, null, 5, 6
/// ```
fn unnest_array<T>(list_array: &T) -> Result<Arc<dyn Array + 'static>>
///
/// For [`DataType::FixedSizeList`] the values array will look like:
///
/// ```ignore
/// 1, 2, 3, null, null, null, 4, 5, 6
/// ```
///
/// While the other cases will omit nulls from the values array:
///
/// ```ignore
/// 1, 2, 3, 4, 5, 6
/// ```
/// Therefore we calculate take indices based on the underlying datatype.
///
fn unnest_array<T, P>(
list_array: &T,
list_array_values: &Arc<dyn Array>,
list_lengths: &PrimitiveArray<P>,
) -> Result<Arc<dyn Array + 'static>>
where
T: ArrayAccessor<Item = ArrayRef>,
P: ArrowPrimitiveType,
{
let elem_type = match list_array.data_type() {
DataType::List(f) | DataType::FixedSizeList(f, _) | DataType::LargeList(f) => {
f.data_type()
}
dt => {
return Err(DataFusionError::Execution(format!(
"Cannot unnest array of type {dt}"
)))
}
};

let null_row = new_null_array(elem_type, 1);

// Create a vec of ArrayRef from the list elements.
let arrays = (0..list_array.len())
.map(|row| {
if list_array.is_null(row) {
null_row.clone()
} else {
list_array.value(row)
if list_array.null_count() == 0 {
Ok(list_array_values.clone())
} else {
// For `FixedSizeList` the values array contains fixed length arrays, even if there are null values.
// Therefor we need to calculate take indices accordingly.
match list_array.data_type() {
DataType::FixedSizeList(_, value_length) => {
let take_indices = create_fixed_size_unnest_take_indices(
list_lengths,
*value_length as usize,
);
Ok(kernels::take::take(list_array_values, &take_indices, None)?)
}
})
.collect::<Vec<_>>();

// Create Vec<&dyn Array> from Vec<Arc<dyn Array>> for `concat`. Calling
// `as_ref()` in the `map` above causes the borrow checker to complain.
let arrays = arrays.iter().map(|a| a.as_ref()).collect::<Vec<_>>();

Ok(kernels::concat::concat(&arrays)?)
_ => {
let capacity = list_array_values.len() + list_array.null_count();
let take_indices = create_unnest_take_indices(list_lengths, capacity);
Ok(kernels::take::take(list_array_values, &take_indices, None)?)
}
}
}
}

/// Returns an array with the lengths of each list in `list_array`. Returns null
/// for a null value.
// Create an array with the lengths of each list value in the nested array.
// Given the nested array:
//
// [1], null, [2, 3, 4], null, [5, 6]
//
// the result array is:
//
// 1, null, 3, null, 2
//
// Depending on the list type the result may be Int32Array or Int64Array.
fn list_lengths<T>(list_array: &T) -> Result<Arc<dyn Array + 'static>>
where
T: ArrayAccessor<Item = ArrayRef>,
Expand Down Expand Up @@ -489,3 +544,37 @@ where
))),
}
}

#[cfg(test)]
mod tests {

    use super::*;

    #[test]
    fn calculate_unnest_take_indices() {
        // Lengths [3, null, 1, null, 2, null] over 6 underlying values:
        // each null row must yield exactly one null slot in the indices.
        let lengths = PrimitiveArray::<Int32Type>::from(vec![
            Some(3),
            None,
            Some(1),
            None,
            Some(2),
            None,
        ]);

        let actual = create_unnest_take_indices(&lengths, 9);

        let expected = PrimitiveArray::<Int32Type>::from(vec![
            Some(0),
            Some(1),
            Some(2),
            None,
            Some(3),
            None,
            Some(4),
            Some(5),
            None,
        ]);

        assert_eq!(expected, actual)
    }
}
66 changes: 66 additions & 0 deletions datafusion/core/tests/dataframe/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -1114,6 +1114,72 @@ async fn unnest_fixed_list() -> Result<()> {
Ok(())
}

#[tokio::test]
async fn unnest_fixed_list_nonull() -> Result<()> {
    // Build a batch of 6 shapes, each with exactly two non-null tags.
    let mut ids = UInt32Builder::new();
    let mut tags = FixedSizeListBuilder::new(StringBuilder::new(), 2);

    for idx in 0..6 {
        ids.append_value(idx as u32 + 1);
        tags.values().append_value(format!("tag{}1", idx + 1));
        tags.values().append_value(format!("tag{}2", idx + 1));
        tags.append(true);
    }

    let batch = RecordBatch::try_from_iter(vec![
        ("shape_id", Arc::new(ids.finish()) as ArrayRef),
        ("tags", Arc::new(tags.finish()) as ArrayRef),
    ])?;

    let ctx = SessionContext::new();
    ctx.register_batch("shapes", batch)?;
    let df = ctx.table("shapes").await?;

    // Sanity-check the table before unnesting.
    let results = df.clone().collect().await?;
    let expected = vec![
        "+----------+----------------+",
        "| shape_id | tags |",
        "+----------+----------------+",
        "| 1 | [tag11, tag12] |",
        "| 2 | [tag21, tag22] |",
        "| 3 | [tag31, tag32] |",
        "| 4 | [tag41, tag42] |",
        "| 5 | [tag51, tag52] |",
        "| 6 | [tag61, tag62] |",
        "+----------+----------------+",
    ];
    assert_batches_sorted_eq!(expected, &results);

    // After unnesting, each shape id appears once per tag.
    let results = df.unnest_column("tags")?.collect().await?;
    let expected = vec![
        "+----------+-------+",
        "| shape_id | tags |",
        "+----------+-------+",
        "| 1 | tag11 |",
        "| 1 | tag12 |",
        "| 2 | tag21 |",
        "| 2 | tag22 |",
        "| 3 | tag31 |",
        "| 3 | tag32 |",
        "| 4 | tag41 |",
        "| 4 | tag42 |",
        "| 5 | tag51 |",
        "| 5 | tag52 |",
        "| 6 | tag61 |",
        "| 6 | tag62 |",
        "+----------+-------+",
    ];
    assert_batches_sorted_eq!(expected, &results);

    Ok(())
}

#[tokio::test]
async fn unnest_aggregate_columns() -> Result<()> {
const NUM_ROWS: usize = 5;
Expand Down