move cmp around

apache · Jun 23, 2024 · de104e1 · de104e1
1 parent 5d835e9
commit de104e1
Show file tree

Hide file tree

Showing 3 changed files with 75 additions and 74 deletions.
diff --git a/arrow-array/src/array/byte_view_array.rs b/arrow-array/src/array/byte_view_array.rs
@@ -344,77 +344,6 @@ impl<T: ByteViewType + ?Sized> GenericByteViewArray<T> {
         builder.finish()
     }
 
-    /// Comparing two [`GenericByteViewArray`] at index `left_idx` and `right_idx`
-    pub fn compare(
-        left: &GenericByteViewArray<T>,
-        left_idx: usize,
-        right: &GenericByteViewArray<T>,
-        right_idx: usize,
-    ) -> std::cmp::Ordering {
-        assert!(left_idx < left.len());
-        assert!(right_idx < right.len());
-        unsafe { Self::compare_unchecked(left, left_idx, right, right_idx) }
-    }
-
-    /// Comparing two [`GenericByteViewArray`] at index `left_idx` and `right_idx`
-    ///
-    /// Comparing two ByteView types are non-trivial.
-    /// It takes a bit of patience to understand why we don't just compare two &[u8] directly.
-    ///
-    /// ByteView types give us the following two advantages, and we need to be careful not to lose them:
-    /// (1) For string/byte smaller than 12 bytes, the entire data is inlined in the view.
-    ///     Meaning that reading one array element requires only one memory access
-    ///     (two memory access required for StringArray, one for offset buffer, the other for value buffer).
-    ///
-    /// (2) For string/byte larger than 12 bytes, we can still be faster than (for certain operations) StringArray/ByteArray,
-    ///     thanks to the inlined 4 bytes.
-    ///     Consider equality check:
-    ///     If the first four bytes of the two strings are different, we can return false immediately (with just one memory access).
-    ///
-    /// If we directly compare two &[u8], we materialize the entire string (i.e., make multiple memory accesses), which might be unnecessary.
-    /// - Most of the time (eq, ord), we only need to look at the first 4 bytes to know the answer,
-    ///   e.g., if the inlined 4 bytes are different, we can directly return unequal without looking at the full string.
-    ///
-    /// # Order check flow
-    /// (1) if both string are smaller than 12 bytes, we can directly compare the data inlined to the view.
-    /// (2) if any of the string is larger than 12 bytes, we need to compare the full string.
-    ///     (2.1) if the inlined 4 bytes are different, we can return the result immediately.
-    ///     (2.2) o.w., we need to compare the full string.
-    ///
-    /// # Safety
-    /// The left/right_idx must within range of each array
-    pub unsafe fn compare_unchecked(
-        left: &GenericByteViewArray<T>,
-        left_idx: usize,
-        right: &GenericByteViewArray<T>,
-        right_idx: usize,
-    ) -> std::cmp::Ordering {
-        let l_view = left.views().get_unchecked(left_idx);
-        let l_len = *l_view as u32;
-
-        let r_view = right.views().get_unchecked(right_idx);
-        let r_len = *r_view as u32;
-
-        if l_len <= 12 && r_len <= 12 {
-            let l_data = unsafe { GenericByteViewArray::<T>::inline_value(l_view, l_len as usize) };
-            let r_data = unsafe { GenericByteViewArray::<T>::inline_value(r_view, r_len as usize) };
-            return l_data.cmp(r_data);
-        }
-
-        // one of the string is larger than 12 bytes,
-        // we then try to compare the inlined data first
-        let l_inlined_data = unsafe { GenericByteViewArray::<T>::inline_value(l_view, 4) };
-        let r_inlined_data = unsafe { GenericByteViewArray::<T>::inline_value(r_view, 4) };
-        if r_inlined_data != l_inlined_data {
-            return l_inlined_data.cmp(r_inlined_data);
-        }
-
-        // unfortunately, we need to compare the full data
-        let l_full_data: &[u8] = unsafe { left.value_unchecked(left_idx).as_ref() };
-        let r_full_data: &[u8] = unsafe { right.value_unchecked(right_idx).as_ref() };
-
-        l_full_data.cmp(r_full_data)
-    }
 }
 
 impl<T: ByteViewType + ?Sized> Debug for GenericByteViewArray<T> {

diff --git a/arrow-ord/src/cmp.rs b/arrow-ord/src/cmp.rs
@@ -559,13 +559,13 @@ impl<'a, T: ByteViewType> ArrayOrd for &'a GenericByteViewArray<T> {
             return false;
         }
 
-        unsafe { GenericByteViewArray::compare_unchecked(l.0, l.1, r.0, r.1).is_eq() }
+        unsafe { compare_byte_view_unchecked(l.0, l.1, r.0, r.1).is_eq() }
     }
 
     fn is_lt(l: Self::Item, r: Self::Item) -> bool {
         // # Safety
         // The index is within bounds as it is checked in value()
-        unsafe { GenericByteViewArray::<T>::compare_unchecked(l.0, l.1, r.0, r.1).is_lt() }
+        unsafe { compare_byte_view_unchecked(l.0, l.1, r.0, r.1).is_lt() }
     }
 
     fn len(&self) -> usize {
@@ -597,6 +597,78 @@ impl<'a> ArrayOrd for &'a FixedSizeBinaryArray {
     }
 }
 
+/// Compares the elements of two [`GenericByteViewArray`]s at index `left_idx` and `right_idx`
+pub fn compare_byte_view<T: ByteViewType>(
+    left: &GenericByteViewArray<T>,
+    left_idx: usize,
+    right: &GenericByteViewArray<T>,
+    right_idx: usize,
+) -> std::cmp::Ordering {
+    assert!(left_idx < left.len());
+    assert!(right_idx < right.len());
+    unsafe { compare_byte_view_unchecked(left, left_idx, right, right_idx) }
+}
+
+/// Compares the elements of two [`GenericByteViewArray`]s at index `left_idx` and `right_idx`
+///
+/// Comparing two ByteView values is non-trivial.
+/// It takes a bit of patience to understand why we don't just compare two &[u8] directly.
+///
+/// ByteView types give us the following two advantages, and we need to be careful not to lose them:
+/// (1) For strings/bytes of at most 12 bytes, the entire data is inlined in the view.
+///     This means that reading one array element requires only one memory access
+///     (two memory accesses are required for StringArray: one for the offset buffer, the other for the value buffer).
+///
+/// (2) For strings/bytes longer than 12 bytes, we can still be faster than StringArray/ByteArray (for certain operations),
+///     thanks to the inlined 4 bytes.
+///     Consider equality check:
+///     If the first four bytes of the two strings are different, we can return false immediately (with just one memory access).
+///
+/// If we directly compare two &[u8], we materialize the entire string (i.e., make multiple memory accesses), which might be unnecessary.
+/// - Most of the time (eq, ord), we only need to look at the first 4 bytes to know the answer,
+///   e.g., if the inlined 4 bytes are different, we can directly return unequal without looking at the full string.
+///
+/// # Order check flow
+/// (1) if both strings are at most 12 bytes long, we can directly compare the data inlined in the view.
+/// (2) if either string is longer than 12 bytes, we may need to compare the full string.
+///     (2.1) if the inlined 4 bytes are different, we can return the result immediately.
+///     (2.2) otherwise, we need to compare the full string.
+///
+/// # Safety
+/// `left_idx` and `right_idx` must be within the bounds of `left` and `right`, respectively
+pub unsafe fn compare_byte_view_unchecked<T: ByteViewType>(
+    left: &GenericByteViewArray<T>,
+    left_idx: usize,
+    right: &GenericByteViewArray<T>,
+    right_idx: usize,
+) -> std::cmp::Ordering {
+    let l_view = left.views().get_unchecked(left_idx);
+    let l_len = *l_view as u32;
+
+    let r_view = right.views().get_unchecked(right_idx);
+    let r_len = *r_view as u32;
+
+    if l_len <= 12 && r_len <= 12 {
+        let l_data = unsafe { GenericByteViewArray::<T>::inline_value(l_view, l_len as usize) };
+        let r_data = unsafe { GenericByteViewArray::<T>::inline_value(r_view, r_len as usize) };
+        return l_data.cmp(r_data);
+    }
+
+    // at least one of the strings is longer than 12 bytes,
+    // so we first try to compare the inlined 4-byte prefixes
+    let l_inlined_data = unsafe { GenericByteViewArray::<T>::inline_value(l_view, 4) };
+    let r_inlined_data = unsafe { GenericByteViewArray::<T>::inline_value(r_view, 4) };
+    if r_inlined_data != l_inlined_data {
+        return l_inlined_data.cmp(r_inlined_data);
+    }
+
+    // unfortunately, we need to compare the full data
+    let l_full_data: &[u8] = unsafe { left.value_unchecked(left_idx).as_ref() };
+    let r_full_data: &[u8] = unsafe { right.value_unchecked(right_idx).as_ref() };
+
+    l_full_data.cmp(r_full_data)
+}
+
 #[cfg(test)]
 mod tests {
     use std::sync::Arc;

diff --git a/arrow-ord/src/ord.rs b/arrow-ord/src/ord.rs
@@ -146,7 +146,7 @@ fn compare_byte_view<T: ByteViewType>(
     let l = left.clone();
     let r = right.clone();
     compare(left, right, opts, move |i, j| {
-        GenericByteViewArray::compare(&l, i, &r, j)
+        crate::cmp::compare_byte_view(&l, i, &r, j)
     })
 }