rapidsai · rapids-bot · Mar 4, 2021 · Feb 23, 2021 · Feb 23, 2021 · Feb 24, 2021
@@ -0,0 +1,21 @@
+# Copyright (c) 2021, NVIDIA CORPORATION.
+
+from cudf._lib.cpp.column.column cimport column
+from cudf._lib.cpp.column.column_view cimport column_view
+from cudf._lib.cpp.types cimport data_type
+
+from libcpp.memory cimport unique_ptr
+
+# Cython declarations for the C++ functions found in libcudf's
+# "cudf/strings/convert/convert_fixed_point.hpp" header (namespace
+# cudf::strings).  The whole block is declared `nogil`, so these functions
+# may be called with the GIL released, and each one is marked `except +` so
+# that a thrown C++ exception is translated into a Python exception.
+cdef extern from "cudf/strings/convert/convert_fixed_point.hpp" namespace \
+        "cudf::strings" nogil:
+    # Takes a column view and the target data_type; returns a newly owned
+    # column.  Presumably parses strings into fixed-point values -- confirm
+    # against the libcudf header.
+    cdef unique_ptr[column] to_fixed_point(
+        column_view input_col,
+        data_type output_type) except +
+
+    # Takes a column view only; returns a newly owned column.  Presumably the
+    # inverse conversion (fixed-point values rendered as strings).
+    cdef unique_ptr[column] from_fixed_point(
+        column_view input_col) except +
+
+    # Takes a column view and a data_type; returns a newly owned column.
+    # Presumably a per-row validity check for conversion to `output_type`.
+    cdef unique_ptr[column] is_fixed_point(
+        column_view source_strings,
+        data_type output_type
+    ) except +
diff --git a/python/cudf/cudf/_lib/string_casting.pyx b/python/cudf/cudf/_lib/string_casting.pyx
@@ -1,4 +1,4 @@
-# Copyright (c) 2020, NVIDIA CORPORATION.
+# Copyright (c) 2020-2021, NVIDIA CORPORATION.
 
 import numpy as np
 
@@ -7,6 +7,7 @@ from cudf._lib.scalar import as_device_scalar
 from cudf._lib.scalar cimport DeviceScalar
 from cudf._lib.types import np_to_cudf_types
 from cudf._lib.types cimport underlying_type_t_type_id
+from cudf._lib.cpp.types cimport DECIMAL64
 
 from cudf.core.column.column import as_column
 
@@ -45,6 +46,11 @@ from cudf._lib.cpp.strings.convert.convert_durations cimport (
     to_durations as cpp_to_durations,
     from_durations as cpp_from_durations
 )
+from cudf._lib.cpp.strings.convert.convert_fixed_point cimport (
+    to_fixed_point as cpp_to_fixed_point,
+    from_fixed_point as cpp_from_fixed_point,
+    is_fixed_point as cpp_is_fixed_point
+)
 from cudf._lib.cpp.types cimport (
     type_id,
     data_type,
@@ -771,3 +777,48 @@ def is_hex(Column source_strings):
         ))
 
     return Column.from_unique_ptr(move(c_result))
+
+
+def from_decimal(Column input_col):
+    """
+    Converts the fixed-point values of `input_col` into a new Column
+    by calling libcudf's `from_fixed_point`.
+    """
+    cdef unique_ptr[column] c_strings
+    cdef column_view decimal_view = input_col.view()
+    with nogil:
+        c_strings = move(cpp_from_fixed_point(decimal_view))
+
+    return Column.from_unique_ptr(move(c_strings))
+
+
+def to_decimal(Column input_col, object out_type):
+    """
+    Converts `input_col` into a DECIMAL64 Column by calling libcudf's
+    `to_fixed_point`.
+
+    `out_type` must expose `scale` and `precision` attributes. The
+    scale is negated before being passed to libcudf, and the precision
+    is copied onto the dtype of the returned Column.
+    """
+    cdef unique_ptr[column] c_decimals
+    cdef column_view strings_view = input_col.view()
+    cdef int py_scale = out_type.scale
+    # libcudf is handed the negated Python-side scale.
+    cdef data_type c_decimal_type = data_type(DECIMAL64, -py_scale)
+    with nogil:
+        c_decimals = move(cpp_to_fixed_point(strings_view, c_decimal_type))
+
+    decimal_col = Column.from_unique_ptr(move(c_decimals))
+    decimal_col.dtype.precision = out_type.precision
+    return decimal_col
+
+
+def is_fixed_point(Column input_col, object out_type):
+    """
+    Returns a Column of boolean values that is True for each entry of
+    `input_col` made up of fixed-point characters.
+
+    `out_type` must expose a `scale` attribute; its negated value is
+    used to build the DECIMAL64 type passed to libcudf.
+    """
+    cdef column_view strings_view = input_col.view()
+    cdef int py_scale = out_type.scale
+    cdef data_type c_decimal_type = data_type(DECIMAL64, -py_scale)
+    cdef unique_ptr[column] c_flags
+    with nogil:
+        c_flags = move(cpp_is_fixed_point(strings_view, c_decimal_type))
+
+    return Column.from_unique_ptr(move(c_flags))
@@ -1015,6 +1015,8 @@ def astype(self, dtype: Dtype, **kwargs) -> ColumnBase:
                     "Casting interval columns not currently supported"
                 )
             return self
+        elif is_decimal_dtype(dtype):
+            return self.as_decimal_column(dtype, **kwargs)
         elif np.issubdtype(dtype, np.datetime64):
             return self.as_datetime_column(dtype, **kwargs)
         elif np.issubdtype(dtype, np.timedelta64):
@@ -1085,6 +1087,11 @@ def as_string_column(
     ) -> "cudf.core.column.StringColumn":
         raise NotImplementedError
 
+    def as_decimal_column(
+        self, dtype: Dtype, **kwargs
+    ) -> "cudf.core.column.DecimalColumn":
+        """
+        Cast this column to a decimal column of type ``dtype``.
+
+        This implementation unconditionally raises ``NotImplementedError``;
+        it is meant to be overridden by column types that support the
+        conversion.
+        """
+        raise NotImplementedError
+
     def apply_boolean_mask(self, mask) -> ColumnBase:
         mask = as_column(mask, dtype="bool")
         result = (

@@ -1,14 +1,20 @@
 # Copyright (c) 2021, NVIDIA CORPORATION.
 
+import cudf
 import cupy as cp
 import numpy as np
 import pyarrow as pa
 
+from typing import cast
+
 from cudf import _lib as libcudf
 from cudf.core.buffer import Buffer
 from cudf.core.column import ColumnBase
 from cudf.core.dtypes import Decimal64Dtype
 from cudf.utils.utils import pa_mask_buffer_to_mask
+from cudf._lib import string_casting as str_cast
+from cudf._typing import Dtype
+from cudf.core.column import as_column
 
 
 class DecimalColumn(ColumnBase):
@@ -59,6 +65,16 @@ def binary_operator(self, op, other, reflect=False):
         result.dtype.precision = _binop_precision(self.dtype, other.dtype, op)
         return result
 
+    def as_string_column(
+        self, dtype: Dtype, format=None
+    ) -> "cudf.core.column.StringColumn":
+        if len(self) > 0:
+            return str_cast.from_decimal(self)
+        else:
+            return cast(
+                "cudf.core.column.StringColumn", as_column([], dtype="object")
+            )
+
 
 def _binop_precision(l_dtype, r_dtype, op):
     """

@@ -4887,6 +4887,11 @@ def as_timedelta_column(
         format = "%D days %H:%M:%S"
         return self._as_datetime_or_timedelta_column(out_dtype, format)
 
+    def as_decimal_column(
+        self, dtype: Dtype, **kwargs
+    ) -> "cudf.core.column.DecimalColumn":
+        """
+        Convert this column to a decimal column of type ``dtype``.
+
+        Delegates to ``str_cast.to_decimal``; ``**kwargs`` are accepted but
+        ignored.
+        """
+        return str_cast.to_decimal(self, dtype)
+
     def as_string_column(self, dtype: Dtype, format=None) -> StringColumn:
         return self
 

@@ -1,6 +1,7 @@
-# Copyright (c) 2018-2020, NVIDIA CORPORATION.
+# Copyright (c) 2018-2021, NVIDIA CORPORATION.
 import re
 from contextlib import ExitStack as does_not_raise
+from decimal import Decimal
 from sys import getsizeof
 
 import cupy
@@ -206,6 +207,43 @@ def test_string_astype(dtype):
     assert_eq(expect, got)
 
 
+def test_string_decimal():
+    gs = Series(["1.11", "2.22", "3.33"])
+    fp = gs.astype(cudf.Decimal64Dtype(scale=2, precision=3))
+    got = fp.astype("str")
+    assert_eq(gs, got)
+    gs = Series(["111", "222", "33"])
+    fp = gs.astype(cudf.Decimal64Dtype(scale=0, precision=3))
+    got = fp.astype("str")
+    assert_eq(gs, got)
+    gs = Series(["111000", "22000", "3000"])
+    fp = gs.astype(cudf.Decimal64Dtype(scale=-3, precision=3))
+    got = fp.astype("str")
+    assert_eq(gs, got)
+    #
+    fp = cudf.Series(
+        [Decimal("1.23"), Decimal("2.34"), Decimal("3.45")],
+        dtype=cudf.Decimal64Dtype(precision=3, scale=2),
+    )
+    gs = fp.astype("str")
+    got = gs.astype(cudf.Decimal64Dtype(scale=2, precision=3))
+    assert_eq(fp, got)
+    fp = cudf.Series(
+        [Decimal("123"), Decimal("234"), Decimal("345")],
+        dtype=cudf.Decimal64Dtype(precision=3, scale=0),
+    )
+    gs = fp.astype("str")
+    got = gs.astype(cudf.Decimal64Dtype(scale=0, precision=3))
+    assert_eq(fp, got)
+    fp = cudf.Series(
+        [Decimal("12300"), Decimal("-400"), Decimal("5000.0")],
+        dtype=cudf.Decimal64Dtype(precision=5, scale=-2),
+    )
+    gs = fp.astype("str")
+    got = gs.astype(cudf.Decimal64Dtype(scale=-2, precision=5))
+    assert_eq(fp, got)
+
+
 @pytest.mark.parametrize(
     "dtype", NUMERIC_TYPES + DATETIME_TYPES + ["bool", "object", "str"]
 )