added pyarrow/numpy dtype literals and allowed str | DtypeObj as input for Series.astype #756

Merged
merged 14 commits on Jul 25, 2023
Changes from 2 commits
112 changes: 91 additions & 21 deletions pandas-stubs/_typing.pyi
@@ -86,7 +86,11 @@ BooleanDtypeArg: TypeAlias = (
| pd.BooleanDtype
| Literal["boolean"]
# Numpy bool type
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.bool_
| type[np.bool_]
| Literal["?", "bool8", "bool_"]
# PyArrow boolean type and its string alias
| Literal["bool[pyarrow]", "boolean[pyarrow]"]
)
IntDtypeArg: TypeAlias = (
# Builtin integer type and its string alias
@@ -98,22 +102,48 @@ IntDtypeArg: TypeAlias = (
| pd.Int32Dtype
| pd.Int64Dtype
| Literal["Int8", "Int16", "Int32", "Int64"]
# Pandas nullable unsigned integer types and their string aliases
| pd.UInt8Dtype
| pd.UInt16Dtype
| pd.UInt32Dtype
| pd.UInt64Dtype
| Literal["UInt8", "UInt16", "UInt32", "UInt64"]
# Numpy signed integer types and their string aliases
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.byte
| type[np.byte]
| type[np.int8]
| Literal["b", "int8", "byte"]
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.short
| type[np.int16]
| type[np.int32]
| type[np.int64]
| type[np.intp]
| Literal["byte", "int8", "int16", "int32", "int64", "intp"]
| Literal["h", "int16", "short"]
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.intc
| type[np.intc]
| Literal["i", "int32", "intc"]
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.int_
| type[np.int_]
| Literal["l", "int64", "int_", "intp", "long"]
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.longlong
| type[np.longlong]
| Literal["q", "longlong"] # NOTE: int128 not assigned
# Numpy unsigned integer types and their string aliases
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.ubyte
| type[np.ubyte]
| type[np.uint8]
| type[np.uint16]
| type[np.uint32]
| type[np.uint64]
| type[np.uintp]
| Literal["ubyte", "uint8", "uint16", "uint32", "uint64", "uintp"]
| Literal["B", "uint8", "ubyte"]
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.ushort
| type[np.ushort]
| Literal["H", "uint16", "ushort"]
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.uintc
| type[np.uintc]
| Literal["I", "uint32", "uintc"]
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.uint
| type[np.uint]
| Literal["L", "uint64", "uint", "uintp"]
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.ulonglong
| type[np.ulonglong]
| Literal["Q", "ulonglong"] # NOTE: uint128 not assigned
# PyArrow integer types and their string aliases
| Literal["int8[pyarrow]", "int16[pyarrow]", "int32[pyarrow]", "int64[pyarrow]"]
# PyArrow unsigned integer types and their string aliases
| Literal["uint8[pyarrow]", "uint16[pyarrow]", "uint32[pyarrow]", "uint64[pyarrow]"]
)
StrDtypeArg: TypeAlias = (
# Builtin str type and its string alias
@@ -122,6 +152,8 @@ StrDtypeArg: TypeAlias = (
# Pandas nullable string type and its string alias
| pd.StringDtype
| Literal["string"]
# PyArrow string type and its string alias
| Literal["string[pyarrow]"]
)
BytesDtypeArg: TypeAlias = type[bytes]
FloatDtypeArg: TypeAlias = (
@@ -133,19 +165,43 @@ FloatDtypeArg: TypeAlias = (
| pd.Float64Dtype
| Literal["Float32", "Float64"]
# Numpy float types and their string aliases
| type[np.float16]
| type[np.float32]
| type[np.float64]
| Literal["float16", "float32", "float64"]
# NOTE: Alias np.float16 only on Linux x86_64, use np.half instead
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.half
| type[np.half]
| Literal["e", "float16", "half"]
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.single
| type[np.single]
| Literal["f", "float32", "single"]
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.double
| type[np.double]
| Literal["d", "float64", "double", "float_"]
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.longdouble
| type[np.longdouble]
| Literal["g", "float128", "longdouble", "longfloat"]
# PyArrow floating point types and their string aliases
| Literal[
"float[pyarrow]",
"double[pyarrow]",
"float16[pyarrow]",
"float32[pyarrow]",
"float64[pyarrow]",
]
)
ComplexDtypeArg: TypeAlias = (
# Builtin complex type and its string alias
type[complex] # noqa: Y030
| Literal["complex"]
# Numpy complex types and their aliases
| type[np.complex64]
| type[np.complex128]
| Literal["complex64", "complex128"]
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.csingle
| type[np.csingle]
| Literal["F", "complex64", "singlecomplex"]
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.cdouble
| type[np.cdouble]
| Literal["D", "complex128", "cdouble", "cfloat", "complex_"]
# https://numpy.org/doc/stable/reference/arrays.scalars.html#numpy.clongdouble
# NOTE: Alias np.complex256 only on Linux x86_64, use np.clongdouble instead
| type[np.clongdouble]
| Literal["G", "complex256", "clongdouble", "clongfloat", "longcomplex"]
)
# Refer to https://numpy.org/doc/stable/reference/arrays.datetime.html#datetime-units
TimedeltaDtypeArg: TypeAlias = Literal[
@@ -163,6 +219,11 @@ TimedeltaDtypeArg: TypeAlias = Literal[
"timedelta64[ps]",
"timedelta64[fs]",
"timedelta64[as]",
# PyArrow duration type and its string alias
"duration[s][pyarrow]",
"duration[ms][pyarrow]",
"duration[us][pyarrow]",
"duration[ns][pyarrow]",
]
TimestampDtypeArg: TypeAlias = Literal[
"datetime64[Y]",
@@ -179,9 +240,19 @@ TimestampDtypeArg: TypeAlias = Literal[
"datetime64[ps]",
"datetime64[fs]",
"datetime64[as]",
# PyArrow timestamp type and its string alias
"date32[pyarrow]",
"date64[pyarrow]",
"timestamp[s][pyarrow]",
"timestamp[ms][pyarrow]",
"timestamp[us][pyarrow]",
"timestamp[ns][pyarrow]",
]
CategoryDtypeArg: TypeAlias = CategoricalDtype | Literal["category"]

# DtypeArg specifies all allowable dtypes in a functions its dtype argument
DtypeObj: TypeAlias = np.dtype[np.generic] | ExtensionDtype

AstypeArg: TypeAlias = (
BooleanDtypeArg
| IntDtypeArg
@@ -192,11 +263,10 @@ AstypeArg: TypeAlias = (
| TimedeltaDtypeArg
| TimestampDtypeArg
| CategoryDtypeArg
| ExtensionDtype
| DtypeObj
| type[object]
| str

Collaborator
I don't think we should accept a general string here. The whole idea of the other aliases is to constrain which strings are acceptable.

Contributor Author
str must be acceptable, as e.g. a string might be provided dynamically. The same applies to accepting a generic dtype object, which one must if s.astype(s.dtype) is to work without raising a warning.

The correct way to handle this is to be careful with the overload order, going from specific to generic.
All of the existing tests still work with this change.
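
A minimal sketch of that ordering (hypothetical, simplified signatures; not the actual stub layout): the specific Literal overloads come first and the generic str fallback comes last.

from typing import Literal, overload

import numpy as np
import pandas as pd

class _Series:
    @overload
    def astype(self, dtype: Literal["int8", "int16", "int32", "int64"]) -> "pd.Series[int]": ...
    @overload
    def astype(self, dtype: Literal["float32", "float64"]) -> "pd.Series[float]": ...
    @overload
    def astype(self, dtype: str | np.dtype) -> "pd.Series": ...  # generic fallback, matched last
    def astype(self, dtype):
        ...  # runtime implementation, irrelevant for the stubs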

Collaborator
It makes the type check too wide: it allows pd.DataFrame().astype("foobar") to pass. I'd rather have the stubs catch the most common cases (not dynamic strings). Having said that, if we want s.astype(s.dtype) to work, maybe we should just say that s.dtype returns AstypeArg.
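
A sketch of that alternative, assuming dtype were annotated to return the same objects astype accepts (hypothetical; not what the stubs declare today):

from typing import TypeAlias

import numpy as np
from pandas.api.extensions import ExtensionDtype

DtypeObj: TypeAlias = np.dtype | ExtensionDtype

class _Series:
    @property
    def dtype(self) -> DtypeObj: ...  # narrowed so that s.astype(s.dtype) type-checks
    def astype(self, dtype: DtypeObj) -> "_Series": ...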

Contributor
If there were a way to specify a non-literal string, that would be ideal: if the checker sees a literal, the literal should be verified. I am not aware of a way to achieve that with current typing features.

Contributor
Another note - I think in subjective cases like this, you have to ask what the most common use case is. I would contend that dynamic/runtime-based astype calls are atypical. The majority of the time it's a static transformation, and the developer is aware of the source and target dtypes. In that case, they would hard-code the destination type.

Contributor Author
@gandhis1 As an example for a dynamic astype(string): I have some data pipelines for reading CSV files where I store config files with the target schema (e.g. column dtypes).
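
For concreteness, a hedged illustration of that kind of pipeline (file names and schema contents are made up):

import json

import pandas as pd

# hypothetical config file, e.g. {"price": "float64", "qty": "int64[pyarrow]"}
with open("schema.json") as f:
    schema: dict[str, str] = json.load(f)

df = pd.read_csv("data.csv")  # hypothetical input file
for column, dtype in schema.items():
    # dtype is a plain runtime str here, never a Literal
    df[column] = df[column].astype(dtype)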

Contributor Author
@gandhis1 @Dr-Irv In Python 3.11 LiteralString was added; I wonder if this can be used to raise a typing error if none of the defined literals is matched? That would give the best of both worlds.

Contributor Author
I asked this here: python/typing#1434

Contributor Author
Hm, doesn't seem possible currently. Possibly in the future if both Intersection and Not are supported: python/typing#801 (comment)
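
A sketch of the limitation (illustrative only; the desired spelling mentioned above is not valid typing syntax today):

from typing import Literal, overload

@overload
def astype(dtype: Literal["int8", "int64"]) -> int: ...
@overload
def astype(dtype: str) -> object: ...  # a typo like "foobar" also matches here, so no error is raised
def astype(dtype):
    ...

# Desired: a fallback that accepts only non-literal strings, which would need
# Intersection/Not support, e.g. something like str & ~LiteralString.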

Collaborator
> @gandhis1 As an example for a dynamic astype(string): I have some data pipelines for reading CSV files where I store config files with the target schema (e.g. column dtypes).

That's an interesting example, but that's a case where the argument you are using is dynamic, and you're trying to check it in a static typing context. If your config files had an incorrect string "foobar" not covered by the stubs, your code would fail at runtime.

IMHO, the goal of the static type checks is to catch things before runtime. So we have two alternatives:

  1. Do not include str as a valid argument (as it is right now in the stubs). Disadvantage: you can't use a dynamic string as an argument, as in your use case. Advantage: only the statically declared valid strings are accepted.
  2. Include str as a valid argument. Disadvantage: we don't help people who use .astype("ing") instead of .astype("int") before runtime. Advantage: your use case works.

I would argue that people use .astype("some-string") far more often than they pass a dynamic string as the argument. So that's why I would prefer (1) above.
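
The trade-off in code (illustrative, not part of the PR):

import pandas as pd

s = pd.Series([1, 2, 3])
dynamic: str = "".join(["int", "64"])  # a dtype string only known at runtime

# Alternative 1 - no plain str in AstypeArg:
#   s.astype("ing")    -> rejected by the type checker (typo caught before runtime)
#   s.astype(dynamic)  -> also rejected, even though it is valid at runtime

# Alternative 2 - plain str accepted (this PR):
#   s.astype("ing")    -> passes type checking and only fails at runtime
s.astype(dynamic)      # accepted; covers the config-file use case above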

Collaborator
This str still has to be removed.

)
# DtypeArg specifies all allowable dtypes in a functions its dtype argument
DtypeObj: TypeAlias = np.dtype[np.generic] | ExtensionDtype

# filenames and file-like-objects
AnyStr_cov = TypeVar("AnyStr_cov", str, bytes, covariant=True)
4 changes: 2 additions & 2 deletions pandas-stubs/core/series.pyi
@@ -329,7 +329,7 @@ class Series(IndexOpsMixin, NDFrame, Generic[S1]):
is_copy: _bool | None = ...,
**kwargs,
) -> Series[S1]: ...
def __getattr__(self, name: str) -> S1: ...
def __getattr__(self, name: _str) -> S1: ...
@overload
def __getitem__(
self,
@@ -1208,7 +1208,7 @@ class Series(IndexOpsMixin, NDFrame, Generic[S1]):
@overload
def astype(
self,
dtype: type[object] | ExtensionDtype,
dtype: type[object] | ExtensionDtype | DtypeObj | _str,
copy: _bool = ...,
errors: IgnoreRaise = ...,
) -> Series: ...
60 changes: 59 additions & 1 deletion tests/test_series.py
@@ -1697,8 +1697,12 @@ def test_updated_astype() -> None:
s = pd.Series([3, 4, 5])
s1 = pd.Series(True)

# Boolean types
# dynamically typed
string: str = "int" # not Literal!
check(assert_type(s.astype(string), "pd.Series[Any]"), pd.Series, np.integer)
check(assert_type(s.astype(s.dtype), "pd.Series[Any]"), pd.Series, np.integer)

# Boolean types
# Builtin bool types
check(assert_type(s.astype(bool), "pd.Series[bool]"), pd.Series, np.bool_)
check(assert_type(s.astype("bool"), "pd.Series[bool]"), pd.Series, np.bool_)
@@ -1791,6 +1795,20 @@ def test_updated_astype() -> None:
check(assert_type(s.astype("float16"), "pd.Series[float]"), pd.Series, np.float16)
check(assert_type(s.astype("float32"), "pd.Series[float]"), pd.Series, np.float32)
check(assert_type(s.astype("float64"), "pd.Series[float]"), pd.Series, np.float64)
check(assert_type(s.astype("float64"), "pd.Series[float]"), pd.Series, np.float64)
check(assert_type(s.astype("float64"), "pd.Series[float]"), pd.Series, np.float64)

# pyarrow
check(
assert_type(s.astype("int64[pyarrow]"), "pd.Series[int]"),
pd.Series,
int,
)
check(
assert_type(s.astype("float[pyarrow]"), "pd.Series[float]"),
pd.Series,
float,
)

# Complex types

@@ -1889,6 +1907,26 @@ def test_updated_astype() -> None:
pd.Series,
Timedelta,
)
check(
assert_type(s.astype("duration[s][pyarrow]"), TimedeltaSeries),
pd.Series,
datetime.timedelta,
)
check(
assert_type(s.astype("duration[ms][pyarrow]"), TimedeltaSeries),
pd.Series,
datetime.timedelta,
)
check(
assert_type(s.astype("duration[us][pyarrow]"), TimedeltaSeries),
pd.Series,
datetime.timedelta,
)
check(
assert_type(s.astype("duration[ns][pyarrow]"), TimedeltaSeries),
pd.Series,
datetime.timedelta,
)

check(
assert_type(s.astype("datetime64[Y]"), TimestampSeries),
@@ -1960,6 +1998,26 @@ def test_updated_astype() -> None:
pd.Series,
Timestamp,
)
check(
assert_type(s.astype("timestamp[s][pyarrow]"), TimestampSeries),
pd.Series,
datetime.datetime,
)
check(
assert_type(s.astype("timestamp[ms][pyarrow]"), TimestampSeries),
pd.Series,
datetime.datetime,
)
check(
assert_type(s.astype("timestamp[us][pyarrow]"), TimestampSeries),
pd.Series,
datetime.datetime,
)
check(
assert_type(s.astype("timestamp[ns][pyarrow]"), TimestampSeries),
pd.Series,
datetime.datetime,
)

orseries = pd.Series([Decimal(x) for x in [1, 2, 3]])
newtype = DecimalDtype()