From 3252988f70df71c33bf6c6aa64deb40a970c7c4f Mon Sep 17 00:00:00 2001 From: Dongdong Tian Date: Fri, 11 Oct 2024 13:59:22 +0800 Subject: [PATCH] Fix the conversion error for pandas.Series with missing values in pandas<=2.1 (#3505) Co-authored-by: Wei Ji <23487320+weiji14@users.noreply.github.com> --- pygmt/clib/conversion.py | 22 ++++++++++++++++++++-- 1 file changed, 20 insertions(+), 2 deletions(-) diff --git a/pygmt/clib/conversion.py b/pygmt/clib/conversion.py index 0739d767567..ee80ec1a187 100644 --- a/pygmt/clib/conversion.py +++ b/pygmt/clib/conversion.py @@ -7,6 +7,8 @@ from collections.abc import Sequence import numpy as np +import pandas as pd +from packaging.version import Version from pygmt.exceptions import GMTInvalidInput @@ -178,6 +180,10 @@ def vectors_to_arrays(vectors): >>> [i.ndim for i in data] # Check that they are 1-D arrays [1, 1, 1] + >>> series = pd.Series(data=[0, 4, pd.NA, 8, 6], dtype=pd.Int32Dtype()) + >>> vectors_to_arrays([series]) + [array([ 0., 4., nan, 8., 6.])] + >>> import datetime >>> import pytest >>> pa = pytest.importorskip("pyarrow") @@ -205,8 +211,20 @@ def vectors_to_arrays(vectors): } arrays = [] for vector in vectors: - vec_dtype = str(getattr(vector, "dtype", "")) - arrays.append(np.ascontiguousarray(vector, dtype=dtypes.get(vec_dtype))) + if ( + hasattr(vector, "isna") + and vector.isna().any() + and Version(pd.__version__) < Version("2.2") + ): + # Workaround for dealing with pd.NA with pandas < 2.2. + # Bug report at: https://github.com/GenericMappingTools/pygmt/issues/2844 + # Following SPEC0, pandas 2.1 will be dropped in 2025 Q3, so it's likely + # we can remove the workaround in PyGMT v0.17.0. + array = np.ascontiguousarray(vector.astype(float)) + else: + vec_dtype = str(getattr(vector, "dtype", "")) + array = np.ascontiguousarray(vector, dtype=dtypes.get(vec_dtype)) + arrays.append(array) return arrays