modin-project · dchigarev · Oct 20, 2020 · Oct 19, 2020 · Oct 19, 2020 · Oct 19, 2020
@@ -1559,6 +1559,20 @@ def describe(self, **kwargs):
             .astype(self.dtypes)
             .describe(**kwargs)
         )
+        new_index = empty_df.index
+
+        # Note: `describe` converts the timestamp type to the object type,
+        # which results in the loss of two index values, `first` and `last`,
+        # for an empty DataFrame.
+        datetime_is_numeric = kwargs.get("datetime_is_numeric") or False
+        if not any(map(is_numeric_dtype, empty_df.dtypes)) and not datetime_is_numeric:
+            for col_name in empty_df.dtypes.index:
+                # if the type of `col_name` was previously datetime or timedelta
+                if is_datetime_or_timedelta_dtype(self.dtypes[col_name]):
+                    new_index = pandas.Index(
+                        empty_df.index.to_list() + ["first"] + ["last"]
+                    )
+                    break
 
         def describe_builder(df, internal_indices=[]):
             return df.iloc[:, internal_indices].describe(**kwargs)
@@ -1568,7 +1582,7 @@ def describe_builder(df, internal_indices=[]):
                 0,
                 describe_builder,
                 empty_df.columns,
-                new_index=empty_df.index,
+                new_index=new_index,
                 new_columns=empty_df.columns,
             )
         )

@@ -140,6 +140,26 @@ def test_describe(data, percentiles):
     )
 
 
+@pytest.mark.parametrize("has_numeric_column", [False, True])
+@pytest.mark.parametrize("datetime_is_numeric", [True, False, None])
+def test_2195(datetime_is_numeric, has_numeric_column):
+    data = {
+        "categorical": pd.Categorical(["d"] * 10 ** 2),
+        "date": [np.datetime64("2000-01-01")] * 10 ** 2,
+    }
+    # Without the optional column below, `data` holds only categorical and datetime values.
+    if has_numeric_column:
+        data.update({"numeric": [5] * 10 ** 2})
+    # The same input dict is passed to both `pd.DataFrame` and `pandas.DataFrame`.
+    modin_df, pandas_df = pd.DataFrame(data), pandas.DataFrame(data)
+    # NOTE(review): `eval_general` presumably applies the lambda to both frames and compares the results -- confirm.
+    eval_general(
+        modin_df,
+        pandas_df,
+        lambda df: df.describe(datetime_is_numeric=datetime_is_numeric),
+    )
+
+
 @pytest.mark.parametrize(
     "exclude,include",
     [