Skip to content

Commit

Permalink
BUG: Fix Series constructor for Categorical with index
Browse files Browse the repository at this point in the history
Fixes Series constructor so that ValueError is raised when a Categorical and index of different length are given.
  • Loading branch information
cbertinato committed Feb 16, 2018
1 parent 11de131 commit 28b70b8
Show file tree
Hide file tree
Showing 3 changed files with 34 additions and 0 deletions.
1 change: 1 addition & 0 deletions doc/source/whatsnew/v0.23.0.txt
Original file line number Diff line number Diff line change
Expand Up @@ -690,6 +690,7 @@ Categorical
- Bug in :meth:`Index.astype` with a categorical dtype where the resultant index is not converted to a :class:`CategoricalIndex` for all types of index (:issue:`18630`)
- Bug in :meth:`Series.astype` and ``Categorical.astype()`` where an existing categorical data does not get updated (:issue:`10696`, :issue:`18593`)
- Bug in :class:`Index` constructor with ``dtype=CategoricalDtype(...)`` where ``categories`` and ``ordered`` are not maintained (issue:`19032`)
- Bug in :class:`Series` constructor with ``Categorical`` where an error is not raised when an index of different length is given (:issue:`19342`)

Datetimelike
^^^^^^^^^^^^
Expand Down
5 changes: 5 additions & 0 deletions pandas/core/series.py
Original file line number Diff line number Diff line change
Expand Up @@ -210,6 +210,11 @@ def __init__(self, data=None, index=None, dtype=None, name=None,
raise ValueError("cannot specify a dtype with a "
"Categorical unless "
"dtype='category'")
if index is not None and len(index) != len(data):
raise ValueError('Length of passed values is {val}, '
'index implies {ind}'
.format(val=len(data), ind=len(index)))

elif (isinstance(data, types.GeneratorType) or
(compat.PY3 and isinstance(data, map))):
data = list(data)
Expand Down
28 changes: 28 additions & 0 deletions pandas/tests/series/test_constructors.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,7 @@

from datetime import datetime, timedelta
from collections import OrderedDict
import types

from numpy import nan
import numpy as np
Expand All @@ -22,6 +23,7 @@
from pandas._libs import lib
from pandas._libs.tslib import iNaT

from pandas import compat
from pandas.compat import lrange, range, zip, long
from pandas.util.testing import assert_series_equal
import pandas.util.testing as tm
Expand Down Expand Up @@ -393,6 +395,32 @@ def test_constructor_default_index(self):
s = Series([0, 1, 2])
tm.assert_index_equal(s.index, pd.Index(np.arange(3)))

@pytest.mark.parametrize('input', [[1, 2, 3],
(1, 2, 3),
list(range(3)),
pd.Categorical(['a', 'b', 'a']),
(i for i in range(3)),
map(lambda x: x, range(3))])
def test_constructor_index_mismatch(self, input):
# GH 19342
# test that construction of a Series with an index of different length
# raises an error
idx = np.arange(4)
if compat.PY2:
typs = types.GeneratorType
else:
typs = (map, types.GeneratorType)

if isinstance(input, typs):
input_len = len(list(input))
else:
input_len = len(input)

msg = ('Length of passed values is {val}, index implies {ind}'
.format(val=input_len, ind=len(idx)))
with pytest.raises(ValueError, message=msg):
Series(input, index=idx)

def test_constructor_corner(self):
df = tm.makeTimeDataFrame()
objs = [df, df]
Expand Down

0 comments on commit 28b70b8

Please sign in to comment.