79 lines
2.9 KiB
Python
79 lines
2.9 KiB
Python
import numpy as np
|
|
import pytest
|
|
|
|
from pandas import (
|
|
Categorical,
|
|
CategoricalIndex,
|
|
Index,
|
|
Interval,
|
|
)
|
|
import pandas._testing as tm
|
|
|
|
|
|
class TestReindex:
|
|
def test_reindex_list_non_unique(self):
|
|
# GH#11586
|
|
msg = "cannot reindex on an axis with duplicate labels"
|
|
ci = CategoricalIndex(["a", "b", "c", "a"])
|
|
with pytest.raises(ValueError, match=msg):
|
|
ci.reindex(["a", "c"])
|
|
|
|
def test_reindex_categorical_non_unique(self):
|
|
msg = "cannot reindex on an axis with duplicate labels"
|
|
ci = CategoricalIndex(["a", "b", "c", "a"])
|
|
with pytest.raises(ValueError, match=msg):
|
|
ci.reindex(Categorical(["a", "c"]))
|
|
|
|
def test_reindex_list_non_unique_unused_category(self):
|
|
msg = "cannot reindex on an axis with duplicate labels"
|
|
ci = CategoricalIndex(["a", "b", "c", "a"], categories=["a", "b", "c", "d"])
|
|
with pytest.raises(ValueError, match=msg):
|
|
ci.reindex(["a", "c"])
|
|
|
|
def test_reindex_categorical_non_unique_unused_category(self):
|
|
msg = "cannot reindex on an axis with duplicate labels"
|
|
ci = CategoricalIndex(["a", "b", "c", "a"], categories=["a", "b", "c", "d"])
|
|
with pytest.raises(ValueError, match=msg):
|
|
ci.reindex(Categorical(["a", "c"]))
|
|
|
|
def test_reindex_duplicate_target(self):
|
|
# See GH25459
|
|
cat = CategoricalIndex(["a", "b", "c"], categories=["a", "b", "c", "d"])
|
|
res, indexer = cat.reindex(["a", "c", "c"])
|
|
exp = Index(["a", "c", "c"], dtype="object")
|
|
tm.assert_index_equal(res, exp, exact=True)
|
|
tm.assert_numpy_array_equal(indexer, np.array([0, 2, 2], dtype=np.intp))
|
|
|
|
res, indexer = cat.reindex(
|
|
CategoricalIndex(["a", "c", "c"], categories=["a", "b", "c", "d"])
|
|
)
|
|
exp = CategoricalIndex(["a", "c", "c"], categories=["a", "b", "c", "d"])
|
|
tm.assert_index_equal(res, exp, exact=True)
|
|
tm.assert_numpy_array_equal(indexer, np.array([0, 2, 2], dtype=np.intp))
|
|
|
|
def test_reindex_empty_index(self):
|
|
# See GH16770
|
|
c = CategoricalIndex([])
|
|
res, indexer = c.reindex(["a", "b"])
|
|
tm.assert_index_equal(res, Index(["a", "b"]), exact=True)
|
|
tm.assert_numpy_array_equal(indexer, np.array([-1, -1], dtype=np.intp))
|
|
|
|
def test_reindex_categorical_added_category(self):
|
|
# GH 42424
|
|
ci = CategoricalIndex(
|
|
[Interval(0, 1, closed="right"), Interval(1, 2, closed="right")],
|
|
ordered=True,
|
|
)
|
|
ci_add = CategoricalIndex(
|
|
[
|
|
Interval(0, 1, closed="right"),
|
|
Interval(1, 2, closed="right"),
|
|
Interval(2, 3, closed="right"),
|
|
Interval(3, 4, closed="right"),
|
|
],
|
|
ordered=True,
|
|
)
|
|
result, _ = ci.reindex(ci_add)
|
|
expected = ci_add
|
|
tm.assert_index_equal(expected, result)
|