projektAI/venv/Lib/site-packages/pandas/tests/arrays/categorical/test_replace.py

import numpy as np
import pytest

import pandas as pd
from pandas import Categorical
import pandas._testing as tm


@pytest.mark.parametrize(
    "to_replace,value,expected,flip_categories",
    [
        # one-to-one
        (1, 2, [2, 2, 3], False),
        (1, 4, [4, 2, 3], False),
        (4, 1, [1, 2, 3], False),
        (5, 6, [1, 2, 3], False),
        # many-to-one
        ([1], 2, [2, 2, 3], False),
        ([1, 2], 3, [3, 3, 3], False),
        ([1, 2], 4, [4, 4, 3], False),
        ((1, 2, 4), 5, [5, 5, 3], False),
        ((5, 6), 2, [1, 2, 3], False),
        # many-to-many, handled outside of Categorical and results in separate dtype
        #  except for cases with only 1 unique entry in `value`
        ([1], [2], [2, 2, 3], True),
        ([1, 4], [5, 2], [5, 2, 3], True),
        # check_categorical sorts categories, which crashes on mixed dtypes
        (3, "4", [1, 2, "4"], False),
        ([1, 2, "3"], "5", ["5", "5", 3], True),
    ],
)
def test_replace(to_replace, value, expected, flip_categories):
    """
    Check ``Series.replace`` on a categorical Series, copying and in place.

    The Series ``[1, 2, 3]`` with category dtype is replaced once into a new
    object and once with ``inplace=True``; both outcomes are compared against
    a Series built from ``expected``. ``flip_categories`` reverses the
    categories of that expected Series before the comparison.
    """
    # GH 31720
    if isinstance(value, list):
        # a list ``value`` keeps the categorical dtype only when it holds
        # a single distinct entry
        stays_categorical = len(pd.unique(value)) == 1
    else:
        stays_categorical = True

    ser = pd.Series([1, 2, 3], dtype="category")
    replaced = ser.replace(to_replace, value)
    ser.replace(to_replace, value, inplace=True)

    expected = pd.Series(expected, dtype="category")
    if flip_categories:
        reversed_categories = expected.cat.categories[::-1]
        expected = expected.cat.set_categories(reversed_categories)

    if not stays_categorical:
        # the replace call loses categorical dtype
        expected = pd.Series(np.asarray(expected))

    # the copy and the in-place result must both match the expectation
    for actual in (replaced, ser):
        tm.assert_series_equal(expected, actual, check_category_order=False)


@pytest.mark.parametrize(
    "to_replace, value, result, expected_error_msg",
    [
        ("b", "c", ["a", "c"], "Categorical.categories are different"),
        ("c", "d", ["a", "b"], None),
        # https://github.com/pandas-dev/pandas/issues/33288
        ("a", "a", ["a", "b"], None),
        ("b", None, ["a", None], "Categorical.categories length are different"),
    ],
)
def test_replace2(to_replace, value, result, expected_error_msg):
    """
    Check ``Categorical.replace`` both as a copy and with ``inplace=True``.

    ``result`` lists the values the Categorical ``["a", "b"]`` should hold
    after the replacement. For the ``"b"`` cases the untouched original is
    additionally required to differ from the expectation, with the assertion
    failure matching ``expected_error_msg``.
    """
    # TODO: better name
    # GH#26988
    categorical = Categorical(["a", "b"])
    expected = Categorical(result)

    replaced = categorical.replace(to_replace, value)
    tm.assert_categorical_equal(replaced, expected)

    # only the "b" cases are checked here; the "c" test is supposed to be
    # unchanged
    if to_replace == "b":
        # ensure non-inplace call does not affect original
        with pytest.raises(AssertionError, match=expected_error_msg):
            tm.assert_categorical_equal(categorical, expected)

    categorical.replace(to_replace, value, inplace=True)
    tm.assert_categorical_equal(categorical, expected)
Działa 2021-06-06 22:13:05 +02:00			`import numpy as np`
			`import pytest`

			`import pandas as pd`
			`from pandas import Categorical`
			`import pandas._testing as tm`


			`@pytest.mark.parametrize(`
			`"to_replace,value,expected,flip_categories",`
			`[`
			`# one-to-one`
			`(1, 2, [2, 2, 3], False),`
			`(1, 4, [4, 2, 3], False),`
			`(4, 1, [1, 2, 3], False),`
			`(5, 6, [1, 2, 3], False),`
			`# many-to-one`
			`([1], 2, [2, 2, 3], False),`
			`([1, 2], 3, [3, 3, 3], False),`
			`([1, 2], 4, [4, 4, 3], False),`
			`((1, 2, 4), 5, [5, 5, 3], False),`
			`((5, 6), 2, [1, 2, 3], False),`
			`# many-to-many, handled outside of Categorical and results in separate dtype`
			`` #  except for cases with only 1 unique entry in `value` ``
			`([1], [2], [2, 2, 3], True),`
			`([1, 4], [5, 2], [5, 2, 3], True),`
			`# check_categorical sorts categories, which crashes on mixed dtypes`
			`(3, "4", [1, 2, "4"], False),`
			`([1, 2, "3"], "5", ["5", "5", 3], True),`
			`],`
			`)`
			`def test_replace(to_replace, value, expected, flip_categories):`
			`# GH 31720`
			`stays_categorical = not isinstance(value, list) or len(pd.unique(value)) == 1`

			`s = pd.Series([1, 2, 3], dtype="category")`
			`result = s.replace(to_replace, value)`
			`expected = pd.Series(expected, dtype="category")`
			`s.replace(to_replace, value, inplace=True)`

			`if flip_categories:`
			`expected = expected.cat.set_categories(expected.cat.categories[::-1])`

			`if not stays_categorical:`
			`# the replace call loses categorical dtype`
			`expected = pd.Series(np.asarray(expected))`

			`tm.assert_series_equal(expected, result, check_category_order=False)`
			`tm.assert_series_equal(expected, s, check_category_order=False)`


			`@pytest.mark.parametrize(`
			`"to_replace, value, result, expected_error_msg",`
			`[`
			`("b", "c", ["a", "c"], "Categorical.categories are different"),`
			`("c", "d", ["a", "b"], None),`
			`# https://github.com/pandas-dev/pandas/issues/33288`
			`("a", "a", ["a", "b"], None),`
			`("b", None, ["a", None], "Categorical.categories length are different"),`
			`],`
			`)`
			`def test_replace2(to_replace, value, result, expected_error_msg):`
			`# TODO: better name`
			`# GH#26988`
			`cat = Categorical(["a", "b"])`
			`expected = Categorical(result)`
			`result = cat.replace(to_replace, value)`
			`tm.assert_categorical_equal(result, expected)`
			`if to_replace == "b": # the "c" test is supposed to be unchanged`
			`with pytest.raises(AssertionError, match=expected_error_msg):`
			`# ensure non-inplace call does not affect original`
			`tm.assert_categorical_equal(cat, expected)`
			`cat.replace(to_replace, value, inplace=True)`
			`tm.assert_categorical_equal(cat, expected)`