projektAI/venv/Lib/site-packages/pandas/tests/indexing/interval/test_interval.py

import numpy as np
import pytest

import pandas as pd
from pandas import DataFrame, IntervalIndex, Series
import pandas._testing as tm


class TestIntervalIndex:
    def setup_method(self, method):
        self.s = Series(np.arange(5), IntervalIndex.from_breaks(np.arange(6)))

    def test_getitem_with_scalar(self):

        s = self.s

        expected = s.iloc[:3]
        tm.assert_series_equal(expected, s[:3])
        tm.assert_series_equal(expected, s[:2.5])
        tm.assert_series_equal(expected, s[0.1:2.5])

        expected = s.iloc[1:4]
        tm.assert_series_equal(expected, s[[1.5, 2.5, 3.5]])
        tm.assert_series_equal(expected, s[[2, 3, 4]])
        tm.assert_series_equal(expected, s[[1.5, 3, 4]])

        expected = s.iloc[2:5]
        tm.assert_series_equal(expected, s[s >= 2])

    @pytest.mark.parametrize("direction", ["increasing", "decreasing"])
    def test_nonoverlapping_monotonic(self, direction, closed):
        tpls = [(0, 1), (2, 3), (4, 5)]
        if direction == "decreasing":
            tpls = tpls[::-1]

        idx = IntervalIndex.from_tuples(tpls, closed=closed)
        s = Series(list("abc"), idx)

        for key, expected in zip(idx.left, s):
            if idx.closed_left:
                assert s[key] == expected
                assert s.loc[key] == expected
            else:
                with pytest.raises(KeyError, match=str(key)):
                    s[key]
                with pytest.raises(KeyError, match=str(key)):
                    s.loc[key]

        for key, expected in zip(idx.right, s):
            if idx.closed_right:
                assert s[key] == expected
                assert s.loc[key] == expected
            else:
                with pytest.raises(KeyError, match=str(key)):
                    s[key]
                with pytest.raises(KeyError, match=str(key)):
                    s.loc[key]

        for key, expected in zip(idx.mid, s):
            assert s[key] == expected
            assert s.loc[key] == expected

    def test_non_matching(self):
        s = self.s

        # this is a departure from our current
        # indexing scheme, but simpler
        with pytest.raises(KeyError, match=r"^\[-1\]$"):
            s.loc[[-1, 3, 4, 5]]

        with pytest.raises(KeyError, match=r"^\[-1\]$"):
            s.loc[[-1, 3]]

    @pytest.mark.arm_slow
    def test_large_series(self):
        s = Series(
            np.arange(1000000), index=IntervalIndex.from_breaks(np.arange(1000001))
        )

        result1 = s.loc[:80000]
        result2 = s.loc[0:80000]
        result3 = s.loc[0:80000:1]
        tm.assert_series_equal(result1, result2)
        tm.assert_series_equal(result1, result3)

    def test_loc_getitem_frame(self):
        # CategoricalIndex with IntervalIndex categories
        df = DataFrame({"A": range(10)})
        s = pd.cut(df.A, 5)
        df["B"] = s
        df = df.set_index("B")

        result = df.loc[4]
        expected = df.iloc[4:6]
        tm.assert_frame_equal(result, expected)

        with pytest.raises(KeyError, match="10"):
            df.loc[10]

        # single list-like
        result = df.loc[[4]]
        expected = df.iloc[4:6]
        tm.assert_frame_equal(result, expected)

        # non-unique
        result = df.loc[[4, 5]]
        expected = df.take([4, 5, 4, 5])
        tm.assert_frame_equal(result, expected)

        with pytest.raises(KeyError, match=r"^\[10\]$"):
            df.loc[[10]]

        # partial missing
        with pytest.raises(KeyError, match=r"^\[10\]$"):
            df.loc[[10, 4]]


class TestIntervalIndexInsideMultiIndex:
    def test_mi_intervalindex_slicing_with_scalar(self):
        # GH#27456
        idx = pd.MultiIndex.from_arrays(
            [
                pd.Index(["FC", "FC", "FC", "FC", "OWNER", "OWNER", "OWNER", "OWNER"]),
                pd.Index(
                    ["RID1", "RID1", "RID2", "RID2", "RID1", "RID1", "RID2", "RID2"]
                ),
                pd.IntervalIndex.from_arrays(
                    [0, 1, 10, 11, 0, 1, 10, 11], [1, 2, 11, 12, 1, 2, 11, 12]
                ),
            ]
        )

        idx.names = ["Item", "RID", "MP"]
        df = DataFrame({"value": [1, 2, 3, 4, 5, 6, 7, 8]})
        df.index = idx
        query_df = DataFrame(
            {
                "Item": ["FC", "OWNER", "FC", "OWNER", "OWNER"],
                "RID": ["RID1", "RID1", "RID1", "RID2", "RID2"],
                "MP": [0.2, 1.5, 1.6, 11.1, 10.9],
            }
        )

        query_df = query_df.sort_index()

        idx = pd.MultiIndex.from_arrays([query_df.Item, query_df.RID, query_df.MP])
        query_df.index = idx
        result = df.value.loc[query_df.index]
        expected = Series([1, 6, 2, 8, 7], index=idx, name="value")
        tm.assert_series_equal(result, expected)
Działa 2021-06-06 22:13:05 +02:00			`import numpy as np`
			`import pytest`

			`import pandas as pd`
			`from pandas import DataFrame, IntervalIndex, Series`
			`import pandas._testing as tm`


			`class TestIntervalIndex:`
			`def setup_method(self, method):`
			`self.s = Series(np.arange(5), IntervalIndex.from_breaks(np.arange(6)))`

			`def test_getitem_with_scalar(self):`

			`s = self.s`

			`expected = s.iloc[:3]`
			`tm.assert_series_equal(expected, s[:3])`
			`tm.assert_series_equal(expected, s[:2.5])`
			`tm.assert_series_equal(expected, s[0.1:2.5])`

			`expected = s.iloc[1:4]`
			`tm.assert_series_equal(expected, s[[1.5, 2.5, 3.5]])`
			`tm.assert_series_equal(expected, s[[2, 3, 4]])`
			`tm.assert_series_equal(expected, s[[1.5, 3, 4]])`

			`expected = s.iloc[2:5]`
			`tm.assert_series_equal(expected, s[s >= 2])`

			`@pytest.mark.parametrize("direction", ["increasing", "decreasing"])`
			`def test_nonoverlapping_monotonic(self, direction, closed):`
			`tpls = [(0, 1), (2, 3), (4, 5)]`
			`if direction == "decreasing":`
			`tpls = tpls[::-1]`

			`idx = IntervalIndex.from_tuples(tpls, closed=closed)`
			`s = Series(list("abc"), idx)`

			`for key, expected in zip(idx.left, s):`
			`if idx.closed_left:`
			`assert s[key] == expected`
			`assert s.loc[key] == expected`
			`else:`
			`with pytest.raises(KeyError, match=str(key)):`
			`s[key]`
			`with pytest.raises(KeyError, match=str(key)):`
			`s.loc[key]`

			`for key, expected in zip(idx.right, s):`
			`if idx.closed_right:`
			`assert s[key] == expected`
			`assert s.loc[key] == expected`
			`else:`
			`with pytest.raises(KeyError, match=str(key)):`
			`s[key]`
			`with pytest.raises(KeyError, match=str(key)):`
			`s.loc[key]`

			`for key, expected in zip(idx.mid, s):`
			`assert s[key] == expected`
			`assert s.loc[key] == expected`

			`def test_non_matching(self):`
			`s = self.s`

			`# this is a departure from our current`
			`# indexing scheme, but simpler`
			`with pytest.raises(KeyError, match=r"^\[-1\]$"):`
			`s.loc[[-1, 3, 4, 5]]`

			`with pytest.raises(KeyError, match=r"^\[-1\]$"):`
			`s.loc[[-1, 3]]`

			`@pytest.mark.arm_slow`
			`def test_large_series(self):`
			`s = Series(`
			`np.arange(1000000), index=IntervalIndex.from_breaks(np.arange(1000001))`
			`)`

			`result1 = s.loc[:80000]`
			`result2 = s.loc[0:80000]`
			`result3 = s.loc[0:80000:1]`
			`tm.assert_series_equal(result1, result2)`
			`tm.assert_series_equal(result1, result3)`

			`def test_loc_getitem_frame(self):`
			`# CategoricalIndex with IntervalIndex categories`
			`df = DataFrame({"A": range(10)})`
			`s = pd.cut(df.A, 5)`
			`df["B"] = s`
			`df = df.set_index("B")`

			`result = df.loc[4]`
			`expected = df.iloc[4:6]`
			`tm.assert_frame_equal(result, expected)`

			`with pytest.raises(KeyError, match="10"):`
			`df.loc[10]`

			`# single list-like`
			`result = df.loc[[4]]`
			`expected = df.iloc[4:6]`
			`tm.assert_frame_equal(result, expected)`

			`# non-unique`
			`result = df.loc[[4, 5]]`
			`expected = df.take([4, 5, 4, 5])`
			`tm.assert_frame_equal(result, expected)`

			`with pytest.raises(KeyError, match=r"^\[10\]$"):`
			`df.loc[[10]]`

			`# partial missing`
			`with pytest.raises(KeyError, match=r"^\[10\]$"):`
			`df.loc[[10, 4]]`


			`class TestIntervalIndexInsideMultiIndex:`
			`def test_mi_intervalindex_slicing_with_scalar(self):`
			`# GH#27456`
			`idx = pd.MultiIndex.from_arrays(`
			`[`
			`pd.Index(["FC", "FC", "FC", "FC", "OWNER", "OWNER", "OWNER", "OWNER"]),`
			`pd.Index(`
			`["RID1", "RID1", "RID2", "RID2", "RID1", "RID1", "RID2", "RID2"]`
			`),`
			`pd.IntervalIndex.from_arrays(`
			`[0, 1, 10, 11, 0, 1, 10, 11], [1, 2, 11, 12, 1, 2, 11, 12]`
			`),`
			`]`
			`)`

			`idx.names = ["Item", "RID", "MP"]`
			`df = DataFrame({"value": [1, 2, 3, 4, 5, 6, 7, 8]})`
			`df.index = idx`
			`query_df = DataFrame(`
			`{`
			`"Item": ["FC", "OWNER", "FC", "OWNER", "OWNER"],`
			`"RID": ["RID1", "RID1", "RID1", "RID2", "RID2"],`
			`"MP": [0.2, 1.5, 1.6, 11.1, 10.9],`
			`}`
			`)`

			`query_df = query_df.sort_index()`

			`idx = pd.MultiIndex.from_arrays([query_df.Item, query_df.RID, query_df.MP])`
			`query_df.index = idx`
			`result = df.value.loc[query_df.index]`
			`expected = Series([1, 6, 2, 8, 7], index=idx, name="value")`
			`tm.assert_series_equal(result, expected)`