99 lines
2.7 KiB
Python
99 lines
2.7 KiB
Python
import pytest
|
|
|
|
from pandas import DataFrame
|
|
import pandas._testing as tm
|
|
from pandas.core.reshape.merge import (
|
|
MergeError,
|
|
merge,
|
|
)
|
|
|
|
|
|
@pytest.mark.parametrize(
    ("input_col", "output_cols"), [("b", ["a", "b"]), ("a", ["a_x", "a_y"])]
)
def test_merge_cross(input_col, output_cols):
    """Check the result of a cross merge and that the inputs are left untouched.

    Parameters
    ----------
    input_col : str
        Name of the single column in the right frame. When it equals the
        left frame's column name ("a"), the expected output columns carry
        the ``_x`` / ``_y`` suffixes.
    output_cols : list of str
        Expected column names of the merged frame, left column first.
    """
    # GH#5401
    left = DataFrame({"a": [1, 3]})
    right = DataFrame({input_col: [3, 4]})
    # Snapshots used below to verify that merge() does not mutate its inputs.
    left_copy = left.copy()
    right_copy = right.copy()
    result = merge(left, right, how="cross")
    # Every left row is paired with every right row, left order outermost.
    expected = DataFrame({output_cols[0]: [1, 1, 3, 3], output_cols[1]: [3, 4, 3, 4]})
    tm.assert_frame_equal(result, expected)
    tm.assert_frame_equal(left, left_copy)
    tm.assert_frame_equal(right, right_copy)
|
|
|
|
|
|
@pytest.mark.parametrize(
    "kwargs",
    [
        {"left_index": True},
        {"right_index": True},
        {"on": "a"},
        {"left_on": "a"},
        {"right_on": "b"},
    ],
)
def test_merge_cross_error_reporting(kwargs):
    """Check that a cross merge raises MergeError when a key or index is given.

    Parameters
    ----------
    kwargs : dict
        A single key/index keyword argument (``on``, ``left_on``,
        ``right_on``, ``left_index`` or ``right_index``) forwarded to
        ``merge`` together with ``how="cross"``.
    """
    # GH#5401
    left = DataFrame({"a": [1, 3]})
    right = DataFrame({"b": [3, 4]})
    msg = (
        "Can not pass on, right_on, left_on or set right_index=True or "
        "left_index=True"
    )
    with pytest.raises(MergeError, match=msg):
        merge(left, right, how="cross", **kwargs)
|
|
|
|
|
|
def test_merge_cross_mixed_dtypes():
    """Check a cross merge between a string column and an integer column."""
    # GH#5401
    left = DataFrame(["a", "b", "c"], columns=["A"])
    right = DataFrame(range(2), columns=["B"])
    result = merge(left, right, how="cross")
    # 3 left rows x 2 right rows -> 6 rows, each left value repeated per right row.
    expected = DataFrame({"A": ["a", "a", "b", "b", "c", "c"], "B": [0, 1, 0, 1, 0, 1]})
    tm.assert_frame_equal(result, expected)
|
|
|
|
|
|
def test_merge_cross_more_than_one_column():
    """Check a cross merge when both frames have more than one column."""
    # GH#5401
    left = DataFrame({"A": list("ab"), "B": [2, 1]})
    right = DataFrame({"C": range(2), "D": range(4, 6)})
    result = merge(left, right, how="cross")
    # All left columns come first, followed by all right columns.
    expected = DataFrame(
        {
            "A": ["a", "a", "b", "b"],
            "B": [2, 2, 1, 1],
            "C": [0, 1, 0, 1],
            "D": [4, 5, 4, 5],
        }
    )
    tm.assert_frame_equal(result, expected)
|
|
|
|
|
|
def test_merge_cross_null_values(nulls_fixture):
    """Check that a null value in the left frame survives a cross merge.

    Parameters
    ----------
    nulls_fixture : object
        Value injected by the pytest fixture of the same name, which is
        defined outside this file (presumably a null-like scalar such as
        ``None`` or ``NaN`` -- confirm against the fixture definition).
    """
    # GH#5401
    left = DataFrame({"a": [1, nulls_fixture]})
    right = DataFrame({"b": ["a", "b"], "c": [1.0, 2.0]})
    result = merge(left, right, how="cross")
    # The null row is expanded like any other row: once per right-hand row.
    expected = DataFrame(
        {
            "a": [1, 1, nulls_fixture, nulls_fixture],
            "b": ["a", "b", "a", "b"],
            "c": [1.0, 2.0, 1.0, 2.0],
        }
    )
    tm.assert_frame_equal(result, expected)
|
|
|
|
|
|
def test_join_cross_error_reporting():
    """Check that ``DataFrame.join`` with ``how="cross"`` and ``on`` raises MergeError."""
    # GH#5401
    left = DataFrame({"a": [1, 3]})
    right = DataFrame({"a": [3, 4]})
    msg = (
        "Can not pass on, right_on, left_on or set right_index=True or "
        "left_index=True"
    )
    with pytest.raises(MergeError, match=msg):
        left.join(right, how="cross", on="a")
|