Skip to content

Commit ba05a8d

Browse files
add tests for str and pyarrow strings
1 parent 822b3f4 commit ba05a8d

File tree

1 file changed

+30
-0
lines changed

1 file changed

+30
-0
lines changed

pandas/tests/strings/test_get_dummies.py

Lines changed: 30 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -40,6 +40,7 @@ def test_get_dummies_index():
4040
tm.assert_index_equal(result, expected)
4141

4242

43+
# GH#47872
4344
@pytest.mark.parametrize(
4445
"dtype",
4546
[
@@ -67,6 +68,7 @@ def test_get_dummies_with_dtype(any_string_dtype, dtype):
6768
tm.assert_frame_equal(result, expected)
6869

6970

71+
# GH#47872
7072
@td.skip_if_no("pyarrow")
7173
@pytest.mark.parametrize(
7274
"dtype",
@@ -91,3 +93,31 @@ def test_get_dummies_with_pyarrow_dtype(any_string_dtype, dtype):
9193
dtype=dtype,
9294
)
9395
tm.assert_frame_equal(result, expected)
96+
97+
98+
# GH#47872
99+
def test_get_dummies_with_str_dtype(any_string_dtype):
    """Check ``str.get_dummies`` output when ``dtype=str`` is requested.

    The expected frame holds the strings "T"/"F" as indicators, one column
    per token ("a", "b", "c") found after splitting on "|".
    """
    # One expected row per input element; the trailing missing value is
    # expected to give "F" in every column.
    indicator_rows = [
        ["T", "T", "F"],
        ["T", "F", "T"],
        ["F", "F", "F"],
    ]
    expected = DataFrame(indicator_rows, columns=list("abc"), dtype=str)

    ser = Series(["a|b", "a|c", np.nan], dtype=any_string_dtype)
    result = ser.str.get_dummies("|", dtype=str)

    tm.assert_frame_equal(result, expected)
108+
109+
110+
# GH#47872
111+
@td.skip_if_no("pyarrow")
def test_get_dummies_with_pa_str_dtype(any_string_dtype):
    """Check ``str.get_dummies`` output when ``dtype="str[pyarrow]"`` is requested.

    The expected frame holds the strings "true"/"false" as indicators, one
    column per token ("a", "b", "c") found after splitting on "|".

    The test is skipped when pyarrow is not installed, because the requested
    output dtype is pyarrow-backed; this matches the guard on the sibling
    pyarrow dtype test in this module.
    """
    s = Series(["a|b", "a|c", np.nan], dtype=any_string_dtype)
    result = s.str.get_dummies("|", dtype="str[pyarrow]")
    expected = DataFrame(
        [
            ["true", "true", "false"],
            ["true", "false", "true"],
            # The missing input value is expected to be "false" everywhere.
            ["false", "false", "false"],
        ],
        columns=list("abc"),
        dtype="str[pyarrow]",
    )
    tm.assert_frame_equal(result, expected)

0 commit comments

Comments
 (0)