Skip to content

Commit ef747da

Browse files
TST/CLN: move some tests (#41474)
1 parent e0ca3de commit ef747da

File tree

3 files changed

+62
-53
lines changed

3 files changed

+62
-53
lines changed

pandas/tests/strings/test_case_justify.py

+9
Original file line number | Diff line number | Diff line change
@@ -81,6 +81,15 @@ def test_swapcase_mixed_object():
81 81
tm.assert_series_equal(result, expected)
82 82

83 83

84+
def test_casefold():
85+
# GH25405
86+
expected = Series(["ss", np.nan, "case", "ssd"])
87+
s = Series(["ß", np.nan, "case", "ßd"])
88+
result = s.str.casefold()
89+
90+
tm.assert_series_equal(result, expected)
91+
92+
84 93
def test_casemethods(any_string_dtype):
85 94
values = ["aaa", "bbb", "CCC", "Dddd", "eEEE"]
86 95
s = Series(values, dtype=any_string_dtype)
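(new file — path not captured in this extract; presumably pandas/tests/strings/test_get_dummies.py, to be verified against the commit)

+53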
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,53 @@
1+
import numpy as np
2+
3+
from pandas import (
4+
DataFrame,
5+
Index,
6+
MultiIndex,
7+
Series,
8+
_testing as tm,
9+
)
10+
11+
12+
def test_get_dummies(any_string_dtype):
13+
s = Series(["a|b", "a|c", np.nan], dtype=any_string_dtype)
14+
result = s.str.get_dummies("|")
15+
expected = DataFrame([[1, 1, 0], [1, 0, 1], [0, 0, 0]], columns=list("abc"))
16+
tm.assert_frame_equal(result, expected)
17+
18+
s = Series(["a;b", "a", 7], dtype=any_string_dtype)
19+
result = s.str.get_dummies(";")
20+
expected = DataFrame([[0, 1, 1], [0, 1, 0], [1, 0, 0]], columns=list("7ab"))
21+
tm.assert_frame_equal(result, expected)
22+
23+
24+
def test_get_dummies_index():
25+
# GH9980, GH8028
26+
idx = Index(["a|b", "a|c", "b|c"])
27+
result = idx.str.get_dummies("|")
28+
29+
expected = MultiIndex.from_tuples(
30+
[(1, 1, 0), (1, 0, 1), (0, 1, 1)], names=("a", "b", "c")
31+
)
32+
tm.assert_index_equal(result, expected)
33+
34+
35+
def test_get_dummies_with_name_dummy(any_string_dtype):
36+
# GH 12180
37+
# Dummies named 'name' should work as expected
38+
s = Series(["a", "b,name", "b"], dtype=any_string_dtype)
39+
result = s.str.get_dummies(",")
40+
expected = DataFrame([[1, 0, 0], [0, 1, 1], [0, 1, 0]], columns=["a", "b", "name"])
41+
tm.assert_frame_equal(result, expected)
42+
43+
44+
def test_get_dummies_with_name_dummy_index():
45+
# GH 12180
46+
# Dummies named 'name' should work as expected
47+
idx = Index(["a|b", "name|c", "b|name"])
48+
result = idx.str.get_dummies("|")
49+
50+
expected = MultiIndex.from_tuples(
51+
[(1, 1, 0, 0), (0, 0, 1, 1), (0, 1, 0, 1)], names=("a", "b", "c", "name")
52+
)
53+
tm.assert_index_equal(result, expected)

pandas/tests/strings/test_strings.py

-53
Original file line number | Diff line number | Diff line change
@@ -303,50 +303,6 @@ def test_isnumeric(any_string_dtype):
303 303
tm.assert_series_equal(s.str.isdecimal(), Series(decimal_e, dtype=dtype))
304 304

305 305

306-
def test_get_dummies(any_string_dtype):
307-
s = Series(["a|b", "a|c", np.nan], dtype=any_string_dtype)
308-
result = s.str.get_dummies("|")
309-
expected = DataFrame([[1, 1, 0], [1, 0, 1], [0, 0, 0]], columns=list("abc"))
310-
tm.assert_frame_equal(result, expected)
311-
312-
s = Series(["a;b", "a", 7], dtype=any_string_dtype)
313-
result = s.str.get_dummies(";")
314-
expected = DataFrame([[0, 1, 1], [0, 1, 0], [1, 0, 0]], columns=list("7ab"))
315-
tm.assert_frame_equal(result, expected)
316-
317-
318-
def test_get_dummies_index():
319-
# GH9980, GH8028
320-
idx = Index(["a|b", "a|c", "b|c"])
321-
result = idx.str.get_dummies("|")
322-
323-
expected = MultiIndex.from_tuples(
324-
[(1, 1, 0), (1, 0, 1), (0, 1, 1)], names=("a", "b", "c")
325-
)
326-
tm.assert_index_equal(result, expected)
327-
328-
329-
def test_get_dummies_with_name_dummy(any_string_dtype):
330-
# GH 12180
331-
# Dummies named 'name' should work as expected
332-
s = Series(["a", "b,name", "b"], dtype=any_string_dtype)
333-
result = s.str.get_dummies(",")
334-
expected = DataFrame([[1, 0, 0], [0, 1, 1], [0, 1, 0]], columns=["a", "b", "name"])
335-
tm.assert_frame_equal(result, expected)
336-
337-
338-
def test_get_dummies_with_name_dummy_index():
339-
# GH 12180
340-
# Dummies named 'name' should work as expected
341-
idx = Index(["a|b", "name|c", "b|name"])
342-
result = idx.str.get_dummies("|")
343-
344-
expected = MultiIndex.from_tuples(
345-
[(1, 1, 0, 0), (0, 0, 1, 1), (0, 1, 0, 1)], names=("a", "b", "c", "name")
346-
)
347-
tm.assert_index_equal(result, expected)
348-
349-
350 306
def test_join():
351 307
values = Series(["a_b_c", "c_d_e", np.nan, "f_g_h"])
352 308
result = values.str.split("_").str.join("_")
@@ -782,15 +738,6 @@ def test_method_on_bytes():
782 738
lhs.str.cat(rhs)
783 739

784 740

785-
def test_casefold():
786-
# GH25405
787-
expected = Series(["ss", np.nan, "case", "ssd"])
788-
s = Series(["ß", np.nan, "case", "ßd"])
789-
result = s.str.casefold()
790-
791-
tm.assert_series_equal(result, expected)
792-
793-
794 741
def test_str_accessor_in_apply_func():
795 742
# https://github.com/pandas-dev/pandas/issues/38979
796 743
df = DataFrame(zip("abc", "def"))

0 commit comments

Comments
 (0)