@@ -302,24 +302,22 @@ def test_dataframe_dummies_with_categorical(self, df, sparse, dtype):
302
302
expected .sort_index (axis = 1 )
303
303
assert_frame_equal (result , expected )
304
304
305
- def test_dataframe_dummies_unicode (self ):
306
- df = pd .DataFrame (({u'ä' : ['a' ]}))
307
- result = get_dummies (df )
308
- expected = pd .DataFrame ({u'ä_a' : [1 ]}, dtype = np .uint8 )
309
- assert_frame_equal (result , expected )
310
-
311
- df = pd .DataFrame ({'x' : [u'ä' ]})
312
- result = pd .get_dummies (df )
313
- expected = pd .DataFrame ({u'x_ä' : [1 ]}, dtype = np .uint8 )
314
- assert_frame_equal (result , expected )
315
-
316
- df = pd .DataFrame ({'x' : ['a' ]})
317
- result = pd .get_dummies (df , prefix = u'ä' )
318
- expected = pd .DataFrame ({u'ä_a' : [1 ]}, dtype = np .uint8 )
319
- assert_frame_equal (result , expected )
320
-
321
- result = pd .get_dummies (df , prefix_sep = u'ä' )
322
- expected = pd .DataFrame ({u'xäa' : [1 ]}, dtype = np .uint8 )
305
@pytest.mark.parametrize(
    'get_dummies_kwargs,expected',
    [
        # Non-ASCII character in the input column name.
        ({'data': pd.DataFrame({u'ä': ['a']})},
         pd.DataFrame({u'ä_a': [1]}, dtype=np.uint8)),

        # Non-ASCII character in the cell value being encoded.
        ({'data': pd.DataFrame({'x': [u'ä']})},
         pd.DataFrame({u'x_ä': [1]}, dtype=np.uint8)),

        # Non-ASCII character passed as ``prefix``.
        ({'data': pd.DataFrame({'x': [u'a']}), 'prefix': u'ä'},
         pd.DataFrame({u'ä_a': [1]}, dtype=np.uint8)),

        # Non-ASCII character passed as ``prefix_sep``.
        ({'data': pd.DataFrame({'x': [u'a']}), 'prefix_sep': u'ä'},
         pd.DataFrame({u'xäa': [1]}, dtype=np.uint8)),
    ])
def test_dataframe_dummies_unicode(self, get_dummies_kwargs, expected):
    # GH22084 pd.get_dummies incorrectly encodes unicode characters
    # in dataframe column names
    #
    # Each case forwards its keyword arguments unchanged to get_dummies
    # and compares the resulting frame with the expected uint8 frame.
    dummies = get_dummies(**get_dummies_kwargs)
    assert_frame_equal(dummies, expected)
324
322
325
323
def test_basic_drop_first (self , sparse ):
0 commit comments