@@ -302,24 +302,22 @@ def test_dataframe_dummies_with_categorical(self, df, sparse, dtype):
302302 expected .sort_index (axis = 1 )
303303 assert_frame_equal (result , expected )
304304
@pytest.mark.parametrize('get_dummies_kwargs,expected', [
    # Unicode character in the source column name.
    ({'data': pd.DataFrame({u'ä': ['a']})},
     pd.DataFrame({u'ä_a': [1]}, dtype=np.uint8)),

    # Unicode character in the encoded value.
    ({'data': pd.DataFrame({'x': [u'ä']})},
     pd.DataFrame({u'x_ä': [1]}, dtype=np.uint8)),

    # Unicode character supplied through ``prefix``.
    ({'data': pd.DataFrame({'x': [u'a']}), 'prefix': u'ä'},
     pd.DataFrame({u'ä_a': [1]}, dtype=np.uint8)),

    # Unicode character supplied through ``prefix_sep``.
    ({'data': pd.DataFrame({'x': [u'a']}), 'prefix_sep': u'ä'},
     pd.DataFrame({u'xäa': [1]}, dtype=np.uint8))])
def test_dataframe_dummies_unicode(self, get_dummies_kwargs, expected):
    """Check the dummy column names built from unicode inputs.

    Each parametrized case passes ``get_dummies_kwargs`` straight to
    ``get_dummies`` and compares the result with ``expected``, a
    single-row ``uint8`` frame whose only column carries the expected
    unicode name.
    """
    # GH22084 pd.get_dummies incorrectly encodes unicode characters
    # in dataframe column names
    result = get_dummies(**get_dummies_kwargs)
    assert_frame_equal(result, expected)
324322
325323 def test_basic_drop_first (self , sparse ):
0 commit comments