Skip to content

Commit 68d6b4c

Browse files
committed
Add test for non-ascii variable names extraction.
1 parent 3208a79 commit 68d6b4c

File tree

1 file changed

+10
-0
lines changed

1 file changed

+10
-0
lines changed

tests/test_dataframe_mapper.py

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,5 @@
1+
# -*- coding: utf8 -*-
2+
13
import pytest
24
from pkg_resources import parse_version
35

@@ -128,6 +130,14 @@ def test_transformed_names_binarizer(complex_dataframe):
128130
assert mapper.transformed_names_ == ['target_a', 'target_b', 'target_c']
129131

130132

133+
def test_transformed_names_binarizer_unicode():
    """
    Binarizing a column whose labels are non-ASCII strings must yield
    transformed names made of the column name, an underscore and the label.
    """
    # Single-column frame whose three labels are all accented characters.
    frame = pd.DataFrame({'target': [u'ñ', u'á', u'é']})
    binarizing_mapper = DataFrameMapper([('target', LabelBinarizer())])
    binarizing_mapper.fit_transform(frame)
    # Compared as sets, so the order of the generated names is not checked.
    produced_names = set(binarizing_mapper.transformed_names_)
    assert produced_names == {u'target_ñ', u'target_á', u'target_é'}
139+
140+
131141
def test_transformed_names_transformers_list(complex_dataframe):
132142
"""
133143
When using a list of transformers, use them in inverse order to get the

0 commit comments

Comments
 (0)