@@ -22,7 +22,7 @@ types that are in `Char`, `AbstractString`, and `Number`.
22
22
23
23
# Returns (in a dict)
24
24
25
- - `new_cat_given_col_val `: A dictionary that for each column, maps `missing` into some value according to `label_for_missing`
25
+ - `label_for_missing_given_feature`: A dictionary that, for each column, maps `missing` to a value chosen according to `label_for_missing`
26
26
- `encoded_features`: The subset of the categorical features of X that were encoded
27
27
"""
28
28
function missingness_encoder_fit (
@@ -74,26 +74,26 @@ function missingness_encoder_fit(
74
74
end
75
75
76
76
# Nonmissing levels remain as is
77
- new_cat_given_col_val = Dict {Missing, col_type} ()
77
+ label_for_missing_given_feature = Dict {Missing, col_type} ()
78
78
79
79
# Missing levels are mapped
80
80
if elgrandtype in keys (label_for_missing)
81
- new_cat_given_col_val [missing ] = label_for_missing[elgrandtype]
81
+ label_for_missing_given_feature [missing ] = label_for_missing[elgrandtype]
82
82
elseif elgrandtype == Number
83
- new_cat_given_col_val [missing ] = minimum (feat_levels) - 1
83
+ label_for_missing_given_feature [missing ] = minimum (feat_levels) - 1
84
84
else
85
85
throw (ArgumentError (UNSPECIFIED_COL_TYPE_ME (col_type, label_for_missing)))
86
86
end
87
87
88
- return new_cat_given_col_val :: Dict{Missing, col_type}
88
+ return label_for_missing_given_feature :: Dict{Missing, col_type}
89
89
end
90
90
91
91
# 2. Pass it to generic_fit
92
- new_cat_given_col_val , encoded_features = generic_fit (
92
+ label_for_missing_given_feature , encoded_features = generic_fit (
93
93
X, features; ignore = ignore, ordered_factor = ordered_factor, feature_mapper = feature_mapper,
94
94
)
95
95
cache = Dict (
96
- :new_cat_given_col_val => new_cat_given_col_val ,
96
+ :label_for_missing_given_feature => label_for_missing_given_feature ,
97
97
:encoded_features => encoded_features,
98
98
)
99
99
return cache
@@ -115,7 +115,7 @@ Apply a fitted missingness encoder to a table given the output of `missingness_e
115
115
- `X_tr`: The table with selected features after the selected features are transformed by the missingness encoder
116
116
"""
117
117
function missingness_encoder_transform(X, cache::Dict)
    # The fit step stores the mapping for `missing` under this cache key; it is
    # looked up here and handed straight to the shared transform routine.
    # `ignore_unknown = true` is forwarded unchanged to `generic_transform`.
    return generic_transform(
        X,
        cache[:label_for_missing_given_feature];
        ignore_unknown = true,
    )
end
121
121
0 commit comments