137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222 | def build_tabular_adversarial_metadata(
*,
feature_names: list[str],
x_train,
continuous_columns: list[str] | tuple[str, ...] = (),
integer_columns: list[str] | tuple[str, ...] = (),
categorical_columns: list[str] | tuple[str, ...] = (),
perturbable_continuous_columns: list[str] | tuple[str, ...] = (),
perturbable_integer_columns: list[str] | tuple[str, ...] = (),
perturbable_categorical_columns: list[str] | tuple[str, ...] = (),
integer_step_by_column: dict[str, float] | None = None,
) -> dict[str, Any]:
"""Build tabular adversarial metadata from dataset-level perturbability lists."""
# Datasets should only decide which raw columns are perturbable. This helper
# maps that decision to the transformed feature vector consumed by the model.
_validate_perturbable_columns(
continuous_columns=continuous_columns,
integer_columns=integer_columns,
categorical_columns=categorical_columns,
perturbable_continuous_columns=perturbable_continuous_columns,
perturbable_integer_columns=perturbable_integer_columns,
perturbable_categorical_columns=perturbable_categorical_columns,
)
perturbable_continuous = set(perturbable_continuous_columns)
perturbable_integer = set(perturbable_integer_columns)
perturbable_categorical = set(perturbable_categorical_columns)
# Continuous/integer transformed features usually keep their raw column name
# after an optional transformer prefix, for example "integer__age".
continuous_features = [
idx
for idx, name in enumerate(feature_names)
if _raw_feature_name(name) in perturbable_continuous
]
integer_features = [
idx
for idx, name in enumerate(feature_names)
if _raw_feature_name(name) in perturbable_integer
]
# One raw categorical column becomes several one-hot features, for example
# "categorical__sex_Female" and "categorical__sex_Male".
categorical_features = [
idx
for idx, name in enumerate(feature_names)
if _categorical_column_name(name, categorical_columns) in perturbable_categorical
]
continuous_feature_set = set(continuous_features)
integer_feature_set = set(integer_features)
categorical_feature_set = set(categorical_features)
perturbable_feature_set = continuous_feature_set | integer_feature_set | categorical_feature_set
non_perturbable_features = [
idx
for idx in range(len(feature_names))
if idx not in perturbable_feature_set
]
categorical_groups = _categorical_groups(feature_names, perturbable_categorical)
integer_step_norm = _integer_step_norm(feature_names, integer_features, integer_step_by_column or {})
# The attack consumes only TabularAdversarialMetadata. The extra lists are
# returned so dataset wrappers and logs can expose the same mask clearly.
tabular_metadata = TabularAdversarialMetadata(
feature_names=feature_names,
feature_types=[
CONTINUOUS if idx in continuous_feature_set
else INTEGER if idx in integer_feature_set
else CATEGORICAL if idx in categorical_feature_set
else NON_PERTURBABLE
for idx in range(len(feature_names))
],
feature_min_norm=[float(value) for value in x_train.min(axis=0)],
feature_max_norm=[float(value) for value in x_train.max(axis=0)],
integer_step_norm=integer_step_norm,
categorical_groups=categorical_groups,
).to_dict()
return {
"continuous_features": continuous_features,
"integer_features": integer_features,
"categorical_features": categorical_features,
"non_perturbable_features": non_perturbable_features,
"categorical_groups": categorical_groups,
"integer_step_norm": integer_step_norm,
"tabular_metadata": tabular_metadata,
}
|