# Fit numeric pipeline if self.numeric_features: self.num_imputer_.fit(X[self.numeric_features]) if self.scale: self.scaler_.fit(X[self.numeric_features])
# Imputers and scalers self.num_imputer_ = SimpleImputer(strategy='median') self.cat_imputer_ = SimpleImputer(strategy='most_frequent') self.scaler_ = StandardScaler() if self.scale else None FE Transformer Script
# Process categorical features if self.encode and self.categorical_features: cat_imputed = self.cat_imputer_.transform(X[self.categorical_features]) cat_encoded = self.encoder_.transform(cat_imputed) cat_cols = self.encoder_.get_feature_names_out(self.categorical_features) cat_df = pd.DataFrame(cat_encoded, columns=cat_cols, index=X.index) X_transformed = pd.concat([X_transformed, cat_df], axis=1) # Fit numeric pipeline if self
return self
# Process numeric features if self.numeric_features: num_data = self.num_imputer_.transform(X[self.numeric_features]) if self.scale: num_data = self.scaler_.transform(num_data) num_df = pd.DataFrame(num_data, columns=self.numeric_features, index=X.index) X_transformed = pd.concat([X_transformed, num_df], axis=1) index=X.index) X_transformed = pd.concat([X_transformed
# Fit encoder for categoricals if self.encode and self.categorical_features: self.encoder_ = OneHotEncoder(handle_unknown='ignore', sparse_output=False) self.encoder_.fit(X[self.categorical_features])