@@ -581,15 +581,15 @@ def fit(self, X, y):
581581 if self .categorical_features is not None : #if categorical features are specified, use those
582582 pipeline_steps .append (("impute_categorical" , tpot2 .builtin_modules .ColumnSimpleImputer (self .categorical_features , strategy = 'most_frequent' )))
583583 pipeline_steps .append (("impute_numeric" , tpot2 .builtin_modules .ColumnSimpleImputer ("numeric" , strategy = 'mean' )))
584- pipeline_steps .append (("ColumnOneHotEncoder" , tpot2 .builtin_modules .ColumnOneHotEncoder (self .categorical_features , strategy = 'most_frequent' )))
584+ pipeline_steps .append (("ColumnOneHotEncoder" , tpot2 .builtin_modules .ColumnOneHotEncoder (self .categorical_features , min_frequency = 0.0001 )))
585585
586586 else :
587587 if isinstance (X , pd .DataFrame ):
588588 categorical_columns = X .select_dtypes (include = ['object' ]).columns
589589 if len (categorical_columns ) > 0 :
590590 pipeline_steps .append (("impute_categorical" , tpot2 .builtin_modules .ColumnSimpleImputer ("categorical" , strategy = 'most_frequent' )))
591591 pipeline_steps .append (("impute_numeric" , tpot2 .builtin_modules .ColumnSimpleImputer ("numeric" , strategy = 'mean' )))
592- pipeline_steps .append (("ColumnOneHotEncoder" , tpot2 .builtin_modules .ColumnOneHotEncoder ("categorical" , strategy = 'most_frequent' )))
592+ pipeline_steps .append (("ColumnOneHotEncoder" , tpot2 .builtin_modules .ColumnOneHotEncoder ("categorical" , min_frequency = 0.0001 )))
593593 else :
594594 pipeline_steps .append (("impute_numeric" , tpot2 .builtin_modules .ColumnSimpleImputer ("all" , strategy = 'mean' )))
595595 else :
0 commit comments