EpistasisLab · jhmenke · Jan 14, 2020 · Jan 20, 2020 · Jan 20, 2020 · Jan 20, 2020
diff --git a/tpot/base.py b/tpot/base.py
@@ -491,8 +491,7 @@ def _setup_toolbox(self):
             self._toolbox.register('expr_mut', self._gen_grow_safe, min_=self._min, max_=self._max)
         self._toolbox.register('mutate', self._random_mutation_operator)
 
-
-    def _fit_init(self):
+    def _fit_init(self, multi_output_target: bool = False):
         # initialization for fit function
         if not self.warm_start or not hasattr(self, '_pareto_front'):
             self._pop = []
@@ -501,6 +500,35 @@ def _fit_init(self):
             self._last_optimized_pareto_front_n_gens = 0
             self._setup_config(self.config_dict)
 
+            if multi_output_target:
+                single_output_classifiers = [
+                    'sklearn.naive_bayes.MultinomialNB',
+                    'sklearn.svm.LinearSVC',
+                    'xgboost.XGBClassifier'
+                ]
+                single_output_regressors = [
+                    'sklearn.ensemble.AdaBoostRegressor',
+                    'sklearn.linear_model.LassoLarsCV',
+                    'sklearn.linear_model.ElasticNetCV',
+                    'sklearn.svm.LinearSVR',
+                    'xgboost.XGBRegressor',
+                    'sklearn.linear_model.SGDRegressor'
+                ]
+                for model in list(self._config_dict.keys()):
+                    if model in single_output_classifiers:
+                        if 'sklearn.multioutput.MultiOutputClassifier' not in self._config_dict.keys():
+                            self._config_dict['sklearn.multioutput.MultiOutputClassifier'] = {"estimator": {}}
+                        self._config_dict['sklearn.multioutput.MultiOutputClassifier']['estimator'][model] = self._config_dict[model]
+                        self._config_dict.pop(model, None)
+                    elif model in single_output_regressors:
+                        if 'sklearn.multioutput.MultiOutputRegressor' not in self._config_dict.keys():
+                            self._config_dict['sklearn.multioutput.MultiOutputRegressor'] = {"estimator": {}}
+                        if model == 'sklearn.linear_model.ElasticNetCV':
+                            self._config_dict['sklearn.linear_model.MultiTaskElasticNetCV'] = self._config_dict[model]
+                        else:
+                            self._config_dict['sklearn.multioutput.MultiOutputRegressor']['estimator'][model] = self._config_dict[model]
+                        self._config_dict.pop(model, None)
+
             self._setup_template(self.template)
 
             self.operators = []
@@ -622,7 +650,7 @@ def fit(self, features, target, sample_weight=None, groups=None):
             Returns a copy of the fitted TPOT object
 
         """
-        self._fit_init()
+        self._fit_init(multi_output_target=len(target.shape) > 1 and target.shape[1] > 1)
         features, target = self._check_dataset(features, target, sample_weight)
 
 
@@ -792,10 +820,11 @@ def _update_top_pipeline(self):
             if not self._optimized_pipeline:
                 raise RuntimeError('There was an error in the TPOT optimization '
                                    'process. This could be because the data was '
-                                   'not formatted properly, or because data for '
+                                   'not formatted properly, because data for '
                                    'a regression problem was provided to the '
-                                   'TPOTClassifier object. Please make sure you '
-                                   'passed the data to TPOT correctly.')
+                                   'TPOTClassifier object, or an error in a '
+                                   'custom scoring function. Please make sure '
+                                   'you passed the data to TPOT correctly.')
             else:
                 pareto_front_wvalues = [pipeline_scores.wvalues[1] for pipeline_scores in self._pareto_front.keys]
                 if not self._last_optimized_pareto_front:
@@ -1157,7 +1186,7 @@ def _check_dataset(self, features, target, sample_weight=None):
 
         try:
             if target is not None:
-                X, y = check_X_y(features, target, accept_sparse=True, dtype=None)
+                X, y = check_X_y(features, target, accept_sparse=True, dtype=None, multi_output=len(target.shape) > 1 and target.shape[1] > 1)
                 if self._imputed:
                     return X, y
                 else:

diff --git a/tpot/operator_utils.py b/tpot/operator_utils.py
@@ -212,7 +212,7 @@ def op_type(cls):
                 for dkey, dval in prange.items():
                     dep_import_str, dep_op_str, dep_op_obj = source_decode(dkey, verbose=verbose)
                     if dep_import_str in import_hash:
-                        import_hash[import_str].append(dep_op_str)
+                        import_hash[dep_import_str].append(dep_op_str)
                     else:
                         import_hash[dep_import_str] = [dep_op_str]
                     dep_op_list[pname] = dep_op_str