Ejemplo n.º 1
0
    def test_get_available_components(self):
        # Target type
        for target_type, num_values in [('classification', 15),
                                        ('regression', 14)]:
            data_properties = {'target_type': target_type}

            available_components = fp.FeaturePreprocessorChoice(data_properties)\
                .get_available_components(data_properties)

            self.assertEqual(len(available_components), num_values)

        # Multiclass
        data_properties = {'target_type': 'classification',
                           'multiclass': True}
        available_components = fp.FeaturePreprocessorChoice(data_properties) \
            .get_available_components(data_properties)

        self.assertEqual(len(available_components), 15)

        # Multilabel
        data_properties = {'target_type': 'classification',
                           'multilabel': True}
        available_components = fp.FeaturePreprocessorChoice(data_properties) \
            .get_available_components(data_properties)

        self.assertEqual(len(available_components), 12)
Ejemplo n.º 2
0
    def _get_pipeline(self, init_params=None):
        steps = []

        default_dataset_properties = {'target_type': 'regression'}

        # Add the always active preprocessing components
        if init_params is not None and 'one_hot_encoding' in init_params:
            ohe_init_params = init_params['one_hot_encoding']
            if 'categorical_features' in ohe_init_params:
                categorical_features = ohe_init_params['categorical_features']
        else:
            categorical_features = None

        steps.extend(
            [["categorical_encoding", OHEChoice(default_dataset_properties)],
             ["imputation", Imputation()],
             ["variance_threshold", VarianceThreshold()],
             ["rescaling", rescaling_components.RescalingChoice(
                 default_dataset_properties)]])

        # Add the preprocessing component
        steps.append(['preprocessor',
                      feature_preprocessing_components.FeaturePreprocessorChoice(
                          default_dataset_properties)])

        # Add the classification component
        steps.append(['regressor',
                      regression_components.RegressorChoice(
                          default_dataset_properties)])
        return steps
Ejemplo n.º 3
0
    def _get_pipeline(self):
        steps = []

        default_dataset_properties = {'target_type': 'classification'}

        # Add the always active preprocessing components

        steps.extend([["one_hot_encoding", OneHotEncoder()],
                      ["imputation", Imputation()],
                      [
                          "rescaling",
                          rescaling_components.RescalingChoice(
                              default_dataset_properties)
                      ], ["balancing", Balancing()]])

        # Add the preprocessing component
        steps.append([
            'preprocessor',
            feature_preprocessing_components.FeaturePreprocessorChoice(
                default_dataset_properties)
        ])

        # Add the classification component
        steps.append([
            'classifier',
            classification_components.ClassifierChoice(
                default_dataset_properties)
        ])
        return steps
Ejemplo n.º 4
0
    def _get_pipeline_steps(self, dataset_properties):
        steps = []

        default_dataset_properties = {'target_type': 'classification'}
        if dataset_properties is not None and isinstance(
                dataset_properties, dict):
            default_dataset_properties.update(dataset_properties)

        steps.extend(
            [[
                "data_preprocessing",
                DataPreprocessor(dataset_properties=default_dataset_properties)
            ], ["balancing", Balancing()],
             [
                 "feature_preprocessor",
                 feature_preprocessing_components.FeaturePreprocessorChoice(
                     default_dataset_properties)
             ],
             [
                 'classifier',
                 classification_components.ClassifierChoice(
                     default_dataset_properties)
             ]])

        return steps
Ejemplo n.º 5
0
    def _get_pipeline_steps(self, dataset_properties, init_params=None):
        steps = []

        default_dataset_properties = {'target_type': 'regression'}
        if dataset_properties is not None and isinstance(
                dataset_properties, dict):
            default_dataset_properties.update(dataset_properties)

        steps.extend(
            [[
                'data_preprocessing',
                DataPreprocessor(dataset_properties=default_dataset_properties)
            ],
             [
                 'feature_preprocessor',
                 feature_preprocessing_components.FeaturePreprocessorChoice(
                     default_dataset_properties)
             ],
             [
                 'regressor',
                 regression_components.RegressorChoice(
                     default_dataset_properties)
             ]])

        return steps
Ejemplo n.º 6
0
    def _get_pipeline_steps(self):
        steps = []
        print(" going execute pipeline autosklearn")
        default_dataset_properties = {'target_type': 'classification'}

        steps.extend([
            ["feature_preprocessor",
             feature_preprocessing_components.FeaturePreprocessorChoice(
                 default_dataset_properties)],
            ["data_preprocessing",
                DataPreprocessor(dataset_properties=default_dataset_properties)],
            ["balancing",
                Balancing()],
            ['classifier',
                classification_components.ClassifierChoice(
                    default_dataset_properties)]
        ])

        return steps