Python convert_configurations_to_array Examples, solnml.components.utils.mfse_utils.config_space_utils.convert_configurations_to_array Python Examples

Example #1

0

Show file

File: acq_optimizer.py Project: williamy1996/AutoExpression

    def maximize(self, batch_size=1):
        """
        Pick the candidates with the largest acquisition values.

        The candidate pool is the one-exchange neighbourhood of the current
        incumbent (``self.objective_func.eta['config']``) followed by
        ``self.n_samples - <number of neighbours>`` configurations obtained
        from ``sample_configurations`` on ``self.config_space``.

        Parameters
        ----------
        batch_size: number of maximizers returned.

        Returns
        -------
        list
            Up to ``batch_size`` configurations from the pool, ordered from
            the highest acquisition value downwards.
        """
        incumbent = self.objective_func.eta['config']
        neighbour_seed = self.rng.randint(int(1e6))
        pool = list(get_one_exchange_neighbourhood(incumbent,
                                                   seed=neighbour_seed))
        neighbour_array = convert_configurations_to_array(pool)

        # Fill the remainder of the pool with sampled configurations.
        n_random = self.n_samples - neighbour_array.shape[0]
        sampled = sample_configurations(self.config_space, n_random)
        sampled_array = convert_configurations_to_array(sampled)
        pool.extend(sampled)

        # Rows of the stacked array line up with the entries of ``pool``.
        stacked = np.concatenate((neighbour_array, sampled_array), axis=0)
        scores = self.objective_func(stacked).flatten()

        # Negate so that the ascending argsort lists the largest scores first.
        ranked = np.argsort(-scores)[:batch_size]
        return [pool[position] for position in ranked]

Example #2

0

Show file

    def maximize(self, batch_size=1):
        """
        Maximizes the given acquisition function.

        Candidates are the one-exchange neighbours of the current incumbent
        (``self.objective_func.eta['config']``) plus
        ``self.n_samples - <number of neighbours>`` configurations obtained
        from ``sample_configurations`` on ``self.config_space``.

        Parameters
        ----------
        batch_size: number of maximizers returned.

        Returns
        -------
        list
            The ``batch_size`` candidate configurations with the highest
            acquisition values, best first. For ``batch_size == 1`` this is a
            one-element list holding the arg-max candidate.
        """
        incs_configs = list(
            get_one_exchange_neighbourhood(self.objective_func.eta['config'],
                                           seed=self.rng.randint(int(1e6))))
        # TODO: pad the neighbourhood with random neighbours of the incumbent
        # up to a fixed share of n_samples (not implemented yet).

        configs_list = list(incs_configs)
        rand_incs = convert_configurations_to_array(configs_list)

        # Sample random points uniformly over the whole space
        rand_configs = sample_configurations(
            self.config_space, self.n_samples - rand_incs.shape[0])
        rand = convert_configurations_to_array(rand_configs)

        configs_list.extend(rand_configs)

        # TODO: Put a Gaussian on the incumbent and sample from that
        # (support categorical feature).

        X = np.concatenate((rand_incs, rand), axis=0)
        # Flatten so that a column-shaped result is ranked across candidates
        # rather than along its trailing axis.
        y = np.asarray(self.objective_func(X)).flatten()
        if batch_size == 1:
            return [configs_list[np.argmax(y)]]

        # A Python list cannot be indexed with an index array, so pick the
        # top-k entries one by one (largest acquisition value first).
        best_first = np.argsort(-y)[:batch_size]
        return [configs_list[idx] for idx in best_first]

Example #3

0

Show file

File: mfse_optimizer.py Project: yunx-z/soln-ml

    def fetch_candidate_configurations(self, num_config):
        """
        Propose ``num_config`` configurations for the next round.

        When nothing has been recorded yet for the last entry of
        ``self.iterate_r``, the proposals come straight from
        ``sample_configurations``. Otherwise the acquisition optimizer is
        queried one configuration at a time (at most ``3 * num_config``
        queries), duplicates are discarded, and any shortfall is filled by
        ``expand_configurations``.
        """
        if len(self.target_y[self.iterate_r[-1]]) == 0:
            return sample_configurations(self.config_space, num_config)

        proposals = []
        attempts = 0
        print(num_config)
        while len(proposals) < num_config and attempts < 3 * num_config:
            # Incumbent = observation with the smallest recorded objective
            # at the last entry of iterate_r.
            top_r = self.iterate_r[-1]
            best_pos = np.argmin(self.target_y[top_r])
            best_config = self.target_x[top_r][best_pos]
            predicted = self.weighted_surrogate.predict(
                convert_configurations_to_array([best_config]))[0]
            incumbent = {'config': best_config, 'obj': predicted}

            self.weighted_acquisition_func.update(
                model=self.weighted_surrogate, eta=incumbent)
            suggestion = self.weighted_acq_optimizer.maximize(batch_size=1)[0]

            attempts += 1
            if suggestion in proposals:
                continue
            proposals.append(suggestion)

        if len(proposals) < num_config:
            # Not enough distinct suggestions: top the list up.
            proposals = expand_configurations(proposals,
                                              self.config_space,
                                              num_config)

        return proposals

Example #4

0

Show file

File: mfsebase.py Project: williamy1996/AutoExpression

    def fetch_candidate_configurations(self, num_config):
        """
        Propose ``num_config`` configurations for the next round.

        With no observations at the last entry of ``self.iterate_r`` the
        proposals come from ``sample_configurations``. Otherwise the
        acquisition optimizer supplies a batch of ``num_config`` suggestions;
        the first ``self.eta * self.eta`` are always kept, and each remaining
        slot is filled either with a freshly sampled configuration
        (probability 0.3) or with the next unused suggestion.
        """
        if len(self.target_y[self.iterate_r[-1]]) == 0:
            return sample_configurations(self.config_space, num_config)

        # Incumbent: the observation with the smallest objective (lower is
        # better) at the last entry of iterate_r.
        top_r = self.iterate_r[-1]
        best_pos = np.argmin(self.target_y[top_r])
        best_config = self.target_x[top_r][best_pos]
        predicted = self.weighted_surrogate.predict(
            convert_configurations_to_array([best_config]))[0]
        incumbent = {'config': best_config, 'obj': predicted}
        self.weighted_acquisition_func.update(model=self.weighted_surrogate,
                                              eta=incumbent)

        suggestions = self.weighted_acq_optimizer.maximize(
            batch_size=num_config)

        n_acq = self.eta * self.eta
        if num_config <= n_acq:
            return suggestions

        p_threshold = 0.3
        chosen = suggestions[:n_acq]
        next_suggestion = n_acq
        for _ in range(num_config - n_acq):
            if rd.random() >= p_threshold:
                # Take the next suggestion from the acquisition batch.
                pick = suggestions[next_suggestion]
                next_suggestion += 1
            else:
                # Replace this slot with a sampled configuration.
                pick = sample_configurations(self.config_space, 1)[0]
            chosen.append(pick)
        return chosen

Example #5

0

Show file

File: mfse_optimizer.py Project: yunx-z/soln-ml

    def _iterate(self, s, skip_last=0):
        """
        Run one bracket: evaluate a batch of configurations over several
        rounds, shrinking the batch and growing the resource each round,
        then retrain the surrogates on the collected observations.

        Parameters
        ----------
        s: exponent used to derive the initial batch size ``n`` and the
            initial resource ``r`` from ``self.B``, ``self.R`` and
            ``self.eta``; the bracket runs ``(s + 1) - int(skip_last)`` rounds.
        skip_last: number of trailing rounds to leave out.

        The method returns nothing; results are accumulated in
        ``self.target_x`` / ``self.target_y`` and, for full-resource rounds,
        in ``self.incumbent_configs`` / ``self.incumbent_perfs``.
        """
        # Refresh the surrogate weights once the call counter has passed
        # s_max; the counter itself advances on every call.
        if self.weight_update_id > self.s_max:
            self.update_weight()
        self.weight_update_id += 1

        # Set initial number of configurations
        n = int(ceil(self.B / self.R / (s + 1) * self.eta**s))
        # initial number of iterations per config
        r = int(self.R * self.eta**(-s))

        # Choose a batch of configurations in different mechanisms.
        # The selection is timed only for the log message below.
        start_time = time.time()
        T = self.fetch_candidate_configurations(n)
        time_elapsed = time.time() - start_time
        self.logger.info("Choosing next configurations took %.2f sec." %
                         time_elapsed)

        for i in range((s + 1) - int(skip_last)):  # changed from s + 1

            # Run each of the n configs for <iterations>
            # and keep best (n_configs / eta) configurations

            # Nominal batch size and resource for round i (both may be
            # non-integer; they are truncated with int() where needed).
            n_configs = n * self.eta**(-i)
            n_resource = r * self.eta**i

            self.logger.info("MFSE: %d configurations x size %f each" %
                             (int(n_configs), float(n_resource / self.R)))

            # The resource is handed to the executor as a fraction of R.
            val_losses = self.executor.parallel_execute(
                T, subsample_ratio=float(n_resource / self.R))

            # Record the observations under the (truncated) resource level.
            self.target_x[int(n_resource)].extend(T)
            self.target_y[int(n_resource)].extend(val_losses)

            # Rounds run at the full resource R also feed the incumbent lists.
            if int(n_resource) == self.R:
                self.incumbent_configs.extend(T)
                self.incumbent_perfs.extend(val_losses)

            # Select a number of best configurations for the next loop.
            # Filter out early stops, if any.
            # argsort is ascending, so the smallest losses come first.
            indices = np.argsort(val_losses)
            if len(T) >= self.eta:
                T = [T[i] for i in indices]
                reduced_num = int(n_configs / self.eta)
                T = T[0:reduced_num]
            else:
                # Fewer than eta configurations left: keep only the best one.
                T = [T[indices[0]]]
        # Retrain the surrogate for every resource level from r upwards
        # (raises ValueError if r is not listed in iterate_r).
        for item in self.iterate_r[self.iterate_r.index(r):]:
            # NORMALIZE Objective value: MinMax linear normalization
            normalized_y = minmax_normalization(self.target_y[item])
            self.weighted_surrogate.train(convert_configurations_to_array(
                self.target_x[item]),
                                          np.array(normalized_y,
                                                   dtype=np.float64),
                                          r=item)

Example #6

0

Show file

File: mfse_optimizer.py Project: yunx-z/soln-ml

    def update_weight(self):
        """
        Recompute the weight of every basic surrogate from how well it
        preserves the ordering of the observations at the last entry of
        ``self.iterate_r``.

        For every surrogate except the last one in
        ``self.weighted_surrogate.surrogate_r`` the score is the fraction of
        order-preserving pairs between its predictions and the observed
        values. The last surrogate is scored on 5-fold cross-validated
        predictions of a fresh ``RandomForestWithInstances`` (score 0 when
        fewer than ``2 * 5`` observations exist). Scores are raised to the
        power ``p = 3`` and normalised to sum to one.

        With fewer than three observations, or when the scores cannot be
        normalised (their powered sum is zero or NaN), the current weights
        are kept. The resulting weights are logged, written back to
        ``self.weighted_surrogate.surrogate_weight`` and appended to
        ``self.hist_weights``.
        """
        max_r = self.iterate_r[-1]
        test_x = convert_configurations_to_array(self.target_x[max_r])
        test_y = np.array(self.target_y[max_r], dtype=np.float64)

        r_list = self.weighted_surrogate.surrogate_r
        K = len(r_list)
        p = 3
        fold_num = 5

        new_weights = None
        if len(test_y) >= 3:
            preserving_order_p = list()
            for i, r in enumerate(r_list):
                if i != K - 1:
                    mean, _ = self.weighted_surrogate.surrogate_container[
                        r].predict(test_x)
                    tmp_y = np.reshape(mean, -1)
                    preorder_num, pair_num = self.calculate_preserving_order_num(
                        tmp_y, test_y)
                    preserving_order_p.append(preorder_num / pair_num)
                elif len(test_y) < 2 * fold_num:
                    # Too few observations for a meaningful cross validation.
                    preserving_order_p.append(0)
                else:
                    # 5-fold cross validation.
                    kfold = KFold(n_splits=fold_num)
                    # Float buffer: an integer array would silently truncate
                    # the predictions and distort the ranking comparison.
                    cv_pred = np.zeros(len(test_y), dtype=np.float64)
                    types, bounds = get_types(self.config_space)
                    for train_idx, valid_idx in kfold.split(test_x):
                        _surrogate = RandomForestWithInstances(
                            types=types, bounds=bounds)
                        _surrogate.train(test_x[train_idx], test_y[train_idx])
                        pred, _ = _surrogate.predict(test_x[valid_idx])
                        cv_pred[valid_idx] = pred.reshape(-1)
                    preorder_num, pair_num = self.calculate_preserving_order_num(
                        cv_pred, test_y)
                    preserving_order_p.append(preorder_num / pair_num)

            powered = np.power(np.array(preserving_order_p), p)
            power_sum = np.sum(powered)
            # A zero (or NaN) sum cannot be normalised; dividing by it would
            # hand NaN weights to every surrogate.
            if power_sum > 0:
                new_weights = powered / power_sum

        if new_weights is None:
            # Keep the weights currently assigned to the surrogates.
            new_weights = [
                self.weighted_surrogate.surrogate_weight[r] for r in r_list
            ]

        self.logger.info(' %d-th Updating weights: %s' %
                         (self.weight_changed_cnt, str(new_weights)))

        # Assign the weight to each basic surrogate.
        for i, r in enumerate(r_list):
            self.weighted_surrogate.surrogate_weight[r] = new_weights[i]
        self.weight_changed_cnt += 1
        # Save the weight data.
        self.hist_weights.append(new_weights)

Example #7

0

Show file

File: mfsebase.py Project: williamy1996/AutoExpression

    def update_weight(self):
        """
        Recompute the weight of every basic surrogate by sampling.

        Predictive means and standard deviations are collected on the
        observations at the last entry of ``self.iterate_r``: directly from
        each stored surrogate except the last one in
        ``self.weighted_surrogate.surrogate_r``, and from held-out folds of a
        fresh ``RandomForestWithInstances`` for the last one. Then, 100 times,
        one outcome vector per surrogate is drawn from the corresponding
        normal distributions, its ranking loss (number of ordered pairs whose
        order disagrees with the observations) is computed, and the surrogate
        with the smallest loss gets a vote. The new weights are the vote
        fractions.

        With fewer than three observations the current weights are kept. The
        weights are logged, written back to
        ``self.weighted_surrogate.surrogate_weight`` and appended to
        ``self.hist_weights``.
        """
        max_r = self.iterate_r[-1]
        incumbent_configs = self.target_x[max_r]
        test_x = convert_configurations_to_array(incumbent_configs)
        test_y = np.array(self.target_y[max_r], dtype=np.float64)

        r_list = self.weighted_surrogate.surrogate_r
        K = len(r_list)
        if len(test_y) >= 3:
            n_sampling = 100
            argmin_cnt = [0] * K
            predictive_mu, predictive_std = list(), list()
            n_instance = len(test_y)
            # Never use more folds than instances: with 3 or 4 observations a
            # fixed 5-fold split yields empty folds and a final fold that
            # removes every training instance.
            n_fold = min(5, n_instance)
            for surrogate_idx, r in enumerate(r_list):
                if surrogate_idx != K - 1:
                    _mean, _var = self.weighted_surrogate.surrogate_container[
                        r].predict(test_x)
                    predictive_mu.append(_mean)
                    predictive_std.append(np.sqrt(_var))
                else:
                    fold_size = n_instance // n_fold
                    target_mu, target_std = list(), list()
                    types, bounds = get_types(self.config_space)
                    for fold_id in range(n_fold):
                        start_id = fold_id * fold_size
                        # The last fold absorbs the remainder.
                        if fold_id == n_fold - 1:
                            end_id = n_instance
                        else:
                            end_id = start_id + fold_size
                        train_idx = (list(range(start_id)) +
                                     list(range(end_id, n_instance)))
                        _surrogate = RandomForestWithInstances(types=types,
                                                               bounds=bounds)
                        _surrogate.train(test_x[train_idx, :],
                                         test_y[train_idx])
                        _mu, _var = _surrogate.predict(
                            test_x[start_id:end_id])
                        target_mu.extend(_mu.flatten())
                        target_std.extend(np.sqrt(_var).flatten())
                    predictive_mu.append(target_mu)
                    predictive_std.append(target_std)

            # Pairwise order of the observations; entry (a, b) is True when
            # observation a is strictly smaller than observation b.
            true_order = test_y[:, None] < test_y[None, :]
            for _ in range(n_sampling):
                ranking_loss_list = list()
                for surrogate_idx in range(K):
                    sampled_y = np.ravel(
                        np.random.normal(predictive_mu[surrogate_idx],
                                         predictive_std[surrogate_idx]))
                    sampled_order = sampled_y[:, None] < sampled_y[None, :]
                    # Count the ordered pairs on which the two orders disagree.
                    rank_loss = int(np.sum(true_order ^ sampled_order))
                    ranking_loss_list.append(rank_loss)

                argmin_id = np.argmin(ranking_loss_list)
                argmin_cnt[argmin_id] += 1

            new_weights = np.array(argmin_cnt) / n_sampling

        else:
            # Too few observations: keep the weights currently assigned.
            new_weights = [
                self.weighted_surrogate.surrogate_weight[r] for r in r_list
            ]

        self.logger.info('Model weights[%d]: %s' %
                         (self.weight_changed_cnt, str(new_weights)))
        # Assign the weight to each basic surrogate.
        for weight_idx, r in enumerate(r_list):
            self.weighted_surrogate.surrogate_weight[r] = new_weights[weight_idx]
        self.weight_changed_cnt += 1
        # Save the weight data.
        self.hist_weights.append(new_weights)