Exemplo n.º 1
0
 def load_gird_search(self, model, param_grid):
     my_loader = Loader()
     train, valid, test = my_loader.load_data('data/train.csv',
                                              'data/test.csv')
     X_train, y_train, y_train_registered, y_train_casual = my_loader.create_data(
         train, self.input_cols)
     self.find_optimal_parameters(X_train, y_train_registered, model,
                                  param_grid)
     self.find_optimal_parameters(X_train, y_train_casual, model,
                                  param_grid)
Exemplo n.º 2
0
    def train(self, path_train, path_test):
        my_loader = Loader()
        train, valid, _ = my_loader.load_data(path_train, path_test)
        X_train, y_train, y_train_registered, y_train_casual = my_loader.create_data(
            train, self.input_cols)
        X_valid, y_valid, y_valid_registered, y_valid_casual = my_loader.create_data(
            valid, self.input_cols)

        model_registered = self.gradient_boosting_train(
            X_train, y_train_registered)
        y_predict_registered = np.exp(
            self.model_predict(model_registered, X_valid)) - 1

        model_casual = self.gradient_boosting_train(X_train, y_train_casual)
        y_predict_casual = np.exp(self.model_predict(model_casual,
                                                     X_valid)) - 1

        y_predict_count = np.round(y_predict_registered + y_predict_casual)

        rmsle = self.get_rmsle(
            y_predict_count,
            np.exp(y_valid_registered) + np.exp(y_valid_casual) - 2)
        print(rmsle)
        self.predict(path_test, model_registered, model_casual)