def __getFillnaMedian(self, _df):
    """Fill missing values of ``_df`` with the ``'median'`` strategy.

    Thin wrapper: forwards ``_df`` and the strategy name to
    ``self.__getFillMissingData`` and returns whatever that helper returns.
    """
    return self.__getFillMissingData(_df, 'median')


def __getFillnaFrequent(self, _df):
    """Fill missing values of ``_df`` with the ``'most_frequent'`` strategy.

    Thin wrapper: forwards ``_df`` and the strategy name to
    ``self.__getFillMissingData`` and returns whatever that helper returns.
    """
    return self.__getFillMissingData(_df, 'most_frequent')


def __getFillnaIterative(self, _df):
    """Fill missing values of ``_df`` via ``self.__fillIterativeImputer``.

    Returns the helper's result unchanged.
    """
    return self.__fillIterativeImputer(_df)


def getMissingDataMethodList(self):
    """Return the available missing-data handlers keyed by display label.

    Returns:
        dict: label (``str``) -> handler attribute of ``self``. Every handler
        visible in this section takes a single ``_df`` argument.
    """
    return {
        # The 'None' option is currently disabled:
        # 'None': self.__getFillnaNoneDf,
        'Fill_0': self.__getFillna0Df,
        'Fill_Previous': self.__getFillnaPrevDf,
        'Fill_Next': self.__getFillnaNextDf,
        'Fill_Mean': self.__getFillnaMean,
        'Fill_Median': self.__getFillnaMedian,
        'Fill_Frequent': self.__getFillnaFrequent,
        'Fill_Iterative': self.__getFillnaIterative,
    }


#%%
if __name__ == '__main__':
    # Manual smoke run: load the sample CSV and build a hyperopt search space
    # over the available missing-data handlers.
    rootPath = definitions.getProjectRootPath()
    csv_path = os.path.join(rootPath, 'sample_small.csv')
    df = pd.read_csv(csv_path)

    missing_data = MissingData(df)
    hyperparams_space = {
        # The hyperopt label must identify this parameter: it was previously
        # 'feature_scaler' (copy-paste), which mislabels the result and would
        # clash with a real feature-scaler choice in the same search space.
        # The dict view is materialised because hp.choice expects a list/tuple.
        'missing_data': hp.choice(
            'missing_data',
            list(missing_data.getMissingDataMethodList().values()),
        ),
    }
def setUp(self):
    """Prepare the fixture attributes used by the tests.

    Sets ``project_name``, ``root_path`` (from
    ``definitions.getProjectRootPath()``) and ``csv_path`` (the
    ``sample_small.csv`` file directly under the project root).
    """
    self.project_name = 'UnitTest'

    project_root = definitions.getProjectRootPath()
    self.root_path = project_root

    sample_csv = os.path.join(project_root, 'sample_small.csv')
    self.csv_path = sample_csv