예제 #1
0
  def __getFillnaMedian(self, _df):
    """Delegate to ``__getFillMissingData`` with the ``'median'`` strategy.

    ``_df`` is forwarded untouched and the helper's return value is handed
    back as-is. The helper is defined outside this view; presumably it
    imputes missing values using the named strategy -- confirm there.
    """
    strategy = 'median'
    filled = self.__getFillMissingData(_df, strategy)
    return filled
  
  def __getFillnaFrequent(self, _df):
    """Delegate to ``__getFillMissingData`` with the ``'most_frequent'`` strategy.

    ``_df`` is forwarded untouched and the helper's return value is handed
    back as-is. The helper is defined outside this view; presumably it
    imputes missing values using the named strategy -- confirm there.
    """
    strategy = 'most_frequent'
    filled = self.__getFillMissingData(_df, strategy)
    return filled
  
  def __getFillnaIterative(self, _df):
    """Delegate to ``__fillIterativeImputer`` and return its result.

    ``_df`` is passed through unchanged. The helper is defined outside this
    view; judging by its name it applies an iterative imputer -- confirm
    there.
    """
    impute = self.__fillIterativeImputer
    return impute(_df)

  def getMissingDataMethodList(self):
    """Return a dict mapping strategy labels to this instance's fill methods.

    Despite the ``List`` in the name, the result is a ``dict``: keys are the
    string labels below and values are the corresponding bound methods. A
    new dict is built on every call, in the insertion order shown.
    """
    methods = {}
    # A 'None' entry (self.__getFillnaNoneDf) is currently disabled and is
    # therefore not registered here.
    methods['Fill_0'] = self.__getFillna0Df
    methods['Fill_Previous'] = self.__getFillnaPrevDf
    methods['Fill_Next'] = self.__getFillnaNextDf
    methods['Fill_Mean'] = self.__getFillnaMean
    methods['Fill_Median'] = self.__getFillnaMedian
    methods['Fill_Frequent'] = self.__getFillnaFrequent
    methods['Fill_Iterative'] = self.__getFillnaIterative
    return methods

#%%
if __name__ == '__main__':
  # Script entry point: read 'sample_small.csv' from the project root, wrap
  # the frame in MissingData, and build a search space whose single
  # dimension chooses among the fill methods it exposes.
  rootPath = definitions.getProjectRootPath()
  csv_path = os.path.join(rootPath, 'sample_small.csv')
  df = pd.read_csv(csv_path)
  missing_data = MissingData(df)

  # hp.choice documents its options as a list or tuple, so materialise the
  # dict view into a list rather than passing the view object directly.
  fill_methods = list(missing_data.getMissingDataMethodList().values())

  # NOTE(review): the label 'feature_scaler' does not match the
  # 'missing_data' key and looks like a copy-paste leftover. It is kept
  # unchanged because the label names this dimension in trial results;
  # confirm before renaming.
  hyperparams_space = {
    'missing_data': hp.choice('feature_scaler', fill_methods)
  }
예제 #2
0
 def setUp(self):
   """Prepare per-test fixture attributes.

   Stores the project name 'UnitTest', the project root path obtained from
   ``definitions.getProjectRootPath()``, and the path to 'sample_small.csv'
   under that root on the instance.

   NOTE(review): this method sits at the end of the visible excerpt and may
   continue beyond it -- confirm against the full file.
   """
   self.project_name = 'UnitTest'
   self.root_path = definitions.getProjectRootPath()
   # The sample CSV is expected directly under the project root.
   self.csv_path = os.path.join(self.root_path, 'sample_small.csv')