# Select some representative values? Probably a good practice





# -----------------------------------------------------------------------------
# NaN Treatment
# -----------------------------------------------------------------------------

# I think you need to deal with NaN's at this stage
# Important: You should also think of this as being a processor for both training as well as testing data

# This is a very problem-dependent step
from rg_toolbox_ml_nan import nan2avg
data_trn = nan2avg(data_trn)
data_tst = nan2avg(data_trn, data_tst)





# -----------------------------------------------------------------------------
# Data Augmentation
# -----------------------------------------------------------------------------

# This is also a very problem-specific algo
# And this also needs to work as a method both on training as well as on test data
from rg_toolbox_ml import data_augment

# THIS DOESN'T WORK YET ... REVIEW
Beispiel #2
0
# Can you do a model conditional on certain variables?
# Say you decide that one sex is a good determinant. Then you allpy a ML model
# only to the male population

# Select some representative values? Probably a good practice

# -----------------------------------------------------------------------------
# NaN Treatment
# -----------------------------------------------------------------------------

# I think you need to deal with NaN's at this stage
# Important: You should also think of this as being a processor for both training as well as testing data

# This is a very problem-dependent step
from rg_toolbox_ml_nan import nan2avg
data_trn = nan2avg(data_trn)
data_tst = nan2avg(data_trn, data_tst)

# -----------------------------------------------------------------------------
# Data Augmentation
# -----------------------------------------------------------------------------

# This is also a very problem-specific algo
# And this also needs to work as a method both on training as well as on test data
from rg_toolbox_ml import data_augment

# THIS DOESN'T WORK YET ... REVIEW
data_trn_aug = data_augment(data_trn)
data_tst_aug = data_augment(data_tst)

# Feature data types