from ballet import Feature from ballet.eng import ConditionalTransformer from ballet.eng.sklearn import SimpleImputer input = ["JWTR", "JWRIP", "JWMNP"] # TODO - str or list of str def calculate_travel_budget(df): if (df["JWTR"] == 1.0).all(): return df["JWMNP"] * df["JWRIP"] return df["JWMNP"] * df["JWTR"] transformer = [ calculate_travel_budget, SimpleImputer(strategy="mean"), ] # TODO - function, transformer-like, or list thereof name = "work_travel_combined" # TODO - str description = "Combine data for time to travel to work with vehicle. Lower value, the most likely they have higher income" # TODO - str feature = Feature(input, transformer, name=name, description=description)
from ballet import Feature from ballet.eng.sklearn import SimpleImputer import numpy as np input = "RESMODE" transformer = SimpleImputer(missing_values=np.nan, strategy="constant", fill_value=0) name = "Imputed Response Mode" description = "Missing response modes values filled in with 0" feature = Feature(input, transformer, name=name, description=description)
from ballet import Feature from ballet.eng.sklearn import SimpleImputer input = "Lot Frontage" transformer = SimpleImputer(strategy="mean") feature = Feature(input, transformer)
from ballet import Feature from ballet.eng.sklearn import SimpleImputer input = ["Year Built"] transformer = SimpleImputer( strategy="mean") # TODO - function, transformer-like, or list thereof name = "Imputed Year Built" # TODO - str feature = Feature(input=input, transformer=transformer, name=name)
from ballet import Feature from ballet.eng.sklearn import SimpleImputer import numpy as np input = "JWAP" # Time of arrival at work transformer = [ SimpleImputer(missing_values=np.nan, strategy="constant", fill_value=0.0), lambda df: np.where((df >= 70) & (df <= 124), 1, 0), ] name = "If job has a morning start time" description = "Return 1 if the Work arrival time >=6:30AM and <=10:30AM" feature = Feature(input, transformer, name=name, description=description)
from ballet import Feature from ballet.eng.sklearn import SimpleImputer input = "ESP" # TODO - str or list of str transformer = SimpleImputer( strategy="most_frequent" ) # TODO - function, transformer-like, or list thereof name = "Imputed ESP" # TODO - str description = "Mode imputed employment status of parents" # TODO - str feature = Feature(input, transformer, name=name, description=description)