def HandleMissingVal(Input, group_size=6):
    """Fill missing lab/vital values in place, one fixed-size row window at a time.

    Rows are grouped by ``Input.index // group_size``. Inside each group every
    handled column is back-filled first and then forward-filled, so a gap
    takes the next known value of its own group and only falls back to the
    previous one when nothing follows. Values never cross a group boundary;
    a column that is entirely missing inside a group stays missing.

    Args:
        Input: DataFrame holding the handled columns listed below. The index
            must support integer floor division (e.g. the default
            RangeIndex). The frame is modified in place.
        group_size: Number of consecutive index values forming one group.
            Defaults to 6, the window length used by the original code.

    Returns:
        None. ``Input`` is mutated in place.

    Raises:
        ValueError: If ``group_size`` is smaller than 1.
        KeyError: If one of the handled columns is absent from ``Input``.
    """
    if group_size < 1:
        raise ValueError("group_size must be a positive integer")

    handled_columns = [
        'creatinine', 'pH', 'Hct', 'BUN', 'Na', 'K', 'TP',
        'systolicBP', 'meanBP', 'MSI', 'eGFR',
    ]

    # Build the grouping key once instead of twice per column.
    group_key = Input.index // group_size

    # Back-fill first, then forward-fill what is still missing (trailing gaps).
    back_filled = Input.groupby(group_key)[handled_columns].bfill()
    Input[handled_columns] = back_filled.groupby(group_key).ffill()
def _rows_at_position(frame, group_key, position_in_group, position):
    """Return the rows at `position` within their group, labelled by group key."""
    mask = position_in_group == position
    return frame.loc[mask].set_axis(group_key[mask], axis=0)


def ConvertFormat(Input, group_size=6):
    """Pivot fixed-size row windows into one wide feature row per window.

    Rows are grouped by ``Input.index // group_size``. For every group the
    output holds the static columns ``age``, ``weight`` and ``gender`` (taken
    from the group's first row) followed by ``<name>_seq_<i>`` columns, where
    ``i`` is the row's position inside the group (0 .. group_size - 1).
    Positions a group does not have (e.g. a short trailing group) are NaN.

    The implementation deliberately avoids ``GroupBy.nth``: since pandas 2.0
    ``nth`` acts as a filter that keeps the original row labels, so the
    per-position results no longer align with each other and every
    ``*_seq_1`` .. ``*_seq_5`` column would silently become NaN.

    Args:
        Input: Long-format DataFrame containing the static and sequence
            columns listed below. The index must support integer floor
            division (e.g. the default RangeIndex).
        group_size: Number of consecutive index values forming one group.
            Defaults to 6, the window length used by the original code.

    Returns:
        A new DataFrame indexed by group key (``index // group_size``, sorted
        ascending) with columns ``age, weight, gender`` followed by the
        ``*_seq_*`` columns, grouped feature by feature.

    Raises:
        ValueError: If ``group_size`` is smaller than 1.
        KeyError: If a required column is absent from ``Input``.
    """
    if group_size < 1:
        raise ValueError("group_size must be a positive integer")

    # NOTE: the `day` column is intentionally not carried over; the original
    # code had it commented out.
    static_columns = ('age', 'weight', 'gender')

    # (source column, prefix of the output column). 'BUN' is emitted as
    # 'Bun_seq_<i>': the historical spelling is kept so that existing
    # consumers of these column names keep working.
    sequence_columns = (
        ('creatinine', 'creatinine'),
        ('intake', 'intake'),
        ('urine', 'urine'),
        ('pH', 'pH'),
        ('Hct', 'Hct'),
        ('BUN', 'Bun'),
        ('Na', 'Na'),
        ('K', 'K'),
        ('TP', 'TP'),
        ('systolicBP', 'systolicBP'),
        ('meanBP', 'meanBP'),
        ('MSI', 'MSI'),
        ('eGFR', 'eGFR'),
    )

    group_key = Input.index // group_size
    # 0-based position of every row inside its own group.
    position_in_group = Input.groupby(group_key).cumcount().to_numpy()

    # One frame per position, each holding at most one row per group.
    rows_by_position = [
        _rows_at_position(Input, group_key, position_in_group, position)
        for position in range(group_size)
    ]

    # Every non-empty group has a row at position 0, so that frame lists all
    # groups; sort to get a deterministic, key-ordered output.
    group_index = rows_by_position[0].index.sort_values()

    wide = {
        name: rows_by_position[0][name].reindex(group_index)
        for name in static_columns
    }
    for source, prefix in sequence_columns:
        for position, rows in enumerate(rows_by_position):
            column = '{}_seq_{}'.format(prefix, position)
            # reindex pads groups lacking this position with NaN.
            wide[column] = rows[source].reindex(group_index)

    return pd.DataFrame(wide, index=group_index)