v_stack = pd.concat([kyc, age, cp_percent, tu_percent, trans_time_count, num_countries, trans_repeats, range_amount, std_amount, trans_min, country_count, outlier_amount, failed_signin], axis=1) v_stack = self.encode(v_stack) v_stack = v_stack.fillna(0) return v_stack if __name__ == "__main__": engine = create_engine(conn_str, echo=False) session = sessionmaker() session.configure(bind=engine) from features import Features features = Features(session) user_df = features.get_users() trans_df = features.get_transactions() print('Creating Features...') #Create features and store them feature_df = features.create() labels = user_df['is_fraudster'] * 1 labels = labels[feature_df.index] print('Saving Features...') all_data = pd.concat([feature_df, labels], axis=1) pickle.dump(all_data, open('features.pck','wb') ) print('Done.')