from util import query_to_df from util import campaign_to_num, event_to_num, transform_column, hist_and_show, vectorize db = create_engine('sqlite:///forjar.db') metadata = MetaData(db) Session = sessionmaker(bind=db) session = Session() """ Counts the users by campaign id """ user_dist = session.query(Users) user_df = query_to_df(session, user_dist) transform_column(user_df, 'Users_Campaign_ID', campaign_to_num.get) hist_and_show(user_df, 'Users_Campaign_ID') q = session.query(Users.Campaign_ID, Event.Type, Users.id, Event.User_Id).filter(Event.Type == 'bought') d = query_to_df(session, q) print d.columns transform_column(d, 'Users_Campaign_ID', campaign_to_num.get) """ Show the counts for the event types """ transform_column(d, 'Event_Type', event_to_num.get) hist_and_show(d, 'Users_Campaign_ID')
meal_to_num = { 'japanese': 1, 'chinese': 2, 'french': 3, 'german': 4, 'italian': 5, 'mexican': 6, 'vietnamese': 7 } """ Counts the users by campaign id """ user_dist = session.query(Users) user_df = query_to_df(session, user_dist) transform_column(user_df, 'Users_Campaign_ID', campaign_to_num.get) q = session.query(Users.Campaign_ID, Event.Type, Users.id) d = query_to_df(session, q) column_transforms = { 'Users_Campaign_ID': campaign_to_num.get, 'Event_Type': event_to_num.get } sub_plot_size = len(d.columns) * len(d.columns) """ Subplot call here """ for column in d.columns: if column_transforms.has_key(column):
from util import query_to_df from util import campaign_to_num,event_to_num,transform_column,hist_and_show,vectorize db = create_engine('sqlite:///forjar.db') metadata = MetaData(db) Session = sessionmaker(bind=db) session = Session() """ Counts the users by campaign id """ user_dist = session.query(Users) user_df = query_to_df(session,user_dist) transform_column(user_df,'Users_Campaign_ID',campaign_to_num.get) q = session.query(Users.Campaign_ID,Event.Type,Users.id,Event.User_Id) d = query_to_df(session,q) print d #print d.sort('Users_id') grouped = d.groupby(['Users_Campaign_ID','Event_Type']) print grouped.agg({'Event_Type' : np.count_nonzero}).sort('Event_Type')
import matplotlib.pyplot as plt from sqlalchemy import * import numpy as np from sqlalchemy.orm import sessionmaker from churndata import * from pandas import DataFrame from util import query_to_df from util import campaign_to_num, event_to_num, transform_column, hist_and_show, vectorize db = create_engine('sqlite:///forjar.db') metadata = MetaData(db) Session = sessionmaker(bind=db) session = Session() """ Counts the users by campaign id """ user_dist = session.query(Users) user_df = query_to_df(session, user_dist) transform_column(user_df, 'Users_Campaign_ID', campaign_to_num.get) q = session.query(Users.Campaign_ID, Event.Type, Users.id, Event.User_Id).filter(Event.Type == 'bought') d = query_to_df(session, q) #print d.sort('Users_id') grouped = d.groupby('Users_id') print grouped.agg({'Event_Type': np.count_nonzero}).sort('Event_Type')
metadata = MetaData(db) Session = sessionmaker(bind=db) session = Session() """ Counts the users by campaign id """ user_dist = session.query(Users) user_df = query_to_df(session,user_dist) transform_column(user_df,'Users_Campaign_ID',campaign_to_num.get) hist_and_show(user_df,'Users_Campaign_ID') q = session.query(Users.Campaign_ID,Event.Type,Users.id,Event.User_Id).filter(Event.Type == 'bought') d = query_to_df(session,q) print d.columns transform_column(d,'Users_Campaign_ID',campaign_to_num.get) """ Show the counts for the event types """ transform_column(d,'Event_Type',event_to_num.get) hist_and_show(d,'Users_Campaign_ID')
'japanese': 1, 'chinese' : 2, 'french' : 3, 'german' : 4, 'italian' : 5, 'mexican' : 6, 'vietnamese' : 7 } """ Counts the users by campaign id """ user_dist = session.query(Users) user_df = query_to_df(session,user_dist) transform_column(user_df,'Users_Campaign_ID',campaign_to_num.get) q = session.query(Users.Campaign_ID,Event.Type,Users.id) d = query_to_df(session,q) column_transforms = { 'Users_Campaign_ID' : campaign_to_num.get, 'Event_Type' : event_to_num.get } sub_plot_size = len(d.columns) * len(d.columns) """ Subplot call here