def getTestData(path="../Input/train2.csv"):
    """Load per-user event records from a CSV and build their feature rows.

    The CSV is read with pandas and must provide the columns ``user``,
    ``event`` and ``invited``. Rows are grouped by ``user``; for every user
    ``FeatureSet.process(uid, {eid: invited, ...})`` is called once, and its
    result is indexed by event id to produce one feature entry per event.

    Args:
        path: Location of the CSV file. Defaults to the path this function
            has always read, so existing zero-argument callers are unaffected.

    Returns:
        A dict keyed by user id. Each value is a dict with:
            'X': list of ``features_dict[eid]`` entries, in the same order
                as 'events'.
            'events': list of ``{'eid': ..., 'invited': ...}`` dicts for that
                user, in file order.

    Raises:
        KeyError: If a required column is missing, or if the mapping returned
            by ``FeatureSet.process`` lacks one of the user's event ids.
    """
    test = pd.read_csv(path)

    # Group rows by user, keeping events in the order they appear in the file.
    # iterrows() yields (index, row) pairs; only the row is needed.
    testDict = {}
    for _, record in test.iterrows():
        testDict.setdefault(record['user'], []).append({
            'eid': record['event'],
            'invited': record['invited'],
        })

    testData = {}
    # .items() instead of .iteritems(): the latter does not exist on Python 3,
    # while .items() behaves the same here on both Python 2 and Python 3.
    for uid, events in testDict.items():
        # If an event id repeats for a user, the last 'invited' value wins
        # in this lookup (same as the original dict comprehension).
        eDict = {e['eid']: e['invited'] for e in events}
        features_dict = FeatureSet.process(uid, eDict)
        testData[uid] = {
            'X': [features_dict[e['eid']] for e in events],
            'events': events,
        }
    return testData