def test_join(self):
    """Check ``SeriesSet.join`` on two sheets built from the same fixture.

    The right-hand sheet gets one extra column (``'K_col'``) before the
    join. The joined result is expected to have shape (3, 9), with the
    right-hand duplicates of ``A``..``D`` showing up under a ``_1`` suffix.
    """
    left = SeriesSet(TABLE_DATA, TABLE_COL, nan=None)
    right = SeriesSet(TABLE_DATA, TABLE_COL, nan=None)
    right.append_col(['K', 'K'], 'K_col')

    joined = left.join(right)

    expected_shape = (3, 9)
    expected_missing = [0, 0, 1, 0, 0, 0, 1, 0, 1]
    expected_columns = [
        'A', 'B', 'C', 'D',
        'A_1', 'B_1', 'C_1', 'D_1',
        'K_col',
    ]

    self.assertEqual(tuple(joined.shape), expected_shape)
    self.assertEqual(joined.missing, expected_missing)
    self.assertEqual(joined.columns, expected_columns)
def fit(self, X, Y):
    """Fit the model on features ``X`` and targets ``Y``.

    ``X`` is wrapped in a ``SeriesSet`` and ``Y`` is appended to it as a
    column named ``'__target__'``. The feature names and the set of
    ``'Class=<value>'`` labels are stored on the instance, and the tree
    built by ``self._create_tree`` is stored as ``self._root``.

    Returns:
        ``self``, so calls can be chained.
    """
    X = SeriesSet(X)
    names = X.columns

    # Combine X and Y into a single dataset.
    # NOTE(review): ``names`` is read before the target column is appended
    # but copied afterwards; if ``X.columns`` hands back a live list the
    # stored copy would also contain '__target__' -- confirm.
    X.append_col(Y, '__target__')
    self._feature_name = copy(names)

    labels = set()
    for value in Y:
        labels.add('Class=%s' % value)
    self._class_name = labels

    self._root = self._create_tree(X, Y, names)
    return self