def test_seriesAggregateByIndex(self): dataLocal = [((1,), arange(12))] index = [0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 2, 2] data = Series(self.sc.parallelize(dataLocal), index=index) result = data.seriesAggregateByIndex(sum) print result.values().first() assert_true(array_equal(result.values().first(), array([6, 22, 38]))) assert_true(array_equal(result.index, array([0, 1, 2]))) index = [ [0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1], [0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1], [0, 1, 0, 1, 2, 3, 0, 1, 0, 1, 2, 3] ] data.index = array(index).T result = data.seriesAggregateByIndex(sum, level=[0, 1]) assert_true(array_equal(result.values().first(), array([1, 14, 13, 38]))) assert_true(array_equal(result.index, array([[0, 0], [0, 1], [1, 0], [1, 1]])))