def test_sub_to_ind_rdd(self):
    """Check that subToInd() maps 3-tuple subscript keys to the indices 1..12.

    The twelve subscript keys are listed with the first coordinate varying
    fastest, then the second, then the third; the test expects the
    collected keys after subToInd() to equal 1, 2, ..., 12 in that order.
    """
    subscripts = [
        (1, 1, 1), (2, 1, 1),
        (1, 2, 1), (2, 2, 1),
        (1, 3, 1), (2, 3, 1),
        (1, 1, 2), (2, 1, 2),
        (1, 2, 2), (2, 2, 2),
        (1, 3, 2), (2, 3, 2),
    ]
    # Every record carries the same dummy one-element value; only keys matter.
    records = [(sub, array([1.0])) for sub in subscripts]
    series = Series(self.sc.parallelize(records))

    linear_keys = series.subToInd().keys().collect()
    inds = array(linear_keys)

    expected = array(range(1, 13))
    assert allclose(inds, expected)
def test_round_trip_rdd(self):
    """Check that subToInd() followed by indToSub() restores the original keys.

    The keys collected before the conversion are compared against the keys
    collected after converting to linear indices and back to subscripts.
    """
    subscripts = [
        (1, 1, 1), (2, 1, 1),
        (1, 2, 1), (2, 2, 1),
        (1, 3, 1), (2, 3, 1),
        (1, 1, 2), (2, 1, 2),
        (1, 2, 2), (2, 2, 2),
        (1, 3, 2), (2, 3, 2),
    ]
    # Every record carries the same dummy one-element value; only keys matter.
    records = [(sub, array([1.0])) for sub in subscripts]
    series = Series(self.sc.parallelize(records))

    keys_before = series.keys().collect()
    round_tripped = series.subToInd().indToSub()
    keys_after = round_tripped.keys().collect()

    assert allclose(array(keys_before), array(keys_after))