def test_construct_str_xframe(self):
    # Construct an XFrame from the path of a previously saved xframe,
    # naming the format explicitly.
    location = '{}/user/xpatterns/files/test-frame'.format(hdfs_prefix)
    # Sort by id so the row checks below do not depend on load order.
    frame = XFrame(location, format='xframe').sort('id')
    self.assertEqualLen(3, frame)
    self.assertListEqual(['id', 'val'], frame.column_names())
    self.assertListEqual([int, str], frame.column_types())
    expected_rows = [
        {'id': 1, 'val': 'a'},
        {'id': 2, 'val': 'b'},
        {'id': 3, 'val': 'c'},
    ]
    for index, expected in enumerate(expected_rows):
        self.assertDictEqual(expected, frame[index])
def test_construct_auto_str_xframe(self):
    # Construct an XFrame from a path whose file extension is not
    # recognized, without passing an explicit format.
    expected_names = ['id', 'val']
    expected_types = [int, str]
    expected_rows = (
        {'id': 1, 'val': 'a'},
        {'id': 2, 'val': 'b'},
        {'id': 3, 'val': 'c'},
    )
    source = '{}/user/xpatterns/files/test-frame'.format(hdfs_prefix)
    loaded = XFrame(source)
    # Order rows by id before comparing them one by one.
    ordered = loaded.sort('id')
    self.assertEqualLen(3, ordered)
    self.assertListEqual(expected_names, ordered.column_names())
    self.assertListEqual(expected_types, ordered.column_types())
    self.assertDictEqual(expected_rows[0], ordered[0])
    self.assertDictEqual(expected_rows[1], ordered[1])
    self.assertDictEqual(expected_rows[2], ordered[2])
def test_read_parquet_str(self):
    # Round trip: save a small XFrame in parquet format, then construct a
    # new XFrame from the '.parquet' path string and check its contents.
    t = XFrame({'id': [1, 2, 3], 'val': ['a', 'b', 'c']})
    path = '{}/tmp/frame-parquet'.format(hdfs_prefix)
    t.save(path, format='parquet')
    try:
        res = XFrame('{}/tmp/frame-parquet.parquet'.format(hdfs_prefix))
        # results may not come back in the same order
        res = res.sort('id')
        self.assertEqualLen(3, res)
        self.assertListEqual(['id', 'val'], res.column_names())
        self.assertListEqual([int, str], res.column_types())
        self.assertDictEqual({'id': 1, 'val': 'a'}, res[0])
        self.assertDictEqual({'id': 2, 'val': 'b'}, res[1])
        self.assertDictEqual({'id': 3, 'val': 'c'}, res[2])
    finally:
        # Always remove the saved data, even when the read or an assertion
        # above fails, so a failing run does not leave files behind.
        # NOTE(review): the frame is read back from path + '.parquet' but
        # the path without that suffix is deleted -- confirm that this
        # call actually removes what save() wrote.
        fileio.delete(path)