def test_readback(self):
    """Round-trip a small byte payload through HDFS write and read pipes.

    Writes via ``hdfs.HdfsAtomicWriteDirPipe`` targeting ``self.path``,
    checks that the path is absent before the pipe is closed and present
    afterwards, then reads ``<self.path>/data`` back through
    ``hdfs.HdfsReadPipe`` and compares it with what was written.
    """
    writer = hdfs.HdfsAtomicWriteDirPipe(self.path)
    # The target must not exist yet while the writer is still open.
    self.assertFalse(self.fs.exists(self.path))
    writer.write(b"foo\nbar")
    writer.close()
    # After write + close the target path is expected to exist.
    self.assertTrue(hdfs.exists(self.path))

    listing = hdfs.listdir(self.path)
    datapath = '%s/data' % self.path
    # Materialize the listing so its first entry can be indexed.
    entries = list(listing)
    first_entry = entries[0]
    self.assertTrue(first_entry.endswith(datapath))

    reader = hdfs.HdfsReadPipe(datapath)
    self.assertEqual(reader.read(), b"foo\nbar")
def check_mr_success(hdfs_dir):
    """Return whether ``<hdfs_dir>/_SUCCESS`` exists.

    The check is delegated to the ``exists`` method of the client returned
    by ``luigi.contrib.hdfs.hadoopcli_clients.create_hadoopcli_client()``.

    :param hdfs_dir: directory whose ``_SUCCESS`` marker is looked up.
    :return: whatever the client's ``exists`` call returns for the marker.
    """
    cli_client = luigi.contrib.hdfs.hadoopcli_clients.create_hadoopcli_client()
    success_marker = '%s/_SUCCESS' % hdfs_dir
    return cli_client.exists(success_marker)
def check_mr_success(hdfs_dir):
    """Report whether the ``_SUCCESS`` marker is present under ``hdfs_dir``.

    :param hdfs_dir: directory to probe for a ``_SUCCESS`` entry.
    :return: the result of the hadoop CLI client's ``exists`` call.
    """
    # create_hadoopcli_client: per the original note, a hadoop CLI client is
    # wanted here (as opposed to snakebite) and this factory is expected to
    # hand back the appropriate one.
    factory = luigi.contrib.hdfs.hadoopcli_clients.create_hadoopcli_client
    cli_client = factory()
    # Original note: existence is checked with `hadoop fs -stat`
    # (not visible from this function -- confirm against the client).
    marker_path = '%s/_SUCCESS' % hdfs_dir
    return cli_client.exists(marker_path)