示例#1
0
  def test_dict_options_missing(self):
    """Check that each absent HDFS option is reported by name.

    HadoopFileSystem is constructed three times from a dict of pipeline
    options, each time leaving out one of ``hdfs_host``, ``hdfs_port`` and
    ``hdfs_user``. Every attempt must raise a ValueError whose message matches
    the omitted key.
    """
    self._fake_hdfs = FakeHdfs()
    # Remember whatever client factory is currently installed and put it back
    # once the test finishes, so the patch below does not leak into other
    # tests that share the module.
    previous_client = hdfs.hdfs.InsecureClient
    self.addCleanup(setattr, hdfs.hdfs, 'InsecureClient', previous_client)
    hdfs.hdfs.InsecureClient = (
        lambda *args, **kwargs: self._fake_hdfs)

    # assertRaisesRegex is used instead of the assertRaisesRegexp alias, which
    # was deprecated in Python 3.2 and removed in Python 3.12.
    with self.assertRaisesRegex(ValueError, r'hdfs_host'):
      self.fs = hdfs.HadoopFileSystem(
          pipeline_options={
              'hdfs_port': 0,
              'hdfs_user': '',
          }
      )

    with self.assertRaisesRegex(ValueError, r'hdfs_port'):
      self.fs = hdfs.HadoopFileSystem(
          pipeline_options={
              'hdfs_host': '',
              'hdfs_user': '',
          }
      )

    with self.assertRaisesRegex(ValueError, r'hdfs_user'):
      self.fs = hdfs.HadoopFileSystem(
          pipeline_options={
              'hdfs_host': '',
              'hdfs_port': 0,
          }
      )
    def test_dict_options_full_urls(self):
        """Exercise the ``hdfs_full_urls`` entry of dict-style options.

        With the value ``'invalid'`` the constructor must raise a ValueError
        whose message matches the option name. With the value ``True`` the
        constructor must succeed and expose a truthy ``_full_urls``.
        """
        options = dict(
            hdfs_host='',
            hdfs_port=0,
            hdfs_user='',
            hdfs_full_urls='invalid',
        )

        expect_rejection = self.assertRaisesRegex(
            ValueError, r'hdfs_full_urls')
        with expect_rejection:
            self.fs = hdfs.HadoopFileSystem(pipeline_options=options)

        # Reuse the same dict, flipping only the option under test.
        options.update(hdfs_full_urls=True)
        self.fs = hdfs.HadoopFileSystem(pipeline_options=options)
        self.assertTrue(self.fs._full_urls)
    def test_dict_options_missing(self):
        """Check that leaving out any one HDFS option raises ValueError.

        For each of ``hdfs_host``, ``hdfs_port`` and ``hdfs_user`` (in that
        order) the filesystem is built from the other two options only, and
        the resulting ValueError message must match the omitted key.
        """
        all_options = {'hdfs_host': '', 'hdfs_port': 0, 'hdfs_user': ''}

        for omitted in ('hdfs_host', 'hdfs_port', 'hdfs_user'):
            remaining = {
                key: value
                for key, value in all_options.items()
                if key != omitted
            }
            with self.assertRaisesRegex(ValueError, omitted):
                self.fs = hdfs.HadoopFileSystem(pipeline_options=remaining)
    def test_dict_options(self):
        """Build the filesystem from a plain dict of pipeline options.

        Only host, port and user are supplied; the resulting filesystem must
        report a falsy ``_full_urls``.
        """
        options = dict(hdfs_host='', hdfs_port=0, hdfs_user='')
        self.fs = hdfs.HadoopFileSystem(pipeline_options=options)

        self.assertFalse(self.fs._full_urls)
示例#5
0
    def setUp(self):
        """Create a HadoopFileSystem backed by a FakeHdfs and seed two files.

        ``hadoopfilesystem.HDFileSystem`` is replaced by a factory that always
        returns the shared fake, and the previous value is restored by a
        registered cleanup so the patch does not outlive the test. Two empty
        files, ``old_file1`` and ``old_file2``, are then created under
        ``self.tmpdir``.
        """
        self._fake_hdfs = FakeHdfs()

        # Undo the module-level patch after the test (also runs if setUp
        # itself fails further down).
        previous_factory = hadoopfilesystem.HDFileSystem
        self.addCleanup(
            setattr, hadoopfilesystem, 'HDFileSystem', previous_factory)
        hadoopfilesystem.HDFileSystem = lambda *args, **kwargs: self._fake_hdfs

        self.fs = hadoopfilesystem.HadoopFileSystem()
        self.tmpdir = 'hdfs://test_dir'

        for filename in ['old_file1', 'old_file2']:
            url = self.fs.join(self.tmpdir, filename)
            # Create and immediately close: only the file's existence matters.
            self.fs.create(url).close()
示例#6
0
    def test_dict_options(self):
        """Construct HadoopFileSystem from a plain dict of pipeline options.

        The test passes if construction with host, port and user supplied as
        dict entries completes without raising.
        """
        self._fake_hdfs = FakeHdfs()

        # Restore the previously installed client factory when the test ends
        # so the patch below does not leak into other tests.
        previous_client = hdfs.hdfs.InsecureClient
        self.addCleanup(setattr, hdfs.hdfs, 'InsecureClient', previous_client)
        hdfs.hdfs.InsecureClient = (lambda *args, **kwargs: self._fake_hdfs)

        pipeline_options = {
            'hdfs_host': '',
            'hdfs_port': 0,
            'hdfs_user': '',
        }

        self.fs = hdfs.HadoopFileSystem(pipeline_options=pipeline_options)
示例#7
0
    def setUp(self):
        """Create a HadoopFileSystem backed by a FakeHdfs and seed two files.

        ``hdfs.hdfs.InsecureClient`` is replaced by a factory that always
        returns the shared fake; a registered cleanup restores the previous
        value so the patch does not outlive the test. The filesystem is
        configured through a ``HadoopFileSystemOptions`` view of a fresh
        ``PipelineOptions``, and two empty files, ``old_file1`` and
        ``old_file2``, are created under ``self.tmpdir``.
        """
        self._fake_hdfs = FakeHdfs()

        # Undo the module-level patch after the test (also runs if setUp
        # itself fails further down).
        previous_client = hdfs.hdfs.InsecureClient
        self.addCleanup(setattr, hdfs.hdfs, 'InsecureClient', previous_client)
        hdfs.hdfs.InsecureClient = (lambda *args, **kwargs: self._fake_hdfs)

        pipeline_options = PipelineOptions()
        hdfs_options = pipeline_options.view_as(HadoopFileSystemOptions)
        hdfs_options.hdfs_host = ''
        hdfs_options.hdfs_port = 0
        hdfs_options.hdfs_user = ''

        self.fs = hdfs.HadoopFileSystem(pipeline_options)
        self.tmpdir = 'hdfs://test_dir'

        for filename in ['old_file1', 'old_file2']:
            url = self.fs.join(self.tmpdir, filename)
            # Create and immediately close: only the file's existence matters.
            self.fs.create(url).close()