Esempio n. 1
0
 def _stream_history_log_dirs(self, output_dir=None):
     """Yield single-item lists of directories that may hold the history log.

     Candidate directories come from ``self._hadoop_log_dirs()`` (called
     with *output_dir*) and are passed through ``unique()``. Each candidate
     for which ``_logs_exist()`` is truthy is announced via ``log.info``
     and then yielded wrapped in a one-element list.
     """
     candidates = unique(self._hadoop_log_dirs(output_dir=output_dir))

     for candidate in candidates:
         # skip candidates that _logs_exist() rejects
         if not _logs_exist(self.fs, candidate):
             continue

         log.info('Looking for history log in %s...' % candidate)
         # logs aren't always in a subdir named history/, so the
         # directory itself is yielded rather than a history/ subdir
         yield [candidate]
Esempio n. 2
0
 def _stream_history_log_dirs(self, output_dir=None):
     """Generate lists of directories to search for the history log.

     Every directory returned by ``self._hadoop_log_dirs()`` for
     *output_dir* is run through ``unique()`` and then tested with
     ``_logs_exist()``. Directories that pass are logged at INFO level
     and yielded one at a time, each as a one-element list.
     """
     # lazily filter the candidates; the existence check for a directory
     # still happens right before that directory is logged and yielded
     existing_dirs = (
         hadoop_dir
         for hadoop_dir in unique(
             self._hadoop_log_dirs(output_dir=output_dir))
         if _logs_exist(self.fs, hadoop_dir)
     )

     for hadoop_dir in existing_dirs:
         log.info('Looking for history log in %s...' % hadoop_dir)
         # logs aren't always in a subdir named history/
         yield [hadoop_dir]
Esempio n. 3
0
    def _stream_task_log_dirs(self, application_id=None, output_dir=None):
        """Yield single-item lists of directories that may hold task logs.

        For each directory from ``self._hadoop_log_dirs()`` (called with
        *output_dir*, passed through ``unique()``), the candidate path is
        ``<log_dir>/userlogs``, or ``<log_dir>/userlogs/<application_id>``
        when *application_id* is truthy. Candidates for which
        ``_logs_exist()`` is truthy are logged and yielded, each wrapped
        in a one-element list.
        """
        # Note: this is unlikely to be super-helpful on "real" (multi-node)
        # pre-YARN Hadoop because task logs aren't generally shipped to a
        # local directory. It's a start, anyways. See #1201.

        # the path components below the log dir don't change per-directory
        subdirs = ['userlogs']
        if application_id:
            subdirs.append(application_id)

        for base_dir in unique(self._hadoop_log_dirs(output_dir=output_dir)):
            task_log_path = self.fs.join(base_dir, *subdirs)

            if not _logs_exist(self.fs, task_log_path):
                continue

            log.info('Looking for task syslogs in %s...' % task_log_path)
            yield [task_log_path]
Esempio n. 4
0
    def _stream_task_log_dirs(self, application_id=None, output_dir=None):
        """Generate lists of directories to search for task logs.

        Each directory produced by ``self._hadoop_log_dirs()`` for
        *output_dir* (after ``unique()``) is extended with ``userlogs``
        and, if *application_id* is truthy, with *application_id* as a
        further path component. Paths accepted by ``_logs_exist()`` are
        logged at INFO level and yielded as one-element lists.
        """
        # Note: this is unlikely to be super-helpful on "real" (multi-node)
        # pre-YARN Hadoop because task logs aren't generally shipped to a
        # local directory. It's a start, anyways. See #1201.
        hadoop_dirs = unique(self._hadoop_log_dirs(output_dir=output_dir))

        for hadoop_dir in hadoop_dirs:
            # narrow to the application's subdirectory when an ID is given
            userlogs_path = (
                self.fs.join(hadoop_dir, 'userlogs', application_id)
                if application_id
                else self.fs.join(hadoop_dir, 'userlogs')
            )

            if not _logs_exist(self.fs, userlogs_path):
                continue

            log.info('Looking for task syslogs in %s...' % userlogs_path)
            yield [userlogs_path]