示例#1
0
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Copies every named output from run_dir into out_dir for later upload.

  Arguments:
  - run_dir: directory the outputs are read from.
  - out_dir: directory the outputs are written to.
  - outputs: iterable of paths relative to run_dir; nothing is done when it
    is empty or None.

  No exception is caught here; whatever isolateserver.create_directories() or
  copy_recursively() raises propagates to the caller.
  NOTE(review): whether a pre-existing destination raises depends on
  copy_recursively(), which is not visible from here -- confirm.
  """
  if outputs:
    # Make sure the destination directories exist before copying into them.
    isolateserver.create_directories(out_dir, outputs)
    for rel_path in outputs:
      src = os.path.join(run_dir, rel_path)
      dst = os.path.join(out_dir, rel_path)
      copy_recursively(src, dst)
示例#2
0
def link_outputs_to_outdir(run_dir, out_dir, outputs):
    """Links every named output from run_dir into out_dir for later upload.

    Arguments:
    - run_dir: directory the outputs are read from.
    - out_dir: directory the links are created in.
    - outputs: iterable of paths relative to run_dir; nothing is done when it
      is empty or None.

    Linking is best effort: an OSError for one output is logged at info level
    and the remaining outputs are still processed. Errors raised by
    isolateserver.create_directories() are not caught.
    """
    if outputs:
        # Make sure the destination directories exist before linking.
        isolateserver.create_directories(out_dir, outputs)
        for rel_path in outputs:
            try:
                dst = os.path.join(out_dir, rel_path)
                src = os.path.join(run_dir, rel_path)
                file_path.link_file(
                    dst, src, file_path.HARDLINK_WITH_FALLBACK)
            except OSError as err:
                logging.info(
                    "Couldn't collect output file %s: %s", rel_path, err)
示例#3
0
def link_outputs_to_outdir(run_dir, out_dir, outputs):
    """Links every named output from run_dir into out_dir for later upload.

    Arguments:
    - run_dir: directory the outputs are read from.
    - out_dir: directory the links are created in.
    - outputs: iterable of paths relative to run_dir; nothing is done when it
      is empty or None.

    Linking is best effort: an OSError for one output is reported on stderr
    and the remaining outputs are still processed. Errors raised by
    isolateserver.create_directories() are not caught.
    """
    if outputs:
        # Make sure the destination directories exist before linking.
        isolateserver.create_directories(out_dir, outputs)
        for rel_path in outputs:
            try:
                dst = os.path.join(out_dir, rel_path)
                src = os.path.join(run_dir, rel_path)
                file_path.link_file(
                    dst, src, file_path.HARDLINK_WITH_FALLBACK)
            except OSError as err:
                # TODO(aludwin): surface this error
                message = '<Could not return file %s: %s>' % (rel_path, err)
                sys.stderr.write(message)
示例#4
0
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Links or copies every named output from run_dir into out_dir.

  Arguments:
  - run_dir: directory the outputs are read from.
  - out_dir: directory the outputs are placed in so they can be uploaded.
  - outputs: iterable of paths relative to run_dir; nothing is done when it
    is empty or None.

  An output that is itself a symlink is copied with fs.copy2(); anything else
  is linked with file_path.link_file(). Collection is best effort: an OSError
  for one output is logged at info level and the remaining outputs are still
  processed. Errors raised by isolateserver.create_directories() are not
  caught.
  """
  if outputs:
    # Make sure the destination directories exist before populating them.
    isolateserver.create_directories(out_dir, outputs)
    for rel_path in outputs:
      try:
        src = os.path.join(run_dir, rel_path)
        dst = os.path.join(out_dir, rel_path)
        if not fs.islink(src):
          file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
        else:
          # TODO(aludwin): handle directories
          fs.copy2(src, dst)
      except OSError as err:
        logging.info("Couldn't collect output file %s: %s", rel_path, err)
示例#5
0
def map_and_run(command, isolated_hash, storage, isolate_cache, outputs,
                init_named_caches, leak_temp_dir, root_dir, hard_timeout,
                grace_period, bot_file, install_packages_fn, use_symlinks,
                constant_run_path):
    """Runs a command with optional isolated input/output.

    See run_tha_test for argument documentation. What this function itself
    does with each argument:
    - command: list of arguments (asserted). When the isolated bundle declares
      a command, that command is prepended to this list.
    - isolated_hash: when truthy, the tree is fetched into the run directory
      with fetch_and_map().
    - storage: when falsy, no output directory is created and nothing is
      uploaded.
    - isolate_cache: passed to fetch_and_map(); its cache_dir is also used to
      derive root_dir when root_dir is None.
    - outputs: relative paths whose directories are pre-created in the run
      directory and which are linked into the output directory afterwards.
    - init_named_caches: called with the run directory; the returned object is
      used as a context manager around the command execution.
    - leak_temp_dir: when truthy, the run and temp directories are not
      deleted.
    - root_dir: parent of the run/out/tmp directories, or None.
    - hard_timeout, grace_period: forwarded to run_command().
    - bot_file: forwarded to process_command().
    - install_packages_fn: called with the run directory; the returned object
      is used as a context manager yielding cipd_info (may be falsy).
    - use_symlinks: forwarded to fetch_and_map().
    - constant_run_path: when truthy and root_dir is set, the run directory is
      root_dir/ISOLATED_RUN_DIR instead of a fresh temporary directory.

    Returns metadata about the result, as the 'result' dict built below.
    Exceptions raised while setting up or running the command are caught and
    reported through result['internal_failure'] instead of propagating.
    """
    assert isinstance(command, list), command
    assert root_dir or root_dir is None
    result = {
        'duration': None,
        'exit_code': None,
        'had_hard_timeout': False,
        'internal_failure': None,
        'stats': {
            # Shape of the entries that get filled in below:
            # 'isolated': {
            #    'cipd': {
            #      'duration': 0.,
            #      'get_client_duration': 0.,
            #    },
            #    'download': {
            #      'duration': 0.,
            #      'initial_number_items': 0,
            #      'initial_size': 0,
            #      'items_cold': '<large.pack()>',
            #      'items_hot': '<large.pack()>',
            #    },
            #    'upload': {
            #      'duration': 0.,
            #      'items_cold': '<large.pack()>',
            #      'items_hot': '<large.pack()>',
            #    },
            #  },
        },
        # 'cipd_pins': {
        #   'packages': [
        #     {'package_name': ..., 'version': ..., 'path': ...},
        #     ...
        #   ],
        #  'client_package': {'package_name': ..., 'version': ...},
        # },
        'outputs_ref': None,
        'version': 5,
    }

    if root_dir:
        file_path.ensure_tree(root_dir, 0700)
    elif isolate_cache.cache_dir:
        # No explicit root: place the working directories next to the cache.
        root_dir = os.path.dirname(isolate_cache.cache_dir)
    # See comment for these constants.
    # If root_dir is not specified, it is not constant.
    # TODO(maruel): This is not obvious. Change this to become an error once we
    # make the constant_run_path an exposed flag.
    if constant_run_path and root_dir:
        run_dir = os.path.join(root_dir, ISOLATED_RUN_DIR)
        # NOTE(review): os.mkdir() raises if run_dir already exists, and this
        # runs before the try block below, so the error would propagate to the
        # caller -- confirm a stale directory cannot be left behind.
        os.mkdir(run_dir)
    else:
        run_dir = make_temp_dir(ISOLATED_RUN_DIR, root_dir)
    # storage should be normally set but don't crash if it is not. This can happen
    # as Swarming task can run without an isolate server.
    out_dir = make_temp_dir(ISOLATED_OUT_DIR, root_dir) if storage else None
    tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, root_dir)
    cwd = run_dir

    try:
        with install_packages_fn(run_dir) as cipd_info:
            if cipd_info:
                result['stats']['cipd'] = cipd_info.stats
                result['cipd_pins'] = cipd_info.pins

            if isolated_hash:
                isolated_stats = result['stats'].setdefault('isolated', {})
                bundle, isolated_stats['download'] = fetch_and_map(
                    isolated_hash=isolated_hash,
                    storage=storage,
                    cache=isolate_cache,
                    outdir=run_dir,
                    use_symlinks=use_symlinks)
                change_tree_read_only(run_dir, bundle.read_only)
                cwd = os.path.normpath(os.path.join(cwd, bundle.relative_cwd))
                # Inject the command
                if bundle.command:
                    command = bundle.command + command

            if not command:
                # Handle this as a task failure, not an internal failure.
                # The 'finally' clause below still runs before returning.
                # NOTE(review): 'secify' in the message is a typo for
                # 'specify'; left untouched here because it is runtime text.
                sys.stderr.write(
                    '<No command was specified!>\n'
                    '<Please secify a command when triggering your Swarming task>\n'
                )
                result['exit_code'] = 1
                return result

            # If we have an explicit list of files to return, make sure their
            # directories exist now.
            if storage and outputs:
                isolateserver.create_directories(run_dir, outputs)

            command = tools.fix_python_path(command)
            command = process_command(command, out_dir, bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            with init_named_caches(run_dir):
                sys.stdout.flush()
                start = time.time()
                try:
                    result['exit_code'], result[
                        'had_hard_timeout'] = run_command(
                            command, cwd, get_command_env(tmp_dir, cipd_info),
                            hard_timeout, grace_period)
                finally:
                    # Record the duration even when run_command() raises;
                    # clamp to 0 in case the clock went backwards.
                    result['duration'] = max(time.time() - start, 0)
    except Exception as e:
        # An internal error occurred. Report accordingly so the swarming task will
        # be retried automatically.
        logging.exception('internal failure: %s', e)
        result['internal_failure'] = str(e)
        on_error.report(None)

    # Clean up
    finally:
        try:
            # Try to link files to the output directory, if specified.
            if out_dir:
                link_outputs_to_outdir(run_dir, out_dir, outputs)

            # 'success' tracks the most recent cleanup/upload step; a falsy
            # value turns a zero exit code into 1 further down.
            success = False
            if leak_temp_dir:
                success = True
                logging.warning(
                    'Deliberately leaking %s for later examination', run_dir)
            else:
                # On Windows the rmtree(run_dir) call below has a synchronization
                # effect: it finishes only when all task child processes terminate
                # (since a running process locks *.exe file). Examine out_dir only
                # after that call completes (since child processes may write to
                # out_dir too and we need to wait for them to finish).
                if fs.isdir(run_dir):
                    try:
                        success = file_path.rmtree(run_dir)
                    except OSError as e:
                        logging.error('Failure with %s', e)
                        success = False
                    if not success:
                        print >> sys.stderr, (
                            'Failed to delete the run directory, thus failing the task.\n'
                            'This may be due to a subprocess outliving the main task\n'
                            'process, holding on to resources. Please fix the task so\n'
                            'that it releases resources and cleans up subprocesses.'
                        )
                        if result['exit_code'] == 0:
                            result['exit_code'] = 1
                if fs.isdir(tmp_dir):
                    try:
                        success = file_path.rmtree(tmp_dir)
                    except OSError as e:
                        logging.error('Failure with %s', e)
                        success = False
                    if not success:
                        print >> sys.stderr, (
                            'Failed to delete the temp directory, thus failing the task.\n'
                            'This may be due to a subprocess outliving the main task\n'
                            'process, holding on to resources. Please fix the task so\n'
                            'that it releases resources and cleans up subprocesses.'
                        )
                        if result['exit_code'] == 0:
                            result['exit_code'] = 1

            # This deletes out_dir if leak_temp_dir is not set.
            if out_dir:
                isolated_stats = result['stats'].setdefault('isolated', {})
                result['outputs_ref'], success, isolated_stats['upload'] = (
                    delete_and_upload(storage, out_dir, leak_temp_dir))
            if not success and result['exit_code'] == 0:
                result['exit_code'] = 1
        except Exception as e:
            # Swallow any exception in the main finally clause.
            if out_dir:
                logging.exception('Leaking out_dir %s: %s', out_dir, e)
            result['internal_failure'] = str(e)
    return result
示例#6
0
def map_and_run(command, isolated_hash, storage, isolate_cache, outputs,
                init_name_caches, leak_temp_dir, root_dir, hard_timeout,
                grace_period, bot_file, extra_args, install_packages_fn,
                use_symlinks):
    """Runs a command with optional isolated input/output.

    See run_tha_test for argument documentation. What this function itself
    does with each argument:
    - command, isolated_hash: exactly one of the two must be truthy
      (asserted). With isolated_hash, the command comes from the fetched
      bundle.
    - storage: when falsy, no output directory is created and nothing is
      uploaded.
    - isolate_cache: passed to fetch_and_map(); its cache_dir is also used to
      derive root_dir when root_dir is None.
    - outputs: relative paths whose directories are pre-created in the run
      directory and which are linked into the output directory afterwards.
    - init_name_caches: called with the run directory before the command runs.
    - leak_temp_dir: when truthy, the run and temp directories are not
      deleted.
    - root_dir: parent of the run/out/tmp directories, or None.
    - hard_timeout, grace_period: forwarded to run_command().
    - bot_file: forwarded to process_command().
    - extra_args: appended to the bundle's command.
    - install_packages_fn: called with the run directory; a truthy return
      value is indexed with 'stats' and 'cipd_pins'.
    - use_symlinks: forwarded to fetch_and_map().

    Returns metadata about the result, as the 'result' dict built below.
    Exceptions raised while setting up or running the command are caught and
    reported through result['internal_failure'] instead of propagating.
    """
    assert root_dir or root_dir is None
    # Either a raw command or an isolated hash, never both and never neither.
    assert bool(command) ^ bool(isolated_hash)
    result = {
        'duration': None,
        'exit_code': None,
        'had_hard_timeout': False,
        'internal_failure': None,
        'stats': {
            # Shape of the entries that get filled in below:
            # 'isolated': {
            #    'cipd': {
            #      'duration': 0.,
            #      'get_client_duration': 0.,
            #    },
            #    'download': {
            #      'duration': 0.,
            #      'initial_number_items': 0,
            #      'initial_size': 0,
            #      'items_cold': '<large.pack()>',
            #      'items_hot': '<large.pack()>',
            #    },
            #    'upload': {
            #      'duration': 0.,
            #      'items_cold': '<large.pack()>',
            #      'items_hot': '<large.pack()>',
            #    },
            #  },
        },
        # 'cipd_pins': {
        #   'packages': [
        #     {'package_name': ..., 'version': ..., 'path': ...},
        #     ...
        #   ],
        #  'client_package': {'package_name': ..., 'version': ...},
        # },
        'outputs_ref': None,
        'version': 5,
    }

    if root_dir:
        file_path.ensure_tree(root_dir, 0700)
    elif isolate_cache.cache_dir:
        # No explicit root: place the working directories next to the cache.
        root_dir = os.path.dirname(isolate_cache.cache_dir)
    # See comment for these constants.
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, root_dir)
    # storage should be normally set but don't crash if it is not. This can happen
    # as Swarming task can run without an isolate server.
    out_dir = make_temp_dir(ISOLATED_OUT_DIR, root_dir) if storage else None
    tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, root_dir)
    cwd = run_dir

    try:
        cipd_info = install_packages_fn(run_dir)
        if cipd_info:
            result['stats']['cipd'] = cipd_info['stats']
            result['cipd_pins'] = cipd_info['cipd_pins']

        if isolated_hash:
            isolated_stats = result['stats'].setdefault('isolated', {})
            bundle, isolated_stats['download'] = fetch_and_map(
                isolated_hash=isolated_hash,
                storage=storage,
                cache=isolate_cache,
                outdir=run_dir,
                use_symlinks=use_symlinks)
            if not bundle.command:
                # Handle this as a task failure, not an internal failure.
                # The 'finally' clause below still runs before returning.
                sys.stderr.write(
                    '<The .isolated doesn\'t declare any command to run!>\n'
                    '<Check your .isolate for missing \'command\' variable>\n')
                if os.environ.get('SWARMING_TASK_ID'):
                    # Give an additional hint when running as a swarming task.
                    sys.stderr.write('<This occurs at the \'isolate\' step>\n')
                result['exit_code'] = 1
                return result

            change_tree_read_only(run_dir, bundle.read_only)
            cwd = os.path.normpath(os.path.join(cwd, bundle.relative_cwd))
            command = bundle.command + extra_args

        # If we have an explicit list of files to return, make sure their
        # directories exist now.
        if storage and outputs:
            isolateserver.create_directories(run_dir, outputs)

        command = tools.fix_python_path(command)
        command = process_command(command, out_dir, bot_file)
        file_path.ensure_command_has_abs_path(command, cwd)

        init_name_caches(run_dir)

        sys.stdout.flush()
        start = time.time()
        try:
            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, tmp_dir, hard_timeout, grace_period)
        finally:
            # Record the duration even when run_command() raises; clamp to 0
            # in case the clock went backwards.
            result['duration'] = max(time.time() - start, 0)
    except Exception as e:
        # An internal error occurred. Report accordingly so the swarming task will
        # be retried automatically.
        logging.exception('internal failure: %s', e)
        result['internal_failure'] = str(e)
        on_error.report(None)

    # Clean up
    finally:
        try:
            # Try to link files to the output directory, if specified.
            if out_dir:
                link_outputs_to_outdir(run_dir, out_dir, outputs)

            # 'success' tracks the most recent cleanup/upload step; a falsy
            # value turns a zero exit code into 1 further down.
            success = False
            if leak_temp_dir:
                success = True
                logging.warning(
                    'Deliberately leaking %s for later examination', run_dir)
            else:
                # On Windows the rmtree(run_dir) call below has a synchronization
                # effect: it finishes only when all task child processes terminate
                # (since a running process locks *.exe file). Examine out_dir only
                # after that call completes (since child processes may write to
                # out_dir too and we need to wait for them to finish).
                if fs.isdir(run_dir):
                    try:
                        success = file_path.rmtree(run_dir)
                    except OSError as e:
                        logging.error('Failure with %s', e)
                        success = False
                    if not success:
                        print >> sys.stderr, (
                            'Failed to delete the run directory, forcibly failing\n'
                            'the task because of it. No zombie process can outlive a\n'
                            'successful task run and still be marked as successful.\n'
                            'Fix your stuff.')
                        if result['exit_code'] == 0:
                            result['exit_code'] = 1
                if fs.isdir(tmp_dir):
                    try:
                        success = file_path.rmtree(tmp_dir)
                    except OSError as e:
                        logging.error('Failure with %s', e)
                        success = False
                    if not success:
                        print >> sys.stderr, (
                            'Failed to delete the temporary directory, forcibly failing\n'
                            'the task because of it. No zombie process can outlive a\n'
                            'successful task run and still be marked as successful.\n'
                            'Fix your stuff.')
                        if result['exit_code'] == 0:
                            result['exit_code'] = 1

            # This deletes out_dir if leak_temp_dir is not set.
            if out_dir:
                isolated_stats = result['stats'].setdefault('isolated', {})
                result['outputs_ref'], success, isolated_stats['upload'] = (
                    delete_and_upload(storage, out_dir, leak_temp_dir))
            if not success and result['exit_code'] == 0:
                result['exit_code'] = 1
        except Exception as e:
            # Swallow any exception in the main finally clause.
            if out_dir:
                logging.exception('Leaking out_dir %s: %s', out_dir, e)
            result['internal_failure'] = str(e)
    return result
示例#7
0
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: TODO

  Returns metadata about the result.
  """
  result = {
    'duration': None,
    'exit_code': None,
    'had_hard_timeout': False,
    'internal_failure': 'run_isolated did not complete properly',
    'stats': {
    # 'isolated': {
    #    'cipd': {
    #      'duration': 0.,
    #      'get_client_duration': 0.,
    #    },
    #    'download': {
    #      'duration': 0.,
    #      'initial_number_items': 0,
    #      'initial_size': 0,
    #      'items_cold': '<large.pack()>',
    #      'items_hot': '<large.pack()>',
    #    },
    #    'upload': {
    #      'duration': 0.,
    #      'items_cold': '<large.pack()>',
    #      'items_hot': '<large.pack()>',
    #    },
    #  },
    },
    # 'cipd_pins': {
    #   'packages': [
    #     {'package_name': ..., 'version': ..., 'path': ...},
    #     ...
    #   ],
    #  'client_package': {'package_name': ..., 'version': ...},
    # },
    'outputs_ref': None,
    'version': 5,
  }

  if data.root_dir:
    file_path.ensure_tree(data.root_dir, 0700)
  elif data.isolate_cache.cache_dir:
    data = data._replace(
        root_dir=os.path.dirname(data.isolate_cache.cache_dir))
  # See comment for these constants.
  # If root_dir is not specified, it is not constant.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)
  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = make_temp_dir(
      ISOLATED_OUT_DIR, data.root_dir) if data.storage else None
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  try:
    with data.install_packages_fn(run_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      if data.isolated_hash:
        isolated_stats = result['stats'].setdefault('isolated', {})
        bundle, isolated_stats['download'] = fetch_and_map(
            isolated_hash=data.isolated_hash,
            storage=data.storage,
            cache=data.isolate_cache,
            outdir=run_dir,
            use_symlinks=data.use_symlinks)
        change_tree_read_only(run_dir, bundle.read_only)
        # Inject the command
        if not command and bundle.command:
          command = bundle.command + data.extra_args
          # Only set the relative directory if the isolated file specified a
          # command, and no raw command was specified.
          if bundle.relative_cwd:
            cwd = os.path.normpath(os.path.join(cwd, bundle.relative_cwd))

      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      if not cwd.startswith(run_dir):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      command = tools.fix_python_path(command)
      command = process_command(command, out_dir, data.bot_file)
      file_path.ensure_command_has_abs_path(command, cwd)

      with data.install_named_caches(run_dir):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix)
            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period)
        finally:
          result['duration'] = max(time.time() - start, 0)

    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      # Try to link files to the output directory, if specified.
      if out_dir:
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)

      success = False
      if data.leak_temp_dir:
        success = True
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows rmtree(run_dir) call above has a synchronization effect: it
        # finishes only when all task child processes terminate (since a running
        # process locks *.exe file). Examine out_dir only after that call
        # completes (since child processes may write to out_dir too and we need
        # to wait for them to finish).
        if fs.isdir(run_dir):
          try:
            success = file_path.rmtree(run_dir)
          except OSError as e:
            logging.error('Failure with %s', e)
            success = False
          if not success:
            sys.stderr.write(OUTLIVING_ZOMBIE_MSG % ('run', data.grace_period))
            if result['exit_code'] == 0:
              result['exit_code'] = 1
        if fs.isdir(tmp_dir):
          try:
            success = file_path.rmtree(tmp_dir)
          except OSError as e:
            logging.error('Failure with %s', e)
            success = False
          if not success:
            sys.stderr.write(OUTLIVING_ZOMBIE_MSG % ('temp', data.grace_period))
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      # This deletes out_dir if leak_temp_dir is not set.
      if out_dir:
        isolated_stats = result['stats'].setdefault('isolated', {})
        result['outputs_ref'], success, isolated_stats['upload'] = (
            delete_and_upload(data.storage, out_dir, data.leak_temp_dir))
      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
  return result