예제 #1
0
def get_hadoop_conf_dir():
    """
  Return the hadoop shared conf directory which should be used for the command's component. The
  directory including the component's version is tried first, but if that doesn't exist,
  this will fallback to using "current".
  """
    stack_root = Script.get_stack_root()
    stack_version = Script.get_stack_version()

    hadoop_conf_dir = os.path.join(os.path.sep, "etc", "hadoop", "conf")
    if check_stack_feature(StackFeature.CONFIG_VERSIONING, stack_version):
        # read the desired version from the component map and use that for building the hadoop home
        version = component_version.get_component_repository_version()
        if version is None:
            version = default("/commandParams/version", None)

        hadoop_conf_dir = os.path.join(stack_root, str(version), "hadoop",
                                       "conf")
        if version is None or sudo.path_isdir(hadoop_conf_dir) is False:
            hadoop_conf_dir = os.path.join(stack_root, "current",
                                           "hadoop-client", "conf")

        Logger.info("Using hadoop conf dir: {0}".format(hadoop_conf_dir))

    return hadoop_conf_dir
예제 #2
0
def get_hadoop_dir(target):
  """
  Return the hadoop shared directory which should be used for the command's component. The
  directory including the component's version is tried first, but if that doesn't exist,
  this will fallback to using "current".

  :target: the target directory
  """
  stack_root = Script.get_stack_root()
  stack_version = Script.get_stack_version()

  if not target in HADOOP_DIR_DEFAULTS:
    raise Fail("Target {0} not defined".format(target))

  hadoop_dir = HADOOP_DIR_DEFAULTS[target]

  formatted_stack_version = format_stack_version(stack_version)

  if stack_features.check_stack_feature(StackFeature.ROLLING_UPGRADE, formatted_stack_version):
    # read the desired version from the component map and use that for building the hadoop home
    version = component_version.get_component_repository_version()
    if version is None:
      version = default("/commandParams/version", None)

    # home uses a different template
    if target == "home":
      hadoop_dir = HADOOP_HOME_DIR_TEMPLATE.format(stack_root, version, "hadoop")
      if version is None or sudo.path_isdir(hadoop_dir) is False:
        hadoop_dir = HADOOP_HOME_DIR_TEMPLATE.format(stack_root, "current", "hadoop-client")
    else:
      hadoop_dir = HADOOP_DIR_TEMPLATE.format(stack_root, version, "hadoop", target)
      if version is None or sudo.path_isdir(hadoop_dir) is False:
        hadoop_dir = HADOOP_DIR_TEMPLATE.format(stack_root, "current", "hadoop-client", target)

  return hadoop_dir
예제 #3
0
def get_hadoop_dir(target, force_latest_on_upgrade=False):
    """
  Return the hadoop shared directory in the following override order
  1. Use default for 2.1 and lower
  2. If 2.2 and higher, use <stack-root>/current/hadoop-client/{target}
  3. If 2.2 and higher AND for an upgrade, use <stack-root>/<version>/hadoop/{target}.
  However, if the upgrade has not yet invoked <stack-selector-tool>, return the current
  version of the component.
  :target: the target directory
  :force_latest_on_upgrade: if True, then this will return the "current" directory
  without the stack version built into the path, such as <stack-root>/current/hadoop-client
  """
    stack_root = Script.get_stack_root()
    stack_version = Script.get_stack_version()

    if not target in HADOOP_DIR_DEFAULTS:
        raise Fail("Target {0} not defined".format(target))

    hadoop_dir = HADOOP_DIR_DEFAULTS[target]

    formatted_stack_version = format_stack_version(stack_version)
    if formatted_stack_version and check_stack_feature(
            StackFeature.ROLLING_UPGRADE, formatted_stack_version):
        # home uses a different template
        if target == "home":
            hadoop_dir = HADOOP_HOME_DIR_TEMPLATE.format(
                stack_root, "current", "hadoop-client")
        else:
            hadoop_dir = HADOOP_DIR_TEMPLATE.format(stack_root, "current",
                                                    "hadoop-client", target)

        # if we are not forcing "current" for HDP 2.2, then attempt to determine
        # if the exact version needs to be returned in the directory
        if not force_latest_on_upgrade:
            stack_info = _get_upgrade_stack()

            if stack_info is not None:
                stack_version = stack_info[1]

                # determine if <stack-selector-tool> has been run and if not, then use the current
                # hdp version until this component is upgraded
                current_stack_version = get_role_component_current_stack_version(
                )
                if current_stack_version is not None and stack_version != current_stack_version:
                    stack_version = current_stack_version

                if target == "home":
                    # home uses a different template
                    hadoop_dir = HADOOP_HOME_DIR_TEMPLATE.format(
                        stack_root, stack_version, "hadoop")
                else:
                    hadoop_dir = HADOOP_DIR_TEMPLATE.format(
                        stack_root, stack_version, "hadoop", target)

    return hadoop_dir
예제 #4
0
def get_hadoop_dir(target, force_latest_on_upgrade=False):
  """
  Return the hadoop shared directory in the following override order
  1. Use default for 2.1 and lower
  2. If 2.2 and higher, use <stack-root>/current/hadoop-client/{target}
  3. If 2.2 and higher AND for an upgrade, use <stack-root>/<version>/hadoop/{target}.
  However, if the upgrade has not yet invoked <stack-selector-tool>, return the current
  version of the component.
  :target: the target directory
  :force_latest_on_upgrade: if True, then this will return the "current" directory
  without the stack version built into the path, such as <stack-root>/current/hadoop-client
  """
  stack_root = Script.get_stack_root()
  stack_version = Script.get_stack_version()

  if not target in HADOOP_DIR_DEFAULTS:
    raise Fail("Target {0} not defined".format(target))

  hadoop_dir = HADOOP_DIR_DEFAULTS[target]

  formatted_stack_version = format_stack_version(stack_version)
  if formatted_stack_version and  check_stack_feature(StackFeature.ROLLING_UPGRADE, formatted_stack_version):
    # home uses a different template
    if target == "home":
      hadoop_dir = HADOOP_HOME_DIR_TEMPLATE.format(stack_root, "current", "hadoop-client")
    else:
      hadoop_dir = HADOOP_DIR_TEMPLATE.format(stack_root, "current", "hadoop-client", target)

    # if we are not forcing "current" for HDP 2.2, then attempt to determine
    # if the exact version needs to be returned in the directory
    if not force_latest_on_upgrade:
      stack_info = _get_upgrade_stack()

      if stack_info is not None:
        stack_version = stack_info[1]

        # determine if <stack-selector-tool> has been run and if not, then use the current
        # hdp version until this component is upgraded
        current_stack_version = get_role_component_current_stack_version()
        if current_stack_version is not None and stack_version != current_stack_version:
          stack_version = current_stack_version

        if target == "home":
          # home uses a different template
          hadoop_dir = HADOOP_HOME_DIR_TEMPLATE.format(stack_root, stack_version, "hadoop")
        else:
          hadoop_dir = HADOOP_DIR_TEMPLATE.format(stack_root, stack_version, "hadoop", target)

  return hadoop_dir
예제 #5
0
def get_hadoop_conf_dir(force_latest_on_upgrade=False):
    """
  Gets the shared hadoop conf directory using:
  1.  Start with /etc/hadoop/conf
  2.  When the stack is greater than HDP-2.2, use <stack-root>/current/hadoop-client/conf
  3.  Only when doing a RU and HDP-2.3 or higher, use the value as computed
      by <conf-selector-tool>.  This is in the form <stack-root>/VERSION/hadoop/conf to make sure
      the configs are written in the correct place. However, if the component itself has
      not yet been upgraded, it should use the hadoop configs from the prior version.
      This will perform an <stack-selector-tool> status to determine which version to use.
  :param force_latest_on_upgrade:  if True, then force the returned path to always
  be that of the upgrade target version, even if <stack-selector-tool> has not been called. This
  is primarily used by hooks like before-ANY to ensure that hadoop environment
  configurations are written to the correct location since they are written out
  before the <stack-selector-tool>/<conf-selector-tool> would have been called.
  """
    hadoop_conf_dir = "/etc/hadoop/conf"
    stack_name = None
    stack_root = Script.get_stack_root()
    stack_version = Script.get_stack_version()
    version = None
    allow_setting_conf_select_symlink = False

    if not Script.in_stack_upgrade():
        # During normal operation, the HDP stack must be 2.3 or higher
        if stack_version and check_stack_feature(StackFeature.ROLLING_UPGRADE,
                                                 stack_version):
            hadoop_conf_dir = os.path.join(stack_root, "current",
                                           "hadoop-client", "conf")

        if stack_version and check_stack_feature(
                StackFeature.CONFIG_VERSIONING, stack_version):
            hadoop_conf_dir = os.path.join(stack_root, "current",
                                           "hadoop-client", "conf")
            stack_name = default("/hostLevelParams/stack_name", None)
            version = default("/commandParams/version", None)

            if not os.path.islink(hadoop_conf_dir) and stack_name and version:
                version = str(version)
                allow_setting_conf_select_symlink = True
    else:
        # During an upgrade/downgrade, which can be a Rolling or Express Upgrade, need to calculate it based on the version
        '''
    Whenever upgrading to HDP 2.2, or downgrading back to 2.2, need to use /etc/hadoop/conf
    Whenever upgrading to HDP 2.3, or downgrading back to 2.3, need to use a versioned hadoop conf dir

    Type__|_Source_|_Target_|_Direction_____________|_Comment_____________________________________________________________
    Normal|        | 2.2    |                       | Use /etc/hadoop/conf
    Normal|        | 2.3    |                       | Use /etc/hadoop/conf, which should be a symlink to <stack-root>/current/hadoop-client/conf
    EU    | 2.1    | 2.3    | Upgrade               | Use versioned <stack-root>/current/hadoop-client/conf
          |        |        | No Downgrade Allowed  | Invalid
    EU/RU | 2.2    | 2.2.*  | Any                   | Use <stack-root>/current/hadoop-client/conf
    EU/RU | 2.2    | 2.3    | Upgrade               | Use <stack-root>/$version/hadoop/conf, which should be a symlink destination
          |        |        | Downgrade             | Use <stack-root>/current/hadoop-client/conf
    EU/RU | 2.3    | 2.3.*  | Any                   | Use <stack-root>/$version/hadoop/conf, which should be a symlink destination
    '''

        # The "stack_version" is the desired stack, e.g., 2.2 or 2.3
        # In an RU, it is always the desired stack, and doesn't change even during the Downgrade!
        # In an RU Downgrade from HDP 2.3 to 2.2, the first thing we do is
        # rm /etc/[component]/conf and then mv /etc/[component]/conf.backup /etc/[component]/conf
        if stack_version and check_stack_feature(StackFeature.ROLLING_UPGRADE,
                                                 stack_version):
            hadoop_conf_dir = os.path.join(stack_root, "current",
                                           "hadoop-client", "conf")

            # This contains the "version", including the build number, that is actually used during a stack upgrade and
            # is the version upgrading/downgrading to.
            stack_info = stack_select._get_upgrade_stack()

            if stack_info is not None:
                stack_name = stack_info[0]
                version = stack_info[1]
            else:
                raise Fail("Unable to get parameter 'version'")

            Logger.info(
                "In the middle of a stack upgrade/downgrade for Stack {0} and destination version {1}, determining which hadoop conf dir to use."
                .format(stack_name, version))
            # This is the version either upgrading or downgrading to.
            if version and check_stack_feature(StackFeature.CONFIG_VERSIONING,
                                               version):
                # Determine if <stack-selector-tool> has been run and if not, then use the current
                # hdp version until this component is upgraded.
                if not force_latest_on_upgrade:
                    current_stack_version = stack_select.get_role_component_current_stack_version(
                    )
                    if current_stack_version is not None and version != current_stack_version:
                        version = current_stack_version
                        stack_selector_name = stack_tools.get_stack_tool_name(
                            stack_tools.STACK_SELECTOR_NAME)
                        Logger.info(
                            "{0} has not yet been called to update the symlink for this component, "
                            "keep using version {1}".format(
                                stack_selector_name, current_stack_version))

                # Only change the hadoop_conf_dir path, don't <conf-selector-tool> this older version
                hadoop_conf_dir = os.path.join(stack_root, version, "hadoop",
                                               "conf")
                Logger.info("Hadoop conf dir: {0}".format(hadoop_conf_dir))

                allow_setting_conf_select_symlink = True

    if allow_setting_conf_select_symlink:
        # If not in the middle of an upgrade and on HDP 2.3 or higher, or if
        # upgrading stack to version 2.3.0.0 or higher (which may be upgrade or downgrade), then consider setting the
        # symlink for /etc/hadoop/conf.
        # If a host does not have any HDFS or YARN components (e.g., only ZK), then it will not contain /etc/hadoop/conf
        # Therefore, any calls to <conf-selector-tool> will fail.
        # For that reason, if the hadoop conf directory exists, then make sure it is set.
        if os.path.exists(hadoop_conf_dir):
            conf_selector_name = stack_tools.get_stack_tool_name(
                stack_tools.CONF_SELECTOR_NAME)
            Logger.info(
                "The hadoop conf dir {0} exists, will call {1} on it for version {2}"
                .format(hadoop_conf_dir, conf_selector_name, version))
            select(stack_name, "hadoop", version)

    Logger.info("Using hadoop conf dir: {0}".format(hadoop_conf_dir))
    return hadoop_conf_dir
예제 #6
0
def get_hadoop_conf_dir(force_latest_on_upgrade=False):
  """
  Gets the shared hadoop conf directory using:
  1.  Start with /etc/hadoop/conf
  2.  When the stack is greater than HDP-2.2, use <stack-root>/current/hadoop-client/conf
  3.  Only when doing a RU and HDP-2.3 or higher, use the value as computed
      by <conf-selector-tool>.  This is in the form <stack-root>/VERSION/hadoop/conf to make sure
      the configs are written in the correct place. However, if the component itself has
      not yet been upgraded, it should use the hadoop configs from the prior version.
      This will perform an <stack-selector-tool> status to determine which version to use.
  :param force_latest_on_upgrade:  if True, then force the returned path to always
  be that of the upgrade target version, even if <stack-selector-tool> has not been called. This
  is primarily used by hooks like before-ANY to ensure that hadoop environment
  configurations are written to the correct location since they are written out
  before the <stack-selector-tool>/<conf-selector-tool> would have been called.
  """
  hadoop_conf_dir = "/etc/hadoop/conf"
  stack_name = None
  stack_root = Script.get_stack_root()
  stack_version = Script.get_stack_version()
  version = None
  allow_setting_conf_select_symlink = False

  if not Script.in_stack_upgrade():
    # During normal operation, the HDP stack must be 2.3 or higher
    if stack_version and check_stack_feature(StackFeature.ROLLING_UPGRADE, stack_version):
      hadoop_conf_dir = os.path.join(stack_root, "current", "hadoop-client", "conf")

    if stack_version and check_stack_feature(StackFeature.CONFIG_VERSIONING, stack_version):
      hadoop_conf_dir = os.path.join(stack_root, "current", "hadoop-client", "conf")
      stack_name = default("/hostLevelParams/stack_name", None)
      version = default("/commandParams/version", None)

      if stack_name and version:
        version = str(version)
        allow_setting_conf_select_symlink = True
  else:
    # During an upgrade/downgrade, which can be a Rolling or Express Upgrade, need to calculate it based on the version
    '''
    Whenever upgrading to HDP 2.2, or downgrading back to 2.2, need to use /etc/hadoop/conf
    Whenever upgrading to HDP 2.3, or downgrading back to 2.3, need to use a versioned hadoop conf dir

    Type__|_Source_|_Target_|_Direction_____________|_Comment_____________________________________________________________
    Normal|        | 2.2    |                       | Use /etc/hadoop/conf
    Normal|        | 2.3    |                       | Use /etc/hadoop/conf, which should be a symlink to <stack-root>/current/hadoop-client/conf
    EU    | 2.1    | 2.3    | Upgrade               | Use versioned <stack-root>/current/hadoop-client/conf
          |        |        | No Downgrade Allowed  | Invalid
    EU/RU | 2.2    | 2.2.*  | Any                   | Use <stack-root>/current/hadoop-client/conf
    EU/RU | 2.2    | 2.3    | Upgrade               | Use <stack-root>/$version/hadoop/conf, which should be a symlink destination
          |        |        | Downgrade             | Use <stack-root>/current/hadoop-client/conf
    EU/RU | 2.3    | 2.3.*  | Any                   | Use <stack-root>/$version/hadoop/conf, which should be a symlink destination
    '''

    # The "stack_version" is the desired stack, e.g., 2.2 or 2.3
    # In an RU, it is always the desired stack, and doesn't change even during the Downgrade!
    # In an RU Downgrade from HDP 2.3 to 2.2, the first thing we do is 
    # rm /etc/[component]/conf and then mv /etc/[component]/conf.backup /etc/[component]/conf
    if stack_version and check_stack_feature(StackFeature.ROLLING_UPGRADE, stack_version):
      hadoop_conf_dir = os.path.join(stack_root, "current", "hadoop-client", "conf")

      # This contains the "version", including the build number, that is actually used during a stack upgrade and
      # is the version upgrading/downgrading to.
      stack_info = stack_select._get_upgrade_stack()

      if stack_info is not None:
        stack_name = stack_info[0]
        version = stack_info[1]
      else:
        raise Fail("Unable to get parameter 'version'")
      
      Logger.info("In the middle of a stack upgrade/downgrade for Stack {0} and destination version {1}, determining which hadoop conf dir to use.".format(stack_name, version))
      # This is the version either upgrading or downgrading to.
      if version and check_stack_feature(StackFeature.CONFIG_VERSIONING, version):
        # Determine if <stack-selector-tool> has been run and if not, then use the current
        # hdp version until this component is upgraded.
        if not force_latest_on_upgrade:
          current_stack_version = stack_select.get_role_component_current_stack_version()
          if current_stack_version is not None and version != current_stack_version:
            version = current_stack_version
            stack_selector_name = stack_tools.get_stack_tool_name(stack_tools.STACK_SELECTOR_NAME)
            Logger.info("{0} has not yet been called to update the symlink for this component, "
                        "keep using version {1}".format(stack_selector_name, current_stack_version))

        # Only change the hadoop_conf_dir path, don't <conf-selector-tool> this older version
        hadoop_conf_dir = os.path.join(stack_root, version, "hadoop", "conf")
        Logger.info("Hadoop conf dir: {0}".format(hadoop_conf_dir))

        allow_setting_conf_select_symlink = True

  if allow_setting_conf_select_symlink:
    # If not in the middle of an upgrade and on HDP 2.3 or higher, or if
    # upgrading stack to version 2.3.0.0 or higher (which may be upgrade or downgrade), then consider setting the
    # symlink for /etc/hadoop/conf.
    # If a host does not have any HDFS or YARN components (e.g., only ZK), then it will not contain /etc/hadoop/conf
    # Therefore, any calls to <conf-selector-tool> will fail.
    # For that reason, if the hadoop conf directory exists, then make sure it is set.
    if os.path.exists(hadoop_conf_dir):
      conf_selector_name = stack_tools.get_stack_tool_name(stack_tools.CONF_SELECTOR_NAME)
      Logger.info("The hadoop conf dir {0} exists, will call {1} on it for version {2}".format(
              hadoop_conf_dir, conf_selector_name, version))
      select(stack_name, "hadoop", version)

  Logger.info("Using hadoop conf dir: {0}".format(hadoop_conf_dir))
  return hadoop_conf_dir
예제 #7
0
def get_hadoop_conf_dir(force_latest_on_upgrade=False):
    """
  Gets the shared hadoop conf directory using:
  1.  Start with /etc/hadoop/conf
  2.  When the stack is greater than HDP-2.2, use <stack-root>/current/hadoop-client/conf
  3.  Only when doing a RU and HDP-2.3 or higher, use the value as computed
      by <conf-selector-tool>.  This is in the form <stack-root>/VERSION/hadoop/conf to make sure
      the configs are written in the correct place. However, if the component itself has
      not yet been upgraded, it should use the hadoop configs from the prior version.
      This will perform an <stack-selector-tool> status to determine which version to use.
  :param force_latest_on_upgrade:  if True, then force the returned path to always
  be that of the upgrade target version, even if <stack-selector-tool> has not been called. This
  is primarily used by hooks like before-ANY to ensure that hadoop environment
  configurations are written to the correct location since they are written out
  before the <stack-selector-tool>/<conf-selector-tool> would have been called.
  """
    hadoop_conf_dir = "/etc/hadoop/conf"
    stack_name = None
    stack_root = Script.get_stack_root()
    stack_version = Script.get_stack_version()
    version = None

    if not Script.in_stack_upgrade():
        # During normal operation, the HDP stack must be 2.3 or higher
        if stack_version and check_stack_feature(StackFeature.ROLLING_UPGRADE,
                                                 stack_version):
            hadoop_conf_dir = os.path.join(stack_root, "current",
                                           "hadoop-client", "conf")

        if stack_version and check_stack_feature(
                StackFeature.CONFIG_VERSIONING, stack_version):
            hadoop_conf_dir = os.path.join(stack_root, "current",
                                           "hadoop-client", "conf")
            stack_name = default("/hostLevelParams/stack_name", None)
            version = default("/commandParams/version", None)

            if not os.path.islink(hadoop_conf_dir) and stack_name and version:
                version = str(version)
    else:
        # The "stack_version" is the desired stack, e.g., 2.2 or 2.3
        # In an RU, it is always the desired stack, and doesn't change even during the Downgrade!
        # In an RU Downgrade from HDP 2.3 to 2.2, the first thing we do is
        # rm /etc/[component]/conf and then mv /etc/[component]/conf.backup /etc/[component]/conf
        if stack_version and check_stack_feature(StackFeature.ROLLING_UPGRADE,
                                                 stack_version):
            hadoop_conf_dir = os.path.join(stack_root, "current",
                                           "hadoop-client", "conf")

            # This contains the "version", including the build number, that is actually used during a stack upgrade and
            # is the version upgrading/downgrading to.
            stack_info = stack_select._get_upgrade_stack()

            if stack_info is None:
                raise Fail(
                    "Unable to retrieve the upgrade/downgrade stack information from the request"
                )

            stack_name = stack_info[0]
            version = stack_info[1]

            Logger.info(
                "An upgrade/downgrade for {0}-{1} is in progress, determining which hadoop conf dir to use."
                .format(stack_name, version))

            # This is the version either upgrading or downgrading to.
            if version and check_stack_feature(StackFeature.CONFIG_VERSIONING,
                                               version):
                # Determine if <stack-selector-tool> has been run and if not, then use the current
                # hdp version until this component is upgraded.
                if not force_latest_on_upgrade:
                    current_stack_version = stack_select.get_role_component_current_stack_version(
                    )
                    if current_stack_version is not None and version != current_stack_version:
                        version = current_stack_version
                        stack_selector_name = stack_tools.get_stack_tool_name(
                            stack_tools.STACK_SELECTOR_NAME)
                        Logger.info(
                            "{0} has not yet been called to update the symlink for this component, "
                            "keep using version {1}".format(
                                stack_selector_name, current_stack_version))

                # Only change the hadoop_conf_dir path, don't <conf-selector-tool> this older version
                hadoop_conf_dir = os.path.join(stack_root, version, "hadoop",
                                               "conf")
                Logger.info("Hadoop conf dir: {0}".format(hadoop_conf_dir))

    Logger.info("Using hadoop conf dir: {0}".format(hadoop_conf_dir))
    return hadoop_conf_dir