def get_lso_channel(): """ Get the channel to use for installing the local storage operator Returns: str: local storage operator channel """ ocp_version = get_ocp_version() # If OCP version is not GA, we will be using the Optional Operators CatalogSource # This means there are two PackageManifests with the name local-storage-operator # so we need to also use a selector to ensure we retrieve the correct one ocp_ga_version = get_ocp_ga_version(ocp_version) selector = constants.OPTIONAL_OPERATORS_SELECTOR if not ocp_ga_version else None # Retrieve available channels for LSO package_manifest = PackageManifest( resource_name=constants.LOCAL_STORAGE_CSV_PREFIX, selector=selector) channels = package_manifest.get_channels() channel_names = [channel["name"] for channel in channels] # Ensure channel_names is sorted versions = [ LooseVersion(name) for name in channel_names if name != "stable" ] versions.sort() sorted_versions = [v.vstring for v in versions] if ocp_version in channel_names: # Use channel corresponding to OCP version return ocp_version else: # Use latest channel return sorted_versions[-1]
def generate_exporter_script(): """ Generates exporter script for RHCS cluster Returns: str: path to the exporter script """ # generate exporter script through packagemanifest ocs_operator_name = defaults.OCS_OPERATOR_NAME operator_selector = get_selector_for_ocs_operator() package_manifest = PackageManifest( resource_name=ocs_operator_name, selector=operator_selector, ) ocs_operator_data = package_manifest.get() encoded_script = ocs_operator_data["status"]["channels"][0]["currentCSVDesc"][ "annotations" ]["external.features.ocs.openshift.io/export-script"] # decode the exporter script and write to file external_script = decode(encoded_script) external_cluster_details_exporter = tempfile.NamedTemporaryFile( mode="w+", prefix="external-cluster-details-exporter-", suffix=".py", delete=False, ) with open(external_cluster_details_exporter.name, "w") as fd: fd.write(external_script) logger.info( f"external cluster script is located at {external_cluster_details_exporter.name}" ) return external_cluster_details_exporter.name
def get_lso_channel(): """ Get the channel to use for installing the local storage operator Returns: str: local storage operator channel """ ocp_version = get_ocp_version() # Retrieve available channels for LSO package_manifest = PackageManifest( resource_name=constants.LOCAL_STORAGE_CSV_PREFIX) channels = package_manifest.get_channels() channel_names = [channel['name'] for channel in channels] # Ensure channel_names is sorted versions = [LooseVersion(name) for name in channel_names] versions.sort() sorted_versions = [v.vstring for v in versions] if ocp_version in channel_names: # Use channel corresponding to OCP version return ocp_version else: # Use latest channel return sorted_versions[-1]
def get_version_info(namespace=None): package_manifest = PackageManifest( resource_name=defaults.OCS_OPERATOR_NAME) csv_name = package_manifest.get_current_csv() csv_pre = CSV(resource_name=csv_name, namespace=namespace) info = get_images(csv_pre.get()) return info
def deploy_ocs_via_operator(self): """ Method for deploy OCS via OCS operator """ logger.info("Deployment of OCS via OCS operator") olm_manifest = self.get_olm_manifest() self.label_and_taint_nodes() run_cmd(f"oc create -f {olm_manifest}") # wait for package manifest package_manifest = PackageManifest( resource_name=defaults.OCS_OPERATOR_NAME) # Wait for package manifest is ready package_manifest.wait_for_resource() channel = config.DEPLOYMENT.get('ocs_csv_channel') csv_name = package_manifest.get_current_csv(channel=channel) csv = CSV(resource_name=csv_name, kind="csv", namespace=self.namespace) csv.wait_for_phase("Succeeded") ocs_operator_storage_cluster_cr = config.DEPLOYMENT.get( 'ocs_operator_storage_cluster_cr') cluster_data = templating.load_yaml(ocs_operator_storage_cluster_cr) cluster_data['metadata']['name'] = config.ENV_DATA[ 'storage_cluster_name'] deviceset_data = templating.load_yaml(constants.DEVICESET_YAML) device_size = int( config.ENV_DATA.get('device_size', defaults.DEVICE_SIZE)) deviceset_data['dataPVCTemplate']['spec']['resources']['requests'][ 'storage'] = f"{device_size}Gi" cluster_data['spec']['storageDeviceSets'] = [deviceset_data] cluster_data_yaml = tempfile.NamedTemporaryFile( mode='w+', prefix='cluster_storage', delete=False) templating.dump_data_to_temp_yaml(cluster_data, cluster_data_yaml.name) run_cmd(f"oc create -f {cluster_data_yaml.name}")
def check_if_upgrade_completed(self, channel, csv_name_pre_upgrade): """ Checks if OCS operator finishes it's upgrade Args: channel: (str): OCS subscription channel csv_name_pre_upgrade: (str): OCS operator name Returns: bool: True if upgrade completed, False otherwise """ operator_selector = get_selector_for_ocs_operator() package_manifest = PackageManifest( resource_name=OCS_OPERATOR_NAME, selector=operator_selector, subscription_plan_approval=self.subscription_plan_approval, ) csv_name_post_upgrade = package_manifest.get_current_csv(channel) if csv_name_post_upgrade == csv_name_pre_upgrade: log.info(f"CSV is still: {csv_name_post_upgrade}") return False else: log.info(f"CSV now upgraded to: {csv_name_post_upgrade}") return True
def subscribe_ocs(self): """ This method subscription manifest and subscribe to OCS operator. """ subscription_yaml_data = templating.load_yaml( constants.SUBSCRIPTION_YAML) subscription_plan_approval = config.DEPLOYMENT.get( 'subscription_plan_approval') if subscription_plan_approval: subscription_yaml_data['spec']['installPlanApproval'] = ( subscription_plan_approval) channel = config.DEPLOYMENT.get('ocs_csv_channel') if channel: subscription_yaml_data['spec']['channel'] = channel subscription_manifest = tempfile.NamedTemporaryFile( mode='w+', prefix='subscription_manifest', delete=False) templating.dump_data_to_temp_yaml(subscription_yaml_data, subscription_manifest.name) run_cmd(f"oc create -f {subscription_manifest.name}") # wait for package manifest package_manifest = PackageManifest( resource_name=defaults.OCS_OPERATOR_NAME) # Wait for package manifest is ready package_manifest.wait_for_resource(timeout=300) channel = config.DEPLOYMENT.get('ocs_csv_channel') subscription_plan_approval = config.DEPLOYMENT.get( 'subscription_plan_approval') if subscription_plan_approval == 'Manual': wait_for_install_plan_and_approve(self.namespace)
def subscribe_ocs(self): """ This method subscription manifest and subscribe to OCS operator. """ live_deployment = config.DEPLOYMENT.get("live_deployment") if ( config.ENV_DATA["platform"] == constants.IBMCLOUD_PLATFORM and not live_deployment ): link_all_sa_and_secret_and_delete_pods(constants.OCS_SECRET, self.namespace) operator_selector = get_selector_for_ocs_operator() # wait for package manifest # For OCS version >= 4.9, we have odf-operator ocs_version = version.get_semantic_ocs_version_from_config() if ocs_version >= version.VERSION_4_9: ocs_operator_name = defaults.ODF_OPERATOR_NAME subscription_file = constants.SUBSCRIPTION_ODF_YAML else: ocs_operator_name = defaults.OCS_OPERATOR_NAME subscription_file = constants.SUBSCRIPTION_YAML package_manifest = PackageManifest( resource_name=ocs_operator_name, selector=operator_selector, ) # Wait for package manifest is ready package_manifest.wait_for_resource(timeout=300) default_channel = package_manifest.get_default_channel() subscription_yaml_data = templating.load_yaml(subscription_file) subscription_plan_approval = config.DEPLOYMENT.get("subscription_plan_approval") if subscription_plan_approval: subscription_yaml_data["spec"][ "installPlanApproval" ] = subscription_plan_approval custom_channel = config.DEPLOYMENT.get("ocs_csv_channel") if custom_channel: logger.info(f"Custom channel will be used: {custom_channel}") subscription_yaml_data["spec"]["channel"] = custom_channel else: logger.info(f"Default channel will be used: {default_channel}") subscription_yaml_data["spec"]["channel"] = default_channel if config.DEPLOYMENT.get("stage"): subscription_yaml_data["spec"]["source"] = constants.OPERATOR_SOURCE_NAME if config.DEPLOYMENT.get("live_deployment"): subscription_yaml_data["spec"]["source"] = config.DEPLOYMENT.get( "live_content_source", defaults.LIVE_CONTENT_SOURCE ) subscription_manifest = tempfile.NamedTemporaryFile( mode="w+", prefix="subscription_manifest", delete=False ) templating.dump_data_to_temp_yaml( subscription_yaml_data, subscription_manifest.name ) run_cmd(f"oc create -f {subscription_manifest.name}") logger.info("Sleeping for 15 seconds after subscribing OCS") if subscription_plan_approval == "Manual": wait_for_install_plan_and_approve(self.namespace)
def get_version_info(namespace=None): operator_selector = get_selector_for_ocs_operator() package_manifest = PackageManifest( resource_name=defaults.OCS_OPERATOR_NAME, selector=operator_selector, ) csv_name = package_manifest.get_current_csv() csv_pre = CSV(resource_name=csv_name, namespace=namespace) info = get_images(csv_pre.get()) return info
def deploy_ocs_via_operator(self): """ Method for deploy OCS via OCS operator """ logger.info("Deployment of OCS via OCS operator") olm_manifest, subscription_manifest = ( self.get_olm_and_subscription_manifest()) self.label_and_taint_nodes() run_cmd(f"oc create -f {olm_manifest}") catalog_source = CatalogSource( resource_name='ocs-catalogsource', namespace='openshift-marketplace', ) # Wait for catalog source is ready catalog_source.wait_for_state("READY") run_cmd(f"oc create -f {subscription_manifest}") package_manifest = PackageManifest( resource_name=defaults.OCS_OPERATOR_NAME) # Wait for package manifest is ready package_manifest.wait_for_resource() channel = config.DEPLOYMENT.get('ocs_csv_channel') csv_name = package_manifest.get_current_csv(channel=channel) csv = CSV(resource_name=csv_name, kind="csv", namespace=self.namespace) csv.wait_for_phase("Succeeded", timeout=400) ocs_operator_storage_cluster_cr = config.DEPLOYMENT.get( 'ocs_operator_storage_cluster_cr') cluster_data = templating.load_yaml(ocs_operator_storage_cluster_cr) cluster_data['metadata']['name'] = config.ENV_DATA[ 'storage_cluster_name'] deviceset_data = templating.load_yaml(constants.DEVICESET_YAML) device_size = int( config.ENV_DATA.get('device_size', defaults.DEVICE_SIZE)) deviceset_data['dataPVCTemplate']['spec']['resources']['requests'][ 'storage'] = f"{device_size}Gi" # Allow lower instance requests and limits for OCS deployment if config.DEPLOYMENT.get('allow_lower_instance_requirements'): none_resources = {'Requests': None, 'Limits': None} deviceset_data["resources"] = deepcopy(none_resources) cluster_data['spec']['resources'] = { resource: deepcopy(none_resources) for resource in ['mon', 'mds', 'rgw', 'mgr', 'noobaa'] } if self.platform.lower() == constants.VSPHERE_PLATFORM: cluster_data['spec']['monPVCTemplate']['spec'][ 'storageClassName'] = constants.DEFAULT_SC_VSPHERE deviceset_data['dataPVCTemplate']['spec'][ 'storageClassName'] = constants.DEFAULT_SC_VSPHERE cluster_data['spec']['storageDeviceSets'] = [deviceset_data] cluster_data_yaml = tempfile.NamedTemporaryFile( mode='w+', prefix='cluster_storage', delete=False) templating.dump_data_to_temp_yaml(cluster_data, cluster_data_yaml.name) run_cmd(f"oc create -f {cluster_data_yaml.name}")
def deploy_with_external_mode(self): """ This function handles the deployment of OCS on external/indpendent RHCS cluster """ live_deployment = config.DEPLOYMENT.get("live_deployment") logger.info("Deploying OCS with external mode RHCS") ui_deployment = config.DEPLOYMENT.get("ui_deployment") if not ui_deployment: logger.info("Creating namespace and operator group.") run_cmd(f"oc create -f {constants.OLM_YAML}") if not live_deployment: self.create_ocs_operator_source() self.subscribe_ocs() operator_selector = get_selector_for_ocs_operator() subscription_plan_approval = config.DEPLOYMENT.get( "subscription_plan_approval") package_manifest = PackageManifest( resource_name=defaults.OCS_OPERATOR_NAME, selector=operator_selector, subscription_plan_approval=subscription_plan_approval, ) package_manifest.wait_for_resource(timeout=300) channel = config.DEPLOYMENT.get("ocs_csv_channel") csv_name = package_manifest.get_current_csv(channel=channel) csv = CSV(resource_name=csv_name, namespace=self.namespace) csv.wait_for_phase("Succeeded", timeout=720) # Create secret for external cluster secret_data = templating.load_yaml( constants.EXTERNAL_CLUSTER_SECRET_YAML) external_cluster_details = config.EXTERNAL_MODE.get( "external_cluster_details", "") if not external_cluster_details: raise ExternalClusterDetailsException( "No external cluster data found") secret_data["data"][ "external_cluster_details"] = external_cluster_details secret_data_yaml = tempfile.NamedTemporaryFile( mode="w+", prefix="external_cluster_secret", delete=False) templating.dump_data_to_temp_yaml(secret_data, secret_data_yaml.name) logger.info("Creating external cluster secret") run_cmd(f"oc create -f {secret_data_yaml.name}") cluster_data = templating.load_yaml( constants.EXTERNAL_STORAGE_CLUSTER_YAML) cluster_data["metadata"]["name"] = config.ENV_DATA[ "storage_cluster_name"] cluster_data_yaml = tempfile.NamedTemporaryFile( mode="w+", prefix="external_cluster_storage", delete=False) templating.dump_data_to_temp_yaml(cluster_data, cluster_data_yaml.name) run_cmd(f"oc create -f {cluster_data_yaml.name}", timeout=2400) self.external_post_deploy_validation() setup_ceph_toolbox()
def subscribe_ocs(self): """ This method subscription manifest and subscribe to OCS operator. """ operator_selector = get_selector_for_ocs_operator() # wait for package manifest package_manifest = PackageManifest( resource_name=defaults.OCS_OPERATOR_NAME, selector=operator_selector, ) # Wait for package manifest is ready package_manifest.wait_for_resource(timeout=300) default_channel = package_manifest.get_default_channel() subscription_yaml_data = templating.load_yaml( constants.SUBSCRIPTION_YAML ) subscription_plan_approval = config.DEPLOYMENT.get( 'subscription_plan_approval' ) if subscription_plan_approval: subscription_yaml_data['spec']['installPlanApproval'] = ( subscription_plan_approval ) custom_channel = config.DEPLOYMENT.get('ocs_csv_channel') if custom_channel: logger.info(f"Custom channel will be used: {custom_channel}") subscription_yaml_data['spec']['channel'] = custom_channel else: logger.info(f"Default channel will be used: {default_channel}") subscription_yaml_data['spec']['channel'] = default_channel if config.DEPLOYMENT.get('stage'): subscription_yaml_data['spec']['source'] = ( constants.OPERATOR_SOURCE_NAME ) if config.DEPLOYMENT.get('live_deployment'): subscription_yaml_data['spec']['source'] = ( config.DEPLOYMENT.get( 'live_content_source', defaults.LIVE_CONTENT_SOURCE ) ) subscription_manifest = tempfile.NamedTemporaryFile( mode='w+', prefix='subscription_manifest', delete=False ) templating.dump_data_to_temp_yaml( subscription_yaml_data, subscription_manifest.name ) run_cmd(f"oc create -f {subscription_manifest.name}") subscription_plan_approval = config.DEPLOYMENT.get( 'subscription_plan_approval' ) if subscription_plan_approval == 'Manual': wait_for_install_plan_and_approve(self.namespace)
def deploy_with_external_mode(self): """ This function handles the deployment of OCS on external/indpendent RHCS cluster """ live_deployment = config.DEPLOYMENT.get("live_deployment") logger.info("Deploying OCS with external mode RHCS") ui_deployment = config.DEPLOYMENT.get("ui_deployment") if not ui_deployment: logger.info("Creating namespace and operator group.") run_cmd(f"oc create -f {constants.OLM_YAML}") if not live_deployment: create_catalog_source() self.subscribe_ocs() operator_selector = get_selector_for_ocs_operator() subscription_plan_approval = config.DEPLOYMENT.get("subscription_plan_approval") ocs_version = version.get_semantic_ocs_version_from_config() if ocs_version >= version.VERSION_4_9: ocs_operator_names = [ defaults.ODF_OPERATOR_NAME, defaults.OCS_OPERATOR_NAME, ] else: ocs_operator_names = [defaults.OCS_OPERATOR_NAME] channel = config.DEPLOYMENT.get("ocs_csv_channel") for ocs_operator_name in ocs_operator_names: package_manifest = PackageManifest( resource_name=ocs_operator_name, selector=operator_selector, subscription_plan_approval=subscription_plan_approval, ) package_manifest.wait_for_resource(timeout=300) csv_name = package_manifest.get_current_csv(channel=channel) csv = CSV(resource_name=csv_name, namespace=self.namespace) csv.wait_for_phase("Succeeded", timeout=720) # Set rook log level self.set_rook_log_level() # Create secret for external cluster create_external_secret() cluster_data = templating.load_yaml(constants.EXTERNAL_STORAGE_CLUSTER_YAML) cluster_data["metadata"]["name"] = config.ENV_DATA["storage_cluster_name"] cluster_data_yaml = tempfile.NamedTemporaryFile( mode="w+", prefix="external_cluster_storage", delete=False ) templating.dump_data_to_temp_yaml(cluster_data, cluster_data_yaml.name) run_cmd(f"oc create -f {cluster_data_yaml.name}", timeout=2400) self.external_post_deploy_validation() setup_ceph_toolbox()
def get_version_info(namespace=None): operator_selector = get_selector_for_ocs_operator() subscription_plan_approval = config.DEPLOYMENT.get("subscription_plan_approval") package_manifest = PackageManifest( resource_name=defaults.OCS_OPERATOR_NAME, selector=operator_selector, subscription_plan_approval=subscription_plan_approval, ) channel = config.DEPLOYMENT.get("ocs_csv_channel") csv_name = package_manifest.get_current_csv(channel) csv_pre = CSV(resource_name=csv_name, namespace=namespace) info = get_images(csv_pre.get()) return info
def test_upgrade(): ceph_cluster = CephCluster() ceph_cluster.enable_health_monitor() namespace = config.ENV_DATA['cluster_namespace'] ocs_catalog = CatalogSource( resource_name=constants.OPERATOR_CATALOG_SOURCE_NAME, namespace="openshift-marketplace", ) image_url = ocs_catalog.get_image_url() image_tag = ocs_catalog.get_image_name() if config.DEPLOYMENT.get('upgrade_to_latest', True): new_image_tag = get_latest_ds_olm_tag() else: new_image_tag = get_next_version_available_for_upgrade(image_tag) cs_data = deepcopy(ocs_catalog.data) cs_data['spec']['image'] = ':'.join([image_url, new_image_tag]) package_manifest = PackageManifest(resource_name=OCS_OPERATOR_NAME) csv_name_pre_upgrade = package_manifest.get_current_csv() log.info(f"CSV name before upgrade is: {csv_name_pre_upgrade}") csv_pre_upgrade = CSV(resource_name=csv_name_pre_upgrade, namespace=namespace) pre_upgrade_images = get_images(csv_pre_upgrade.get()) with NamedTemporaryFile() as cs_yaml: dump_data_to_temp_yaml(cs_data, cs_yaml.name) ocs_catalog.apply(cs_yaml.name) # Wait for package manifest is ready package_manifest.wait_for_resource() subscription_plan_approval = config.DEPLOYMENT.get( 'subscription_plan_approval') if subscription_plan_approval == 'Manual': wait_for_install_plan_and_approve(namespace) attempts = 145 for attempt in range(1, attempts): if attempts == attempt: raise TimeoutException("No new CSV found after upgrade!") log.info(f"Attempt {attempt}/{attempts} to check CSV upgraded.") package_manifest.reload_data() csv_name_post_upgrade = package_manifest.get_current_csv() if csv_name_post_upgrade == csv_name_pre_upgrade: log.info(f"CSV is still: {csv_name_post_upgrade}") sleep(5) else: log.info(f"CSV now upgraded to: {csv_name_post_upgrade}") break csv_post_upgrade = CSV(resource_name=csv_name_post_upgrade, namespace=namespace) log.info( f"Waiting for CSV {csv_name_post_upgrade} to be in succeeded state") csv_post_upgrade.wait_for_phase("Succeeded", timeout=600) post_upgrade_images = get_images(csv_post_upgrade.get()) old_images, _, _ = get_upgrade_image_info(pre_upgrade_images, post_upgrade_images) verify_image_versions(old_images) ocs_install_verification(timeout=600, skip_osd_distribution_check=True) ceph_cluster.disable_health_monitor() if ceph_cluster.health_error_status: CephHealthException(f"During upgrade hit Ceph HEALTH_ERROR: " f"{ceph_cluster.health_error_status}")
def get_ocs_csv(): """ Get the OCS CSV object Returns: CSV: OCS CSV object Raises: CSVNotFound: In case no CSV found. """ ver = get_semantic_ocs_version_from_config() operator_base = ( defaults.OCS_OPERATOR_NAME if ver < VERSION_4_9 else defaults.ODF_OPERATOR_NAME ) operator_name = f"{operator_base}.openshift-storage" operator = OCP(kind="operator", resource_name=operator_name) if "Error" in operator.data: raise CSVNotFound(f"{operator_name} is not found, csv check will be skipped") namespace = config.ENV_DATA["cluster_namespace"] operator_selector = get_selector_for_ocs_operator() subscription_plan_approval = config.DEPLOYMENT.get("subscription_plan_approval") ocs_package_manifest = PackageManifest( resource_name=defaults.OCS_OPERATOR_NAME, selector=operator_selector, subscription_plan_approval=subscription_plan_approval, ) channel = config.DEPLOYMENT.get("ocs_csv_channel") ocs_csv_name = None # OCS CSV is extracted from the available CSVs in cluster namespace # for Openshift dedicated platform if ( config.ENV_DATA["platform"].lower() == constants.OPENSHIFT_DEDICATED_PLATFORM or config.ENV_DATA["platform"].lower() == constants.ROSA_PLATFORM ): ocp_cluster = OCP(namespace=config.ENV_DATA["cluster_namespace"], kind="csv") for item in ocp_cluster.get()["items"]: if item["metadata"]["name"].startswith(defaults.OCS_OPERATOR_NAME): ocs_csv_name = item["metadata"]["name"] if not ocs_csv_name: raise CSVNotFound(f"No OCS CSV found for {config.ENV_DATA['platform']}") else: ocs_csv_name = ocs_package_manifest.get_current_csv(channel=channel) ocs_csv = CSV(resource_name=ocs_csv_name, namespace=namespace) log.info(f"Check if OCS operator: {ocs_csv_name} is in Succeeded phase.") ocs_csv.wait_for_phase(phase="Succeeded", timeout=600) return ocs_csv
def get_csv_name_pre_upgrade(self): """ Getting OCS operator name as displayed in CSV Returns: str: OCS operator name, as displayed in CSV """ operator_selector = get_selector_for_ocs_operator() package_manifest = PackageManifest( resource_name=OCS_OPERATOR_NAME, selector=operator_selector, ) channel = config.DEPLOYMENT.get('ocs_csv_channel') return package_manifest.get_current_csv(channel)
def get_couchbase_csv(self): """ " Get the Couchbase CSV object Returns: CSV: Couchbase CSV object Raises: CSVNotFound: In case no CSV found. """ cb_package_manifest = PackageManifest( resource_name="couchbase-enterprise-certified") cb_enter_csv = cb_package_manifest.get_current_csv( channel="stable", csv_pattern=constants.COUCHBASE_CSV_PREFIX) return cb_enter_csv
def get_images_post_upgrade(self, channel, pre_upgrade_images, upgrade_version): """ Checks if all images of OCS cluster upgraded, and return list of all images if upgrade success Args: channel: (str): OCS subscription channel pre_upgrade_images: (dict): Contains all OCS cluster images upgrade_version: (str): version to be upgraded Returns: set: Contains full path of OCS cluster old images """ operator_selector = get_selector_for_ocs_operator() package_manifest = PackageManifest( resource_name=OCS_OPERATOR_NAME, selector=operator_selector, subscription_plan_approval=self.subscription_plan_approval, ) csv_name_post_upgrade = package_manifest.get_current_csv(channel) csv_post_upgrade = CSV(resource_name=csv_name_post_upgrade, namespace=self.namespace) log.info( f"Waiting for CSV {csv_name_post_upgrade} to be in succeeded state" ) # Workaround for patching missing ceph-rook-tools pod after upgrade if self.version_before_upgrade == "4.2" and upgrade_version == "4.3": log.info("Force creating Ceph toolbox after upgrade 4.2 -> 4.3") setup_ceph_toolbox(force_setup=True) # End of workaround if config.DEPLOYMENT.get("external_mode") or config.ENV_DATA.get( "mcg_only_deployment"): timeout = 200 else: timeout = 200 * get_osd_count() csv_post_upgrade.wait_for_phase("Succeeded", timeout=timeout) post_upgrade_images = get_images(csv_post_upgrade.get()) old_images, _, _ = get_upgrade_image_info(pre_upgrade_images, post_upgrade_images) return old_images
def set_upgrade_channel(self): """ Wait for the new package manifest for upgrade. Returns: str: OCS subscription channel """ operator_selector = get_selector_for_ocs_operator() package_manifest = PackageManifest( resource_name=OCS_OPERATOR_NAME, selector=operator_selector, ) package_manifest.wait_for_resource() channel = config.DEPLOYMENT.get('ocs_csv_channel') if not channel: channel = package_manifest.get_default_channel() return channel
def get_ocs_csv(): """ Get the OCS CSV object Returns: CSV: OCS CSV object """ namespace = config.ENV_DATA['cluster_namespace'] operator_selector = get_selector_for_ocs_operator() ocs_package_manifest = PackageManifest( resource_name=defaults.OCS_OPERATOR_NAME, selector=operator_selector, ) channel = config.DEPLOYMENT.get('ocs_csv_channel') ocs_csv_name = ocs_package_manifest.get_current_csv(channel=channel) ocs_csv = CSV(resource_name=ocs_csv_name, namespace=namespace) log.info(f"Check if OCS operator: {ocs_csv_name} is in Succeeded phase.") ocs_csv.wait_for_phase(phase="Succeeded", timeout=600) return ocs_csv
def test_no_resource_found_for_packagemanifest(): """ Test that when we run into issue #1338, when no PackageManifest object found. This unit test serves two purposes: - to show what exactly happens to PackageManifest during issue #1338 - demonstrate that PackageManifest API remains unchanged """ # based on value of _data attribute when packagemanifest data are missing # as reported in https://github.com/red-hat-storage/ocs-ci/issues/1338 data_with_no_item = { 'apiVersion': 'v1', 'items': [], 'kind': 'List', 'metadata': {'resourceVersion': '', 'selfLink': ''} } with patch("ocs_ci.ocs.ocp.OCP.get", return_value=data_with_no_item): pm = PackageManifest(resource_name='foo', selector='bar') with pytest.raises(ResourceNotFoundError): pm.get_default_channel()
def get_csv_version(channel): """ Get the cluster-logging and Elasticsearch CSV version and Images of the pods Args: channel (str) : Logging Channel Returns: tuple: Tuple containing three elements cluster_logging_csv (str) : Name of the cluster-logging CSV elasticsearch_csv (str) : Name of the elasticsearch CSV dict: Images dict like: {'image_name': 'image.url.to:tag', ...} """ clo_package_manifest = PackageManifest(resource_name="cluster-logging") cluster_logging_csv = clo_package_manifest.get_current_csv(channel) es_package_manifest = PackageManifest(resource_name="elasticsearch-operator") elasticsearch_csv = es_package_manifest.get_current_csv(channel) logging_csv = CSV( resource_name=cluster_logging_csv, namespace=constants.OPENSHIFT_LOGGING_NAMESPACE, ) images = ocp.get_images(logging_csv.get()) return cluster_logging_csv, elasticsearch_csv, images
def get_ocs_csv(): """ Get the OCS CSV object Returns: CSV: OCS CSV object Raises: CSVNotFound: In case no CSV found. """ namespace = config.ENV_DATA["cluster_namespace"] operator_selector = get_selector_for_ocs_operator() subscription_plan_approval = config.DEPLOYMENT.get( "subscription_plan_approval") ocs_package_manifest = PackageManifest( resource_name=defaults.OCS_OPERATOR_NAME, selector=operator_selector, subscription_plan_approval=subscription_plan_approval, ) channel = config.DEPLOYMENT.get("ocs_csv_channel") ocs_csv_name = None # OCS CSV is extracted from the available CSVs in cluster namespace # for Openshift dedicated platform if config.ENV_DATA["platform"].lower( ) == constants.OPENSHIFT_DEDICATED_PLATFORM: ocp_cluster = OCP(namespace=config.ENV_DATA["cluster_namespace"], kind="csv") for item in ocp_cluster.get()["items"]: if item["metadata"]["name"].startswith(defaults.OCS_OPERATOR_NAME): ocs_csv_name = item["metadata"]["name"] if not ocs_csv_name: raise CSVNotFound("No OCS CSV found for openshift dedicated") else: ocs_csv_name = ocs_package_manifest.get_current_csv(channel=channel) ocs_csv = CSV(resource_name=ocs_csv_name, namespace=namespace) log.info(f"Check if OCS operator: {ocs_csv_name} is in Succeeded phase.") ocs_csv.wait_for_phase(phase="Succeeded", timeout=600) return ocs_csv
def test_upgrade(): namespace = config.ENV_DATA['cluster_namespace'] ocs_catalog = CatalogSource( resource_name=OPERATOR_CATALOG_SOURCE_NAME, namespace="openshift-marketplace", ) image_url = ocs_catalog.get_image_url() image_tag = ocs_catalog.get_image_name() if config.DEPLOYMENT.get('upgrade_to_latest', True): new_image_tag = get_latest_ds_olm_tag() else: new_image_tag = get_next_version_available_for_upgrade(image_tag) cs_data = deepcopy(ocs_catalog.data) cs_data['spec']['image'] = ':'.join([image_url, new_image_tag]) package_manifest = PackageManifest(resource_name=OCS_OPERATOR_NAME) csv_name_pre_upgrade = package_manifest.get_current_csv() log.info(f"CSV name before upgrade is: {csv_name_pre_upgrade}") with NamedTemporaryFile() as cs_yaml: dump_data_to_temp_yaml(cs_data, cs_yaml.name) ocs_catalog.apply(cs_yaml.name) # Wait for package manifest is ready package_manifest.wait_for_resource() attempts = 145 for attempt in range(1, attempts): if attempts == attempt: raise TimeoutException("No new CSV found after upgrade!") log.info(f"Attempt {attempt}/{attempts} to check CSV upgraded.") package_manifest.reload_data() csv_name_post_upgrade = package_manifest.get_current_csv() if csv_name_post_upgrade == csv_name_pre_upgrade: log.info(f"CSV is still: {csv_name_post_upgrade}") sleep(5) else: log.info(f"CSV now upgraded to: {csv_name_post_upgrade}") break csv = CSV( resource_name=csv_name_post_upgrade, namespace=namespace ) log.info( f"Waiting for CSV {csv_name_post_upgrade} to be in succeeded state" ) csv.wait_for_phase("Succeeded", timeout=400) ocs_install_verification(timeout=600)
def test_pm_null_get_default_channel(): pm = PackageManifest() with pytest.raises(ResourceNameNotSpecifiedException): pm.get_default_channel()
def test_pm_null(): """ Test that creation of PackageManifest object without any constructor agruments works (object is created, no exceptions are raised). """ PackageManifest()
def deploy_ocs_via_operator(self): """ Method for deploy OCS via OCS operator """ ui_deployment = config.DEPLOYMENT.get('ui_deployment') live_deployment = config.DEPLOYMENT.get('live_deployment') if config.DEPLOYMENT.get('local_storage'): setup_local_storage() if ui_deployment: if not live_deployment: self.create_ocs_operator_source() self.deployment_with_ui() # Skip the rest of the deployment when deploy via UI return else: logger.info("Deployment of OCS via OCS operator") self.label_and_taint_nodes() logger.info("Creating namespace and operator group.") run_cmd(f"oc create -f {constants.OLM_YAML}") if not live_deployment: self.create_ocs_operator_source() self.subscribe_ocs() operator_selector = get_selector_for_ocs_operator() package_manifest = PackageManifest( resource_name=defaults.OCS_OPERATOR_NAME, selector=operator_selector, ) package_manifest.wait_for_resource(timeout=300) channel = config.DEPLOYMENT.get('ocs_csv_channel') csv_name = package_manifest.get_current_csv(channel=channel) csv = CSV(resource_name=csv_name, namespace=self.namespace) csv.wait_for_phase("Succeeded", timeout=720) # Modify the CSV with custom values if required if all(key in config.DEPLOYMENT for key in ('csv_change_from', 'csv_change_to')): modify_csv(csv=csv_name, replace_from=config.DEPLOYMENT['csv_change_from'], replace_to=config.DEPLOYMENT['csv_change_to']) cluster_data = templating.load_yaml(constants.STORAGE_CLUSTER_YAML) cluster_data['metadata']['name'] = config.ENV_DATA[ 'storage_cluster_name'] deviceset_data = cluster_data['spec']['storageDeviceSets'][0] device_size = int( config.ENV_DATA.get('device_size', defaults.DEVICE_SIZE)) if self.platform.lower() == constants.BAREMETAL_PLATFORM: pv_size_list = helpers.get_pv_size( storageclass=constants.DEFAULT_STORAGECLASS_LSO) pv_size_list.sort() deviceset_data['dataPVCTemplate']['spec']['resources']['requests'][ 'storage'] = f"{pv_size_list[0]}" else: deviceset_data['dataPVCTemplate']['spec']['resources']['requests'][ 'storage'] = f"{device_size}Gi" if self.platform.lower() == constants.VSPHERE_PLATFORM: deviceset_data['dataPVCTemplate']['spec'][ 'storageClassName'] = constants.DEFAULT_SC_VSPHERE if config.DEPLOYMENT.get('local_storage'): cluster_data['spec']['manageNodes'] = False cluster_data['spec']['monDataDirHostPath'] = '/var/lib/rook' deviceset_data['portable'] = False deviceset_data['dataPVCTemplate']['spec'][ 'storageClassName'] = 'localblock' if self.platform.lower() == constants.AWS_PLATFORM: deviceset_data['count'] = 2 ocs_version = float(config.ENV_DATA['ocs_version']) # Allow lower instance requests and limits for OCS deployment # The resources we need to change can be found here: # https://github.com/openshift/ocs-operator/blob/release-4.5/pkg/deploy-manager/storagecluster.go#L88-L116 if config.DEPLOYMENT.get('allow_lower_instance_requirements'): none_resources = {'Requests': None, 'Limits': None} deviceset_data["resources"] = deepcopy(none_resources) resources = [ 'mon', 'mds', 'rgw', 'mgr', 'noobaa-core', 'noobaa-db', ] if ocs_version >= 4.5: resources.append('noobaa-endpoint') cluster_data['spec']['resources'] = { resource: deepcopy(none_resources) for resource in resources } else: local_storage = config.DEPLOYMENT.get('local_storage') platform = config.ENV_DATA.get('platform', '').lower() if local_storage and platform == 'aws': resources = { 'mds': { 'limits': { 'cpu': 3 }, 'requests': { 'cpu': 1 } }, 'noobaa-core': { 'limits': { 'cpu': 2, 'memory': '8Gi' }, 'requests': { 'cpu': 1, 'memory': '8Gi' } }, 'noobaa-db': { 'limits': { 'cpu': 2, 'memory': '8Gi' }, 'requests': { 'cpu': 1, 'memory': '8Gi' } } } if ocs_version >= 4.5: resources['noobaa-endpoint'] = { 'limits': { 'cpu': 2, 'memory': '8Gi' }, 'requests': { 'cpu': 1, 'memory': '8Gi' } } cluster_data['spec']['resources'] = resources # Enable host network if enabled in config (this require all the # rules to be enabled on underlaying platform). if config.DEPLOYMENT.get('host_network'): cluster_data['spec']['hostNetwork'] = True cluster_data['spec']['storageDeviceSets'] = [deviceset_data] cluster_data_yaml = tempfile.NamedTemporaryFile( mode='w+', prefix='cluster_storage', delete=False) templating.dump_data_to_temp_yaml(cluster_data, cluster_data_yaml.name) run_cmd(f"oc create -f {cluster_data_yaml.name}", timeout=2400)
def ocs_install_verification(timeout=600, skip_osd_distribution_check=False): """ Perform steps necessary to verify a successful OCS installation Args: timeout (int): Number of seconds for timeout which will be used in the checks used in this function. skip_osd_distribution_check (bool): If true skip the check for osd distribution. """ from ocs_ci.ocs.node import get_typed_nodes from ocs_ci.ocs.resources.pvc import get_deviceset_pvcs from ocs_ci.ocs.resources.pod import get_ceph_tools_pod, get_all_pods number_of_worker_nodes = len(get_typed_nodes()) namespace = config.ENV_DATA['cluster_namespace'] log.info("Verifying OCS installation") # Verify OCS CSV is in Succeeded phase log.info("verifying ocs csv") operator_selector = get_selector_for_ocs_operator() ocs_package_manifest = PackageManifest( resource_name=defaults.OCS_OPERATOR_NAME, selector=operator_selector, ) ocs_csv_name = ocs_package_manifest.get_current_csv() ocs_csv = CSV(resource_name=ocs_csv_name, namespace=namespace) log.info(f"Check if OCS operator: {ocs_csv_name} is in Succeeded phase.") ocs_csv.wait_for_phase(phase="Succeeded", timeout=timeout) # Verify OCS Cluster Service (ocs-storagecluster) is Ready storage_cluster_name = config.ENV_DATA['storage_cluster_name'] log.info("Verifying status of storage cluster: %s", storage_cluster_name) storage_cluster = StorageCluster( resource_name=storage_cluster_name, namespace=namespace, ) log.info(f"Check if StorageCluster: {storage_cluster_name} is in" f"Succeeded phase") storage_cluster.wait_for_phase(phase='Ready', timeout=timeout) # Verify pods in running state and proper counts log.info("Verifying pod states and counts") pod = OCP(kind=constants.POD, namespace=namespace) # ocs-operator assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.OCS_OPERATOR_LABEL, timeout=timeout) # rook-ceph-operator assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.OPERATOR_LABEL, timeout=timeout) # noobaa assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.NOOBAA_APP_LABEL, resource_count=2, timeout=timeout) # mons assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.MON_APP_LABEL, resource_count=3, timeout=timeout) # csi-cephfsplugin assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.CSI_CEPHFSPLUGIN_LABEL, resource_count=number_of_worker_nodes, timeout=timeout) # csi-cephfsplugin-provisioner assert pod.wait_for_resource( condition=constants.STATUS_RUNNING, selector=constants.CSI_CEPHFSPLUGIN_PROVISIONER_LABEL, resource_count=2, timeout=timeout) # csi-rbdplugin assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.CSI_RBDPLUGIN_LABEL, resource_count=number_of_worker_nodes, timeout=timeout) # csi-rbdplugin-provisioner assert pod.wait_for_resource( condition=constants.STATUS_RUNNING, selector=constants.CSI_RBDPLUGIN_PROVISIONER_LABEL, resource_count=2, timeout=timeout) # osds osd_count = ( int(storage_cluster.data['spec']['storageDeviceSets'][0]['count']) * int(storage_cluster.data['spec']['storageDeviceSets'][0]['replica'])) assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.OSD_APP_LABEL, resource_count=osd_count, timeout=timeout) # mgr assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.MGR_APP_LABEL, timeout=timeout) # mds assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.MDS_APP_LABEL, resource_count=2, timeout=timeout) # rgw check only for VmWare if config.ENV_DATA.get('platform') == constants.VSPHERE_PLATFORM: assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.RGW_APP_LABEL, resource_count=1, timeout=timeout) # Verify ceph health log.info("Verifying ceph health") assert utils.ceph_health_check(namespace=namespace) # Verify StorageClasses (1 ceph-fs, 1 ceph-rbd) log.info("Verifying storage classes") storage_class = OCP(kind=constants.STORAGECLASS, namespace=namespace) storage_cluster_name = config.ENV_DATA['storage_cluster_name'] required_storage_classes = { f'{storage_cluster_name}-cephfs', f'{storage_cluster_name}-ceph-rbd' } storage_classes = storage_class.get() storage_class_names = { item['metadata']['name'] for item in storage_classes['items'] } assert required_storage_classes.issubset(storage_class_names) # Verify OSD's are distributed if not skip_osd_distribution_check: log.info("Verifying OSD's are distributed evenly across worker nodes") ocp_pod_obj = OCP(kind=constants.POD, namespace=namespace) osds = ocp_pod_obj.get(selector=constants.OSD_APP_LABEL)['items'] node_names = [osd['spec']['nodeName'] for osd in osds] for node in node_names: assert not node_names.count(node) > 1, ( "OSD's are not distributed evenly across worker nodes") # Verify that CSI driver object contains provisioner names log.info("Verifying CSI driver object contains provisioner names.") csi_driver = OCP(kind="CSIDriver") assert {defaults.CEPHFS_PROVISIONER, defaults.RBD_PROVISIONER} == ({ item['metadata']['name'] for item in csi_driver.get()['items'] }) # Verify node and provisioner secret names in storage class log.info("Verifying node and provisioner secret names in storage class.") sc_rbd = storage_class.get( resource_name=constants.DEFAULT_STORAGECLASS_RBD) sc_cephfs = storage_class.get( resource_name=constants.DEFAULT_STORAGECLASS_CEPHFS) assert sc_rbd['parameters'][ 'csi.storage.k8s.io/node-stage-secret-name'] == constants.RBD_NODE_SECRET assert sc_rbd['parameters'][ 'csi.storage.k8s.io/provisioner-secret-name'] == constants.RBD_PROVISIONER_SECRET assert sc_cephfs['parameters'][ 'csi.storage.k8s.io/node-stage-secret-name'] == constants.CEPHFS_NODE_SECRET assert sc_cephfs['parameters'][ 'csi.storage.k8s.io/provisioner-secret-name'] == constants.CEPHFS_PROVISIONER_SECRET log.info("Verified node and provisioner secret names in storage class.") # Verify ceph osd tree output log.info( "Verifying ceph osd tree output and checking for device set PVC names " "in the output.") deviceset_pvcs = [pvc.name for pvc in get_deviceset_pvcs()] ct_pod = get_ceph_tools_pod() osd_tree = ct_pod.exec_ceph_cmd(ceph_cmd='ceph osd tree', format='json') schemas = { 'root': constants.OSD_TREE_ROOT, 'rack': constants.OSD_TREE_RACK, 'host': constants.OSD_TREE_HOST, 'osd': constants.OSD_TREE_OSD, 'region': constants.OSD_TREE_REGION, 'zone': constants.OSD_TREE_ZONE } schemas['host']['properties']['name'] = {'enum': deviceset_pvcs} for item in osd_tree['nodes']: validate(instance=item, schema=schemas[item['type']]) if item['type'] == 'host': deviceset_pvcs.remove(item['name']) assert not deviceset_pvcs, ( f"These device set PVCs are not given in ceph osd tree output " f"- {deviceset_pvcs}") log.info( "Verified ceph osd tree output. Device set PVC names are given in the " "output.") # TODO: Verify ceph osd tree output have osd listed as ssd # TODO: Verify ceph osd tree output have zone or rack based on AZ # Verify CSI snapshotter sidecar container is not present log.info("Verifying CSI snapshotter is not present.") provisioner_pods = get_all_pods( namespace=defaults.ROOK_CLUSTER_NAMESPACE, selector=[ constants.CSI_CEPHFSPLUGIN_PROVISIONER_LABEL, constants.CSI_RBDPLUGIN_PROVISIONER_LABEL ]) for pod_obj in provisioner_pods: pod_info = pod_obj.get() for container, image in get_images(data=pod_info).items(): assert ('snapshot' not in container) and ( 'snapshot' not in image), ( f"Snapshot container is present in {pod_obj.name} pod. " f"Container {container}. Image {image}") assert { 'name': 'CSI_ENABLE_SNAPSHOTTER', 'value': 'false' } in (ocs_csv.get()['spec']['install']['spec']['deployments'][0]['spec'] ['template']['spec']['containers'][0]['env'] ), "CSI_ENABLE_SNAPSHOTTER value is not set to 'false'." log.info("Verified: CSI snapshotter is not present.") # Verify pool crush rule is with "type": "zone" if utils.get_az_count() == 3: log.info("Verifying pool crush rule is with type: zone") crush_dump = ct_pod.exec_ceph_cmd(ceph_cmd='ceph osd crush dump', format='') pool_names = [ constants.METADATA_POOL, constants.DEFAULT_BLOCKPOOL, constants.DATA_POOL ] crush_rules = [ rule for rule in crush_dump['rules'] if rule['rule_name'] in pool_names ] for crush_rule in crush_rules: assert [ item for item in crush_rule['steps'] if item.get('type') == 'zone' ], f"{crush_rule['rule_name']} is not with type as zone" log.info("Verified - pool crush rule is with type: zone")
def ocs_install_verification(timeout=600, skip_osd_distribution_check=False): """ Perform steps necessary to verify a successful OCS installation Args: timeout (int): Number of seconds for timeout which will be used in the checks used in this function. skip_osd_distribution_check (bool): If true skip the check for osd distribution. """ from ocs_ci.ocs.node import get_typed_nodes number_of_worker_nodes = len(get_typed_nodes()) namespace = config.ENV_DATA['cluster_namespace'] log.info("Verifying OCS installation") # Verify OCS CSV is in Succeeded phase log.info("verifying ocs csv") ocs_package_manifest = PackageManifest( resource_name=defaults.OCS_OPERATOR_NAME) ocs_csv_name = ocs_package_manifest.get_current_csv() ocs_csv = CSV(resource_name=ocs_csv_name, namespace=namespace) log.info(f"Check if OCS operator: {ocs_csv_name} is in Succeeded phase.") ocs_csv.wait_for_phase(phase="Succeeded", timeout=timeout) # Verify OCS Cluster Service (ocs-storagecluster) is Ready storage_cluster_name = config.ENV_DATA['storage_cluster_name'] log.info("Verifying status of storage cluster: %s", storage_cluster_name) storage_cluster = StorageCluster( resource_name=storage_cluster_name, namespace=namespace, ) log.info(f"Check if StorageCluster: {storage_cluster_name} is in" f"Succeeded phase") storage_cluster.wait_for_phase(phase='Ready', timeout=timeout) # Verify pods in running state and proper counts log.info("Verifying pod states and counts") pod = OCP(kind=constants.POD, namespace=namespace) # ocs-operator assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.OCS_OPERATOR_LABEL, timeout=timeout) # rook-ceph-operator assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.OPERATOR_LABEL, timeout=timeout) # noobaa assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.NOOBAA_APP_LABEL, resource_count=2, timeout=timeout) # mons assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.MON_APP_LABEL, resource_count=3, timeout=timeout) # csi-cephfsplugin assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.CSI_CEPHFSPLUGIN_LABEL, resource_count=number_of_worker_nodes, timeout=timeout) # csi-cephfsplugin-provisioner assert pod.wait_for_resource( condition=constants.STATUS_RUNNING, selector=constants.CSI_CEPHFSPLUGIN_PROVISIONER_LABEL, resource_count=2, timeout=timeout) # csi-rbdplugin assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.CSI_RBDPLUGIN_LABEL, resource_count=number_of_worker_nodes, timeout=timeout) # csi-rbdplugin-profisioner assert pod.wait_for_resource( condition=constants.STATUS_RUNNING, selector=constants.CSI_RBDPLUGIN_PROVISIONER_LABEL, resource_count=2, timeout=timeout) # osds osd_count = ( int(storage_cluster.data['spec']['storageDeviceSets'][0]['count']) * int(storage_cluster.data['spec']['storageDeviceSets'][0]['replica'])) assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.OSD_APP_LABEL, resource_count=osd_count, timeout=timeout) # mgr assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.MGR_APP_LABEL, timeout=timeout) # mds assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.MDS_APP_LABEL, resource_count=2, timeout=timeout) # rgw check only for VmWare if config.ENV_DATA.get('platform') == constants.VSPHERE_PLATFORM: assert pod.wait_for_resource(condition=constants.STATUS_RUNNING, selector=constants.RGW_APP_LABEL, resource_count=1, timeout=timeout) # Verify ceph health log.info("Verifying ceph health") assert utils.ceph_health_check(namespace=namespace) # Verify StorageClasses (1 ceph-fs, 1 ceph-rbd) log.info("Verifying storage classes") storage_class = OCP(kind=constants.STORAGECLASS, namespace=namespace) storage_cluster_name = config.ENV_DATA['storage_cluster_name'] required_storage_classes = { f'{storage_cluster_name}-cephfs', f'{storage_cluster_name}-ceph-rbd' } storage_classes = storage_class.get() storage_class_names = { item['metadata']['name'] for item in storage_classes['items'] } assert required_storage_classes.issubset(storage_class_names) # Verify OSD's are distributed if not skip_osd_distribution_check: log.info("Verifying OSD's are distributed evenly across worker nodes") ocp_pod_obj = OCP(kind=constants.POD, namespace=namespace) osds = ocp_pod_obj.get(selector=constants.OSD_APP_LABEL)['items'] node_names = [osd['spec']['nodeName'] for osd in osds] for node in node_names: assert not node_names.count(node) > 1, ( "OSD's are not distributed evenly across worker nodes")