def test_sa_expect_column_value_z_scores_to_be_less_than_impl(postgresql_engine): df = pd.DataFrame({"a": [1, 5, 22, 3, 5, 10]}) df.to_sql( name="z_score_test_data", con=postgresql_engine, index=False, if_exists="replace", ) expectationConfiguration = ExpectationConfiguration( expectation_type="expect_column_value_z_scores_to_be_less_than", kwargs={ "column": "a", "mostly": 0.9, "threshold": 4, "double_sided": True, }, ) expectation = ExpectColumnValueZScoresToBeLessThan(expectationConfiguration) engine = SqlAlchemyExecutionEngine(engine=postgresql_engine) engine.load_batch_data( "my_id", SqlAlchemyBatchData(execution_engine=engine, table_name="z_score_test_data"), ) result = expectation.validate(Validator(execution_engine=engine)) assert result == ExpectationValidationResult( success=True, )
def test_spark_expect_column_value_z_scores_to_be_less_than_impl( spark_session, basic_spark_df_execution_engine ): df = pd.DataFrame({"a": [1, 5, 22, 3, 5, 10]}) spark = get_or_create_spark_application( spark_config={ "spark.sql.catalogImplementation": "hive", "spark.executor.memory": "450m", # "spark.driver.allowMultipleContexts": "true", # This directive does not appear to have any effect. } ) df = spark.createDataFrame(df) expectationConfiguration = ExpectationConfiguration( expectation_type="expect_column_value_z_scores_to_be_less_than", kwargs={ "column": "a", "mostly": 0.9, "threshold": 4, "double_sided": True, }, ) expectation = ExpectColumnValueZScoresToBeLessThan(expectationConfiguration) engine = basic_spark_df_execution_engine engine.load_batch_data(batch_id="my_id", batch_data=df) result = expectation.validate(Validator(execution_engine=engine)) assert result == ExpectationValidationResult( success=True, )
def test_expect_column_value_z_scores_to_be_less_than_impl(): df = pd.DataFrame({"a": [1, 5, 22, 3, 5, 10]}) expectationConfiguration = ExpectationConfiguration( expectation_type="expect_column_value_z_scores_to_be_less_than", kwargs={ "column": "a", "mostly": 0.9, "threshold": 4, "double_sided": True, }, ) expectation = ExpectColumnValueZScoresToBeLessThan( expectationConfiguration) engine = PandasExecutionEngine(batch_data_dict={"my_id": df}) result = expectation.validate(Validator(execution_engine=engine)) assert result == ExpectationValidationResult(success=True, )