Exemple #1
0
 def test_v3_checkpoint_api_pass(self):
     task = RunGreatExpectationsValidation(
         context_root_dir=str(V3_API_PATH),
         checkpoint_name="my_checkpoint_pass",
     )
     results = task.run()
     assert type(results) is CheckpointResult
Exemple #2
0
 def test_v2_checkpoint_api(self):
     task = RunGreatExpectationsValidation(
         context_root_dir=str(V2_API_PATH),
         checkpoint_name="my_chk",
     )
     results = task.run()
     assert type(results) is ValidationOperatorResult
 def test_v3_checkpoint_api_fail(self):
     task = RunGreatExpectationsValidation(
         context_root_dir=str(Path(__file__).parent.resolve() / "v3_api"),
         checkpoint_name="my_checkpoint_fail",
     )
     with pytest.raises(signals.FAIL):
         task.run()
Exemple #4
0
 def test_v3_checkpoint_api_fail(self):
     task = RunGreatExpectationsValidation(
         context_root_dir=str(V3_API_PATH),
         checkpoint_name="my_checkpoint_fail",
     )
     with pytest.raises(signals.FAIL):
         task.run()
Exemple #5
0
 def test_v3_with_checkpoint_config(self, in_memory_checkpoint):
     task = RunGreatExpectationsValidation(
         ge_checkpoint=in_memory_checkpoint,
         context_root_dir=str(V3_API_PATH),
     )
     results = task.run()
     assert type(results) is CheckpointResult
 def test_v3_checkpoint_api_pass(self):
     task = RunGreatExpectationsValidation(
         context_root_dir=str(Path(__file__).parent.resolve() / "v3_api"),
         checkpoint_name="my_checkpoint_pass",
     )
     results = task.run()
     assert type(results) is CheckpointResult
Exemple #7
0
 def test_v3_with_checkpoint_config(self, in_memory_checkpoint):
     task = RunGreatExpectationsValidation(
         ge_checkpoint=in_memory_checkpoint,
         context_root_dir=str(V3_API_PATH),
     )
     results = task.run()
     assert type(results) is CheckpointResult
     serializable_results = repr(results)
     assert "run_id" in serializable_results
     assert "run_results" in serializable_results
     assert "checkpoint_config" in serializable_results
     assert "success" in serializable_results
Exemple #8
0
 def test_v3_checkpoint_api_pass(self):
     task = RunGreatExpectationsValidation(
         context_root_dir=str(V3_API_PATH),
         checkpoint_name="my_checkpoint_pass",
     )
     results = task.run()
     assert type(results) is CheckpointResult
     serializable_results = repr(results)
     assert "run_id" in serializable_results
     assert "run_results" in serializable_results
     assert "checkpoint_config" in serializable_results
     assert "success" in serializable_results
Exemple #9
0
 def test_v2_checkpoint_api(self):
     task = RunGreatExpectationsValidation(
         context_root_dir=str(V2_API_PATH),
         checkpoint_name="my_chk",
     )
     results = task.run()
     assert type(results) is ValidationOperatorResult
     serializable_results = repr(results)
     assert "run_id" in serializable_results
     assert "run_results" in serializable_results
     assert "validation_operator_config" in serializable_results
     assert "evaluation_parameters" in serializable_results
     assert "success" in serializable_results
Exemple #10
0
 def test_suite_name_with_batch_kwargs(self):
     task = RunGreatExpectationsValidation(
         context_root_dir=str(V2_API_PATH),
         batch_kwargs={
             "path":
             "tests/tasks/great_expectations/data/yellow_tripdata_sample_2019-01.csv",
             "datasource": "data__dir",
             "data_asset_name": "yellow_tripdata_sample_2019-01",
         },
         expectation_suite_name="taxi.demo",
     )
     results = task.run()
     assert type(results) is ValidationOperatorResult
Exemple #11
0
 def test_v3_with_runtime_data_frame(self, in_memory_runtime_batch_request,
                                     in_memory_data_context):
     task = RunGreatExpectationsValidation(
         checkpoint_name="my_checkpoint_pass",
         context=in_memory_data_context,
         checkpoint_kwargs={
             "validations": [{
                 "batch_request": in_memory_runtime_batch_request,
                 "expectation_suite_name": "taxi.demo_pass",
             }]
         },
     )
     results = task.run()
     assert type(results) is CheckpointResult
Exemple #12
0
 def test_kwargs_get_passed_to_task_init(self):
     t = RunGreatExpectationsValidation(
         checkpoint_name="checkpoint",
         context=1234,
         assets_to_validate=["assets"],
         batch_kwargs={"kwargs": "here"},
         expectation_suite_name="name",
         context_root_dir="/path/to/somewhere",
         runtime_environment={
             "plugins_directory": "/path/to/plugins/somewhere/else"
         },
         run_name="1234",
         run_info_at_end=False,
         disable_markdown_artifact=True,
         evaluation_parameters=dict(prev_run_row_count=100),
     )
     assert t.checkpoint_name == "checkpoint"
     assert t.context == 1234
     assert t.assets_to_validate == ["assets"]
     assert t.batch_kwargs == {"kwargs": "here"}
     assert t.expectation_suite_name == "name"
     assert t.context_root_dir == "/path/to/somewhere"
     assert t.runtime_environment == {
         "plugins_directory": "/path/to/plugins/somewhere/else"
     }
     assert t.run_name == "1234"
     assert t.run_info_at_end == False
     assert t.disable_markdown_artifact == True
     assert t.evaluation_parameters == dict(prev_run_row_count=100)
Exemple #13
0
 def test_assets_to_validate(self):
     context = ge.DataContext(context_root_dir=str(V2_API_PATH))
     task = RunGreatExpectationsValidation(
         context=context,
         assets_to_validate=[
             context.get_batch(
                 {
                     "path":
                     "tests/tasks/great_expectations/data/yellow_tripdata_sample_2019-01.csv",
                     "datasource": "data__dir",
                     "data_asset_name": "yellow_tripdata_sample_2019-01",
                 },
                 "taxi.demo",
             )
         ],
     )
     results = task.run()
     assert type(results) is ValidationOperatorResult
Exemple #14
0
 def test_suite_name_with_batch_kwargs(self):
     task = RunGreatExpectationsValidation(
         context_root_dir=str(V2_API_PATH),
         batch_kwargs={
             "path":
             "tests/tasks/great_expectations/data/yellow_tripdata_sample_2019-01.csv",
             "datasource": "data__dir",
             "data_asset_name": "yellow_tripdata_sample_2019-01",
         },
         expectation_suite_name="taxi.demo",
     )
     results = task.run()
     assert type(results) is ValidationOperatorResult
     serializable_results = repr(results)
     assert "run_id" in serializable_results
     assert "run_results" in serializable_results
     assert "validation_operator_config" in serializable_results
     assert "evaluation_parameters" in serializable_results
     assert "success" in serializable_results
Exemple #15
0
 def test_assets_to_validate(self):
     context = ge.DataContext(context_root_dir=str(V2_API_PATH))
     task = RunGreatExpectationsValidation(
         context=context,
         assets_to_validate=[
             context.get_batch(
                 {
                     "path":
                     "tests/tasks/great_expectations/data/yellow_tripdata_sample_2019-01.csv",
                     "datasource": "data__dir",
                     "data_asset_name": "yellow_tripdata_sample_2019-01",
                 },
                 "taxi.demo",
             )
         ],
     )
     results = task.run()
     assert type(results) is ValidationOperatorResult
     serializable_results = repr(results)
     assert "run_id" in serializable_results
     assert "run_results" in serializable_results
     assert "validation_operator_config" in serializable_results
     assert "evaluation_parameters" in serializable_results
     assert "success" in serializable_results
from prefect import Flow, Parameter
from prefect.tasks.great_expectations import RunGreatExpectationsValidation

ge_task = RunGreatExpectationsValidation()

with Flow("great expectations example flow") as flow:
    checkpoint_name = Parameter("checkpoint_name")
    validations = ge_task.map(checkpoint_name)

if __name__ == "__main__":
    flow.run(checkpoint_name=[
        "warning_npi_checkpoint", "guaranteed_failure_npi_checkpoint"
    ])
Exemple #17
0
 def test_inits_with_no_args(self):
     t = RunGreatExpectationsValidation()
     assert t
Exemple #18
0
    def test_raises_if_params_not_mutually_exclusive(self):
        task = RunGreatExpectationsValidation(context="test")
        with pytest.raises(ValueError, match="Exactly"):
            task.run()

        with pytest.raises(ValueError, match="Exactly"):
            task.run(expectation_suite_name="name")

        with pytest.raises(ValueError, match="Exactly"):
            task.run(batch_kwargs={"here"})

        with pytest.raises(ValueError, match="Exactly"):
            task.run(
                expectation_suite_name="name",
                batch_kwargs={"here"},
                assets_to_validate=["val"],
            )

        with pytest.raises(ValueError, match="Exactly"):
            task.run(assets_to_validate=["val"], checkpoint_name="name")