Python RunGreatExpectationsValidation示例，prefect.tasks.great_expectations.RunGreatExpectationsValidation Python示例

示例#1

0

显示文件

 def test_v3_checkpoint_api_pass(self):
     """Run the ``my_checkpoint_pass`` checkpoint and expect a ``CheckpointResult``."""
     init_kwargs = {
         "context_root_dir": str(V3_API_PATH),
         "checkpoint_name": "my_checkpoint_pass",
     }
     outcome = RunGreatExpectationsValidation(**init_kwargs).run()
     # Identity check on the concrete type: a subclass instance would not pass.
     assert type(outcome) is CheckpointResult

示例#2

0

显示文件

 def test_v2_checkpoint_api(self):
     """Run the ``my_chk`` checkpoint and expect a ``ValidationOperatorResult``."""
     init_kwargs = {
         "context_root_dir": str(V2_API_PATH),
         "checkpoint_name": "my_chk",
     }
     outcome = RunGreatExpectationsValidation(**init_kwargs).run()
     # Identity check on the concrete type: a subclass instance would not pass.
     assert type(outcome) is ValidationOperatorResult

示例#3

0

显示文件

文件： test_great_expectations_validation.py 项目： tank0226/prefect

 def test_v3_checkpoint_api_fail(self):
     """Running the ``my_checkpoint_fail`` checkpoint must raise ``signals.FAIL``."""
     # The context directory is the "v3_api" folder next to this test file.
     v3_root = Path(__file__).parent.resolve() / "v3_api"
     failing_task = RunGreatExpectationsValidation(
         context_root_dir=str(v3_root),
         checkpoint_name="my_checkpoint_fail",
     )
     with pytest.raises(signals.FAIL):
         failing_task.run()

示例#4

0

显示文件

 def test_v3_checkpoint_api_fail(self):
     """Running the ``my_checkpoint_fail`` checkpoint must raise ``signals.FAIL``."""
     init_kwargs = {
         "context_root_dir": str(V3_API_PATH),
         "checkpoint_name": "my_checkpoint_fail",
     }
     failing_task = RunGreatExpectationsValidation(**init_kwargs)
     with pytest.raises(signals.FAIL):
         failing_task.run()

示例#5

0

显示文件

 def test_v3_with_checkpoint_config(self, in_memory_checkpoint):
     """Run the task with the ``in_memory_checkpoint`` fixture passed as ``ge_checkpoint``."""
     validation_task = RunGreatExpectationsValidation(
         ge_checkpoint=in_memory_checkpoint,
         context_root_dir=str(V3_API_PATH),
     )
     outcome = validation_task.run()
     # Identity check on the concrete type: a subclass instance would not pass.
     assert type(outcome) is CheckpointResult

示例#6

0

显示文件

文件： test_great_expectations_validation.py 项目： tank0226/prefect

 def test_v3_checkpoint_api_pass(self):
     """Run the ``my_checkpoint_pass`` checkpoint and expect a ``CheckpointResult``."""
     # The context directory is the "v3_api" folder next to this test file.
     v3_root = Path(__file__).parent.resolve() / "v3_api"
     validation_task = RunGreatExpectationsValidation(
         context_root_dir=str(v3_root),
         checkpoint_name="my_checkpoint_pass",
     )
     outcome = validation_task.run()
     assert type(outcome) is CheckpointResult

示例#7

0

显示文件

 def test_v3_with_checkpoint_config(self, in_memory_checkpoint):
     """Run with an in-memory checkpoint and check the result type and its ``repr``."""
     validation_task = RunGreatExpectationsValidation(
         ge_checkpoint=in_memory_checkpoint,
         context_root_dir=str(V3_API_PATH),
     )
     outcome = validation_task.run()
     assert type(outcome) is CheckpointResult

     # Each of these field names must appear in the textual representation.
     rendered = repr(outcome)
     for expected_key in ("run_id", "run_results", "checkpoint_config", "success"):
         assert expected_key in rendered

示例#8

0

显示文件

 def test_v3_checkpoint_api_pass(self):
     """Run ``my_checkpoint_pass`` and check the result type and its ``repr``."""
     init_kwargs = {
         "context_root_dir": str(V3_API_PATH),
         "checkpoint_name": "my_checkpoint_pass",
     }
     outcome = RunGreatExpectationsValidation(**init_kwargs).run()
     assert type(outcome) is CheckpointResult

     # Each of these field names must appear in the textual representation.
     rendered = repr(outcome)
     for expected_key in ("run_id", "run_results", "checkpoint_config", "success"):
         assert expected_key in rendered

示例#9

0

显示文件

 def test_v2_checkpoint_api(self):
     """Run ``my_chk`` and check the result type and its ``repr``."""
     init_kwargs = {
         "context_root_dir": str(V2_API_PATH),
         "checkpoint_name": "my_chk",
     }
     outcome = RunGreatExpectationsValidation(**init_kwargs).run()
     assert type(outcome) is ValidationOperatorResult

     # Each of these field names must appear in the textual representation.
     rendered = repr(outcome)
     expected_keys = (
         "run_id",
         "run_results",
         "validation_operator_config",
         "evaluation_parameters",
         "success",
     )
     for expected_key in expected_keys:
         assert expected_key in rendered

示例#10

0

显示文件

 def test_suite_name_with_batch_kwargs(self):
     """Run with ``batch_kwargs`` plus ``expectation_suite_name`` instead of a checkpoint."""
     # NOTE(review): the CSV path is relative, so it presumably resolves against
     # the directory the tests are launched from - confirm.
     sample_batch_kwargs = {
         "path": "tests/tasks/great_expectations/data/yellow_tripdata_sample_2019-01.csv",
         "datasource": "data__dir",
         "data_asset_name": "yellow_tripdata_sample_2019-01",
     }
     validation_task = RunGreatExpectationsValidation(
         context_root_dir=str(V2_API_PATH),
         batch_kwargs=sample_batch_kwargs,
         expectation_suite_name="taxi.demo",
     )
     outcome = validation_task.run()
     assert type(outcome) is ValidationOperatorResult

示例#11

0

显示文件

 def test_v3_with_runtime_data_frame(
     self, in_memory_runtime_batch_request, in_memory_data_context
 ):
     """Run ``my_checkpoint_pass`` with a validation supplied through ``checkpoint_kwargs``."""
     # One validation entry: the fixture batch request with the passing suite.
     validation_entry = {
         "batch_request": in_memory_runtime_batch_request,
         "expectation_suite_name": "taxi.demo_pass",
     }
     validation_task = RunGreatExpectationsValidation(
         checkpoint_name="my_checkpoint_pass",
         context=in_memory_data_context,
         checkpoint_kwargs={"validations": [validation_entry]},
     )
     outcome = validation_task.run()
     assert type(outcome) is CheckpointResult

示例#12

0

显示文件

 def test_kwargs_get_passed_to_task_init(self):
     """Check that every constructor keyword is exposed as a same-named attribute.

     The two boolean attributes are compared by identity (``is False`` /
     ``is True``) rather than with ``==``, so a value such as ``0`` or ``1``
     would not pass.
     """
     t = RunGreatExpectationsValidation(
         checkpoint_name="checkpoint",
         context=1234,
         assets_to_validate=["assets"],
         batch_kwargs={"kwargs": "here"},
         expectation_suite_name="name",
         context_root_dir="/path/to/somewhere",
         runtime_environment={
             "plugins_directory": "/path/to/plugins/somewhere/else"
         },
         run_name="1234",
         run_info_at_end=False,
         disable_markdown_artifact=True,
         evaluation_parameters=dict(prev_run_row_count=100),
     )
     assert t.checkpoint_name == "checkpoint"
     assert t.context == 1234
     assert t.assets_to_validate == ["assets"]
     assert t.batch_kwargs == {"kwargs": "here"}
     assert t.expectation_suite_name == "name"
     assert t.context_root_dir == "/path/to/somewhere"
     assert t.runtime_environment == {
         "plugins_directory": "/path/to/plugins/somewhere/else"
     }
     assert t.run_name == "1234"
     # Identity comparison: the attribute must be the bool singleton itself.
     assert t.run_info_at_end is False
     assert t.disable_markdown_artifact is True
     assert t.evaluation_parameters == dict(prev_run_row_count=100)

示例#13

0

显示文件

 def test_assets_to_validate(self):
     """Run the task with a batch passed through ``assets_to_validate``."""
     data_context = ge.DataContext(context_root_dir=str(V2_API_PATH))
     sample_batch_kwargs = {
         "path": "tests/tasks/great_expectations/data/yellow_tripdata_sample_2019-01.csv",
         "datasource": "data__dir",
         "data_asset_name": "yellow_tripdata_sample_2019-01",
     }
     # The batch is obtained from the context for the "taxi.demo" suite.
     batch = data_context.get_batch(sample_batch_kwargs, "taxi.demo")
     validation_task = RunGreatExpectationsValidation(
         context=data_context,
         assets_to_validate=[batch],
     )
     outcome = validation_task.run()
     assert type(outcome) is ValidationOperatorResult

示例#14

0

显示文件

 def test_suite_name_with_batch_kwargs(self):
     """Run with ``batch_kwargs`` plus a suite name; check result type and ``repr``."""
     sample_batch_kwargs = {
         "path": "tests/tasks/great_expectations/data/yellow_tripdata_sample_2019-01.csv",
         "datasource": "data__dir",
         "data_asset_name": "yellow_tripdata_sample_2019-01",
     }
     validation_task = RunGreatExpectationsValidation(
         context_root_dir=str(V2_API_PATH),
         batch_kwargs=sample_batch_kwargs,
         expectation_suite_name="taxi.demo",
     )
     outcome = validation_task.run()
     assert type(outcome) is ValidationOperatorResult

     # Each of these field names must appear in the textual representation.
     rendered = repr(outcome)
     expected_keys = (
         "run_id",
         "run_results",
         "validation_operator_config",
         "evaluation_parameters",
         "success",
     )
     for expected_key in expected_keys:
         assert expected_key in rendered

示例#15

0

显示文件

 def test_assets_to_validate(self):
     """Run with a batch in ``assets_to_validate``; check result type and ``repr``."""
     data_context = ge.DataContext(context_root_dir=str(V2_API_PATH))
     sample_batch_kwargs = {
         "path": "tests/tasks/great_expectations/data/yellow_tripdata_sample_2019-01.csv",
         "datasource": "data__dir",
         "data_asset_name": "yellow_tripdata_sample_2019-01",
     }
     # The batch is obtained from the context for the "taxi.demo" suite.
     batch = data_context.get_batch(sample_batch_kwargs, "taxi.demo")
     validation_task = RunGreatExpectationsValidation(
         context=data_context,
         assets_to_validate=[batch],
     )
     outcome = validation_task.run()
     assert type(outcome) is ValidationOperatorResult

     # Each of these field names must appear in the textual representation.
     rendered = repr(outcome)
     expected_keys = (
         "run_id",
         "run_results",
         "validation_operator_config",
         "evaluation_parameters",
         "success",
     )
     for expected_key in expected_keys:
         assert expected_key in rendered

示例#16

0

显示文件

文件： great_expectations_flow.py 项目： zschumacher/prefect

from prefect import Flow, Parameter
from prefect.tasks.great_expectations import RunGreatExpectationsValidation

# The task is built without arguments; the checkpoint name reaches it through
# the flow parameter below.
ge_task = RunGreatExpectationsValidation()

with Flow("great expectations example flow") as flow:
    checkpoint_name = Parameter("checkpoint_name")
    # Mapped call: the parameter is handed to ge_task.map.
    validations = ge_task.map(checkpoint_name)

if __name__ == "__main__":
    # Run the flow with a list of two checkpoint names.
    flow.run(
        checkpoint_name=[
            "warning_npi_checkpoint",
            "guaranteed_failure_npi_checkpoint",
        ],
    )

示例#17

0

显示文件

 def test_inits_with_no_args(self):
     """The task can be constructed without arguments and the instance is truthy."""
     assert RunGreatExpectationsValidation()

示例#18

0

显示文件

    def test_raises_if_params_not_mutually_exclusive(self):
        """Check that ``run`` raises ``ValueError`` matching "Exactly" for bad argument sets.

        The argument combinations exercised are: no arguments, only
        ``expectation_suite_name``, only ``batch_kwargs``, suite name +
        batch kwargs + ``assets_to_validate``, and ``assets_to_validate`` +
        ``checkpoint_name``.

        ``batch_kwargs`` is passed as a dict (matching how it is passed in
        the constructor test) rather than as a set literal.
        """
        task = RunGreatExpectationsValidation(context="test")

        # No validation target at all.
        with pytest.raises(ValueError, match="Exactly"):
            task.run()

        # Suite name without batch kwargs.
        with pytest.raises(ValueError, match="Exactly"):
            task.run(expectation_suite_name="name")

        # Batch kwargs without a suite name.
        with pytest.raises(ValueError, match="Exactly"):
            task.run(batch_kwargs={"kwargs": "here"})

        # Suite name + batch kwargs combined with assets_to_validate.
        with pytest.raises(ValueError, match="Exactly"):
            task.run(
                expectation_suite_name="name",
                batch_kwargs={"kwargs": "here"},
                assets_to_validate=["val"],
            )

        # assets_to_validate combined with a checkpoint name.
        with pytest.raises(ValueError, match="Exactly"):
            task.run(assets_to_validate=["val"], checkpoint_name="name")