def test_basic_drift_detection():
    """
    Tests that drift detection works.
    """
    data = FileSystem.load("tests/data/test_cli_detectors/detector/1.json")
    start_state = StateSchema().load(data)
    data = FileSystem.load("tests/data/test_cli_detectors/detector/2.json")
    end_state = StateSchema().load(data)
    new_results, missing_results = perform_drift_detection(
        start_state, end_state)
    new_results = [
        drift_info_detector_pair[0] for drift_info_detector_pair in new_results
    ]
    missing_results = [
        drift_info_detector_pair[0]
        for drift_info_detector_pair in missing_results
    ]
    assert {
        'd.test': '36',
        'd.test2': '37',
        'd.test3': ['38', '39', '40']
    } in new_results
    assert {
        'd.test': '7',
        'd.test2': '14',
        'd.test3': ['21', '28', '35']
    } in missing_results
示例#2
0
def test_get_state_detectors(neo4j_session):
    data = [
        ["1", "8", ["15", "22", "29"]],
        ["2", "9", ["16", "23", "30"]],
        ["3", "10", ["17", "24", "31"]],
        ["4", "11", ["18", "25", "32"]],
        ["5", "12", ["19", "26", "33"]],
        ["6", "13", ["20", "27", "34"]],
        ["7", "14", ["21", "28", "35"]],
        ["36", "37", ["38", "39", "40"]],
    ]
    ingest_nodes = """
        MERGE (person:Person{test: {test}})
        SET person.test2 = {test2},
        person.test3 = {test3}
        """
    for node in data:
        test = node[0]
        test2 = node[1]
        test3 = node[2]
        neo4j_session.run(
            ingest_nodes,
            test=test,
            test2=test2,
            test3=test3,
        )

    query_directory = "tests/data/test_update_detectors/test_detector"
    state_serializer = StateSchema()
    shortcut_serializer = ShortcutSchema()
    storage = FileSystem

    file_1 = str(datetime.datetime(2019, 1, 1, 0, 0, 2)) + ".json"
    file_2 = str(datetime.datetime(2019, 1, 1, 0, 0, 1)) + ".json"

    get_query_state(neo4j_session, query_directory, state_serializer, storage,
                    file_1)
    add_shortcut(FileSystem(), ShortcutSchema(), query_directory,
                 "most-recent", file_1)

    detector_1_data = FileSystem.load(os.path.join(query_directory, file_1))
    detector_1 = state_serializer.load(detector_1_data)

    detector_2_data = FileSystem.load(os.path.join(query_directory, file_2))
    detector_2 = state_serializer.load(detector_2_data)

    assert detector_1.name == detector_2.name
    assert detector_1.validation_query == detector_2.validation_query
    assert detector_1.properties == detector_2.properties
    assert detector_1.results == detector_2.results

    shortcut_data = FileSystem.load(
        os.path.join(query_directory, "shortcut.json"))
    shortcut = shortcut_serializer.load(shortcut_data)
    assert shortcut.shortcuts['most-recent'] == file_1
    shortcut_data = shortcut_serializer.dump(shortcut)
    FileSystem.write(shortcut_data,
                     os.path.join(query_directory, "shortcut.json"))
示例#3
0
def test_basic_drift_detection():
    """
    Tests that drift detection works.
    """
    data = FileSystem.load("tests/data/test_cli_detectors/detector/1.json")
    start_state = StateSchema().load(data)
    data = FileSystem.load("tests/data/test_cli_detectors/detector/2.json")
    end_state = StateSchema().load(data)
    new_results, missing_results = perform_drift_detection(start_state, end_state)
    assert ['36', '37', ['38', '39', '40']] in new_results
    assert ['7', '14', ['21', '28', '35']] in missing_results
示例#4
0
def test_state_differences():
    """
    Test that state_differences picks up new drift
    :return:
    """

    filepath = "tests/data/detectors/test_expectations.json"
    data = FileSystem.load(filepath)
    state_1 = StateSchema().load(data)
    state_2 = StateSchema().load(data)
    state_2.results.append(["7"])
    drift_info_state_pairs = compare_states(state_1, state_2)
    assert ({'d.test': "7"}, state_2) in drift_info_state_pairs
示例#5
0
def test_compare_states():
    """
    Test that differences between two states is recorded
    :return:
    """

    filepath = "tests/data/detectors/test_expectations.json"
    data = FileSystem.load(filepath)
    state_1 = StateSchema().load(data)
    state_2 = StateSchema().load(data)
    state_1.results.append(["7"])
    state_2.results.append(["8"])
    new, missing = perform_drift_detection(state_1, state_2)
    assert ({'d.test': "7"}, state_1) in missing
    assert ({'d.test': "8"}, state_2) in new
示例#6
0
def test_faulty_queries(neo4j_session):
    data = [["1", "8", ["15", "22", "29"]], ["2", "9", ["16", "23", "30"]],
            ["3", "10", ["17", "24", "31"]], ["4", "11", ["18", "25", "32"]],
            ["5", "12", ["19", "26", "33"]], ["6", "13", ["20", "27", "34"]],
            ["7", "14", ["21", "28", "35"]], ["36", "37", ["38", "39", "40"]]]
    ingest_nodes = """
            MERGE (person:Person{test: {test}})
            SET person.test2 = {test2},
            person.test3 = {test3}
            """
    for node in data:
        test = node[0]
        test2 = node[1]
        test3 = node[2]
        neo4j_session.run(ingest_nodes, test=test, test2=test2, test3=test3)

    query_directory = "tests/data/test_update_detectors/invalid_query"
    state_serializer = StateSchema()
    storage = FileSystem

    file_1 = str(datetime.datetime(2019, 1, 1, 0, 0, 2)) + ".json"
    with pytest.raises(neobolt.exceptions.CypherSyntaxError):
        get_query_state(neo4j_session, query_directory, state_serializer,
                        storage, file_1)

    query_directory = "tests/data/test_update_detectors/invalid_template"

    with pytest.raises(ValidationError):
        get_query_state(neo4j_session, query_directory, state_serializer,
                        storage, file_1)
def run_drift_detection(config):
    try:
        if not valid_directory(config.query_directory):
            logger.error("Invalid Drift Detection Directory")
            return
        state_serializer = StateSchema()
        shortcut_serializer = ShortcutSchema()
        shortcut_data = FileSystem.load(os.path.join(config.query_directory, "shortcut.json"))
        shortcut = shortcut_serializer.load(shortcut_data)
        start_state_data = FileSystem.load(
            os.path.join(
                config.query_directory, shortcut.shortcuts.get(
                    config.start_state,
                    config.start_state,
                ),
            ),
        )
        start_state = state_serializer.load(start_state_data)
        end_state_data = FileSystem.load(
            os.path.join(
                config.query_directory, shortcut.shortcuts.get(
                    config.end_state,
                    config.end_state,
                ),
            ),
        )
        end_state = state_serializer.load(end_state_data)
        new_results, missing_results = perform_drift_detection(start_state, end_state)
        report_drift_new(new_results)
        report_drift_missing(missing_results)
    except ValidationError as err:
        msg = "Unable to create DriftStates from files {},{} for \n{} in directory {}.".format(
            config.start_state,
            config.end_state,
            err.messages,
            config.query_directory,
        )
        logger.exception(msg)
    except ValueError as err:
        msg = "Unable to create DriftStates from files {},{} for \n{} in directory {}.".format(
            config.start_state,
            config.end_state,
            err,
            config.query_directory,
        )
        logger.exception(msg)
示例#8
0
def test_drift_from_multiple_properties():
    """
    Test fields with multiple properties handles correctly.
    :return:
    """
    mock_session = MagicMock()
    mock_boltstatementresult = MagicMock()
    key_1 = "d.test"
    key_2 = "d.test2"
    key_3 = "d.test3"
    results = [{
        key_1: "1",
        key_2: "8",
        key_3: ["15", "22", "29"]
    }, {
        key_1: "2",
        key_2: "9",
        key_3: ["16", "23", "30"]
    }, {
        key_1: "3",
        key_2: "10",
        key_3: ["17", "24", "31"]
    }, {
        key_1: "4",
        key_2: "11",
        key_3: ["18", "25", "32"]
    }, {
        key_1: "5",
        key_2: "12",
        key_3: ["19", "26", "33"]
    }, {
        key_1: "6",
        key_2: "13",
        key_3: ["20", "27", "34"]
    }, {
        key_1: "7",
        key_2: "14",
        key_3: ["21", "28", "35"]
    }]
    mock_boltstatementresult.__getitem__.side_effect = results.__getitem__
    mock_boltstatementresult.__iter__.side_effect = results.__iter__
    mock_session.run.return_value = mock_boltstatementresult
    data = FileSystem.load(
        "tests/data/detectors/test_multiple_properties.json")
    state_old = StateSchema().load(data)
    state_new = State(state_old.name, state_old.validation_query,
                      state_old.properties, [])
    get_state(mock_session, state_new)
    state_new.properties = state_old.properties
    drifts = compare_states(state_old, state_new)
    mock_session.run.assert_called_with(state_new.validation_query)
    print(drifts)
    assert {key_1: "7", key_2: "14", key_3: ["21", "28", "35"]} in drifts[0]
    assert {
        key_1: "3",
        key_2: "10",
        key_3: ["17", "24", "31"]
    } not in drifts[0]
def test_drift_detection_errors():
    data = FileSystem.load("tests/data/test_cli_detectors/detector/1.json")
    start_state = StateSchema().load(data)
    data = FileSystem.load("tests/data/test_cli_detectors/detector/2.json")
    end_state = StateSchema().load(data)

    start_state.name = "Wrong Name"
    with pytest.raises(ValueError):
        perform_drift_detection(start_state, end_state)

    start_state = StateSchema().load(data)
    start_state.properties = ["Incorrect", "Properties"]
    with pytest.raises(ValueError):
        perform_drift_detection(start_state, end_state)

    start_state = StateSchema().load(data)
    start_state.validation_query = "Invalid Validation Query"
    with pytest.raises(ValueError):
        perform_drift_detection(start_state, end_state)
示例#10
0
def test_state_multiple_expectations():
    """
    Test that multiple fields runs properly.
    :return:
    """
    key_1 = "d.test"
    key_2 = "d.test2"
    mock_session = MagicMock()
    mock_boltstatementresult = MagicMock()
    results = [
        {
            key_1: "1",
            key_2: "8"
        },
        {
            key_1: "2",
            key_2: "9"
        },
        {
            key_1: "3",
            key_2: "10"
        },
        {
            key_1: "4",
            key_2: "11"
        },
        {
            key_1: "5",
            key_2: "12"
        },
        {
            key_1: "6",
            key_2: "13"
        },
        {
            key_1: "7",
            key_2: "14"
        },
    ]

    mock_boltstatementresult.__getitem__.side_effect = results.__getitem__
    mock_boltstatementresult.__iter__.side_effect = results.__iter__
    mock_session.run.return_value = mock_boltstatementresult
    data = FileSystem.load(
        "tests/data/detectors/test_multiple_expectations.json")
    state_old = StateSchema().load(data)
    state_new = State(state_old.name, state_old.validation_query,
                      state_old.properties, [])
    get_state(mock_session, state_new)
    state_new.properties = state_old.properties
    drifts = compare_states(state_old, state_new)
    mock_session.run.assert_called_with(state_new.validation_query)
    assert {key_1: "7", key_2: "14"} in drifts[0]
示例#11
0
def test_json_loader():
    """
    Test loading schema passes
    :return:
    """

    filepath = "tests/data/detectors/test_expectations.json"
    data = FileSystem.load(filepath)
    state = StateSchema().load(data)
    assert state.name == "Test-Expectations"
    assert state.validation_query == "MATCH (d) RETURN d.test"
    assert state.results == [['1'], ['2'], ['3'], ['4'], ['5'], ['6']]
示例#12
0
def test_state_picks_up_drift():
    """
    Test that a state that detects drift.
    :return:
    """
    key = "d.test"
    mock_session = MagicMock()
    mock_boltstatementresult = MagicMock()
    results = [
        {
            key: "1"
        },
        {
            key: "2"
        },
        {
            key: "3"
        },
        {
            key: "4"
        },
        {
            key: "5"
        },
        {
            key: "6"
        },
        {
            key: "7"
        },
    ]

    mock_boltstatementresult.__getitem__.side_effect = results.__getitem__
    mock_boltstatementresult.__iter__.side_effect = results.__iter__
    mock_session.run.return_value = mock_boltstatementresult
    data = FileSystem.load("tests/data/detectors/test_expectations.json")
    state_old = StateSchema().load(data)
    state_new = State(state_old.name, state_old.validation_query,
                      state_old.properties, [])
    get_state(mock_session, state_new)
    state_new.properties = state_old.properties
    drifts = compare_states(state_old, state_new)
    mock_session.run.assert_called_with(state_new.validation_query)
    assert drifts
    assert drifts[0][0] == {key: "7"}
示例#13
0
def run_get_states(config):
    """
    Handles neo4j errors and then updates detectors.

    :type config: Config Object
    :param config: Config Object from CLI
    :return:
    """
    if not valid_directory(config.drift_detection_directory):
        logger.error("Invalid Drift Detection Directory")
        return
    neo4j_auth = None
    if config.neo4j_user or config.neo4j_password:
        neo4j_auth = (config.neo4j_user, config.neo4j_password)
    try:
        neo4j_driver = GraphDatabase.driver(
            config.neo4j_uri,
            auth=neo4j_auth,
        )
    except neobolt.exceptions.ServiceUnavailable as e:
        logger.debug("Error occurred during Neo4j connect.", exc_info=True)
        logger.error(
            ("Unable to connect to Neo4j using the provided URI '%s', an error occurred: '%s'. Make sure the "
             "Neo4j server is running and accessible from your network."),
            config.neo4j_uri,
            e,
        )
        return
    except neobolt.exceptions.AuthError as e:
        logger.debug("Error occurred during Neo4j auth.", exc_info=True)
        if not neo4j_auth:
            logger.error(
                ("Unable to auth to Neo4j, an error occurred: '%s'. driftdetect attempted to connect to Neo4j "
                 "without any auth. Check your Neo4j server settings to see if auth is required and, if it is, "
                 "provide driftdetect with a valid username and password."),
                e,
            )
        else:
            logger.error(
                ("Unable to auth to Neo4j, an error occurred: '%s'. driftdetect attempted to connect to Neo4j "
                 "with a username and password. Check your Neo4j server settings to see if the username and "
                 "password provided to driftdetect are valid credentials."),
                e,
            )
        return

    with neo4j_driver.session() as session:
        filename = '.'.join([str(i) for i in time.gmtime()] + ["json"])
        state_serializer = StateSchema()
        shortcut_serializer = ShortcutSchema()
        for query_directory in FileSystem.walk(
                config.drift_detection_directory):
            try:
                get_query_state(session, query_directory, state_serializer,
                                FileSystem, filename)
                add_shortcut(FileSystem, shortcut_serializer, query_directory,
                             'most-recent', filename)
            except ValidationError as err:
                msg = "Unable to create State for directory {}, with data \n{}".format(
                    query_directory,
                    err.messages,
                )
                logger.exception(msg)
            except KeyError as err:
                msg = f"Could not find {err} field in state template for directory {query_directory}."
                logger.exception(msg)
            except FileNotFoundError as err:
                logger.exception(err)
            except neobolt.exceptions.CypherSyntaxError as err:
                logger.exception(err)