Example #1
0
    def __init__(self, Environment, randseed=None, name=None):
        """Initialise through crm_lha, defaulting the name to "crm-ais".

        Parameters:
            Environment: forwarded unchanged to crm_lha.__init__.
            randseed: forwarded unchanged to crm_lha.__init__ (default None).
            name: forwarded to crm_lha.__init__; any falsy value (None, "")
                is replaced by "crm-ais" first.
        """
        # A falsy name selects the default.
        name = name or "crm-ais"
        crm_lha.__init__(self, Environment, randseed=randseed, name=name)

        self.fullcomplist = {}
        # self.name is read here, so it is presumably set by crm_lha.__init__
        # -- TODO confirm.
        self.templates = PatternSelector(self.name)
Example #2
0
    def __init__(self, Environment, randseed=None):
        """Run the crm_lha initialiser, then register the "crm-ais" settings.

        Parameters:
            Environment: forwarded unchanged to crm_lha.__init__.
            randseed: forwarded unchanged to crm_lha.__init__ (default None).

        After the base initialiser returns, a single self.update() call
        stores the name, three crm_node command lines, two log patterns and
        the tuple of "bad news" regexes listed below.
        """
        crm_lha.__init__(self, Environment, randseed=randseed)

        self.update(
            {
                "Name": "crm-ais",
                "EpocheCmd": "crm_node -e --openais",
                "QuorumCmd": "crm_node -q --openais",
                # NOTE(review): the key is spelled "ParitionCmd"; presumably
                # consumers look it up under this spelling -- verify before
                # renaming.
                "ParitionCmd": "crm_node -p --openais",
                # Raw string: "\[" is a regex escape for a literal "[", not a
                # Python string escape.  Without the r-prefix newer Python
                # versions warn about an invalid escape sequence.
                "Pat:They_stopped": r"%s crmd.*Node %s\[.*state is now lost",
                "Pat:ChildExit": "Child process .* exited",
                # Bad news Regexes.  Should never occur.
                "BadRegexes": (
                    r" trace:",
                    r"error:",
                    r"crit:",
                    r"ERROR:",
                    r"CRIT:",
                    r"Shutting down...NOW",
                    r"Timer I_TERMINATE just popped",
                    r"input=I_ERROR",
                    r"input=I_FAIL",
                    r"input=I_INTEGRATED cause=C_TIMER_POPPED",
                    r"input=I_FINALIZED cause=C_TIMER_POPPED",
                    # NOTE(review): repeats the "input=I_ERROR" entry above;
                    # redundant but kept so the tuple contents are unchanged.
                    r"input=I_ERROR",
                    r", exiting\.",
                    r"(WARN|warn).*Ignoring HA message.*vote.*not in our membership list",
                    r"pengine.*Attempting recovery of resource",
                    r"is taking more than 2x its timeout",
                    r"Confirm not received from",
                    r"Welcome reply not received from",
                    r"Attempting to schedule .* after a stop",
                    r"Resource .* was active at shutdown",
                    r"duplicate entries for call_id",
                    r"Search terminated:",
                    r":global_timer_callback",
                    r"Faking parameter digest creation",
                    r"Parameters to .* action changed:",
                    r"Parameters to .* changed",
                    r"Child process .* terminated with signal",
                    r"Executing .* fencing operation",
                    r"LogActions: Recover",
                    r"rsyslogd.* imuxsock lost .* messages from pid .* due to rate-limiting",
                    r"Peer is not part of our cluster",
                    r"We appear to be in an election loop",
                    r"Unknown node -> we will not deliver message",
                    r"crm_write_blackbox",
                    r"pacemakerd.*Could not connect to Cluster Configuration Database API",
                    # r"crm_ipc_send:.*Request .* failed",
                    # r"crm_ipc_send:.*Sending to .* is disabled until pending reply is recieved",
                    # Not inherently bad, but worth tracking
                    # r"No need to invoke the TE",
                    # r"ping.*: DEBUG: Updated connected = 0",
                    # r"Digest mis-match:",
                ),
            }
        )
Example #3
0
    def __init__(self, Environment, randseed=None):
        """Run the crm_lha initialiser, then register the "crm-ais" settings.

        Parameters:
            Environment: forwarded unchanged to crm_lha.__init__.
            randseed: forwarded unchanged to crm_lha.__init__ (default None).

        The settings are stored with one self.update() call after the base
        initialiser has returned.
        """
        crm_lha.__init__(self, Environment, randseed=randseed)

        # Bad news Regexes.  Should never occur.
        bad_news = (
            r"ERROR:",
            r"CRIT:",
            r"TRACE:",
            r"Shutting down\.",
            r"Forcing shutdown\.",
            r"Timer I_TERMINATE just popped",
            r"input=I_ERROR",
            r"input=I_FAIL",
            r"input=I_INTEGRATED cause=C_TIMER_POPPED",
            r"input=I_FINALIZED cause=C_TIMER_POPPED",
            r"input=I_ERROR",
            r", exiting\.",
            r"WARN.*Ignoring HA message.*vote.*not in our membership list",
            r"pengine.*Attempting recovery of resource",
            r"is taking more than 2x its timeout",
            r"Confirm not received from",
            r"Welcome reply not received from",
            r"Attempting to schedule .* after a stop",
            r"Resource .* was active at shutdown",
            r"duplicate entries for call_id",
            r"Search terminated:",
            r":global_timer_callback",
            r"Faking parameter digest creation",
            r"Parameters to .* action changed:",
            r"Parameters to .* changed",
            r"Child process .* terminated with signal 11",
            r"Executing .* fencing operation",
            r"LogActions: Recover",
            # Not inherently bad, but worth tracking
            # r"No need to invoke the TE",
            # r"ping.*: DEBUG: Updated connected = 0",
            # r"Digest mis-match:",
        )

        self.update({
            "Name": "crm-ais",
            # crm_node command lines.
            "EpocheCmd": "crm_node -e --openais",
            "QuorumCmd": "crm_node -q --openais",
            "ParitionCmd": "crm_node -p --openais",
            # Log patterns.
            "Pat:They_stopped": "%s crmd:.*Node %s: .* state=lost .new",
            "Pat:ChildExit": "Child process .* exited",
            "BadRegexes": bad_news,
        })
Example #4
0
    def __init__(self, Environment, randseed=None):
        """Run the crm_lha initialiser, then register the "crm-ais" settings.

        Parameters:
            Environment: forwarded unchanged to crm_lha.__init__.
            randseed: forwarded unchanged to crm_lha.__init__ (default None).

        The settings dict is assembled after the base initialiser has
        returned and is handed to self.update() in a single call.
        """
        crm_lha.__init__(self, Environment, randseed=randseed)

        settings = {
            "Name": "crm-ais",
            "EpocheCmd": "crm_node -e --openais",
            "QuorumCmd": "crm_node -q --openais",
            "ParitionCmd": "crm_node -p --openais",
            "Pat:They_stopped": "%s crmd.*Node %s: .* state=lost .new",
            "Pat:ChildExit": "Child process .* exited",
            # Bad news Regexes.  Should never occur.
            "BadRegexes": (
                r" trace:",
                r"error:",
                r"crit:",
                r"ERROR:",
                r"CRIT:",
                r"Shutting down...NOW",
                r"Timer I_TERMINATE just popped",
                r"input=I_ERROR",
                r"input=I_FAIL",
                r"input=I_INTEGRATED cause=C_TIMER_POPPED",
                r"input=I_FINALIZED cause=C_TIMER_POPPED",
                r"input=I_ERROR",
                r", exiting\.",
                r"(WARN|warn).*Ignoring HA message.*vote.*not in our membership list",
                r"pengine.*Attempting recovery of resource",
                r"is taking more than 2x its timeout",
                r"Confirm not received from",
                r"Welcome reply not received from",
                r"Attempting to schedule .* after a stop",
                r"Resource .* was active at shutdown",
                r"duplicate entries for call_id",
                r"Search terminated:",
                r":global_timer_callback",
                r"Faking parameter digest creation",
                r"Parameters to .* action changed:",
                r"Parameters to .* changed",
                r"Child process .* terminated with signal 11",
                r"Executing .* fencing operation",
                r"LogActions: Recover",
                # Not inherently bad, but worth tracking
                # r"No need to invoke the TE",
                # r"ping.*: DEBUG: Updated connected = 0",
                # r"Digest mis-match:",
            ),
        }
        self.update(settings)
Example #5
0
    def __init__(self, Environment, randseed=None):
        """Run the crm_lha initialiser, then register the "crm-ais" settings.

        Parameters:
            Environment: forwarded unchanged to crm_lha.__init__.
            randseed: forwarded unchanged to crm_lha.__init__ (default None).

        After the base initialiser returns, a single self.update() call
        stores the name, three crm_node command lines, two log patterns and
        the tuple of "bad news" regexes listed below.
        """
        crm_lha.__init__(self, Environment, randseed=randseed)

        self.update({
            "Name": "crm-ais",
            "EpocheCmd": "crm_node -e --openais",
            "QuorumCmd": "crm_node -q --openais",
            # NOTE(review): the key is spelled "ParitionCmd"; presumably
            # consumers look it up under this spelling -- verify before
            # renaming.
            "ParitionCmd": "crm_node -p --openais",
            # Raw string: "\[" is a regex escape for a literal "[", not a
            # Python string escape.  Without the r-prefix newer Python
            # versions warn about an invalid escape sequence.
            "Pat:They_stopped": r"%s crmd.*Node %s\[.*state is now lost",
            "Pat:ChildExit": "Child process .* exited",

            # Bad news Regexes.  Should never occur.
            "BadRegexes": (
                r" trace:",
                r"error:",
                r"crit:",
                r"ERROR:",
                r"CRIT:",
                r"Shutting down...NOW",
                r"Timer I_TERMINATE just popped",
                r"input=I_ERROR",
                r"input=I_FAIL",
                r"input=I_INTEGRATED cause=C_TIMER_POPPED",
                r"input=I_FINALIZED cause=C_TIMER_POPPED",
                # NOTE(review): repeats the "input=I_ERROR" entry above;
                # redundant but kept so the tuple contents are unchanged.
                r"input=I_ERROR",
                r", exiting\.",
                r"(WARN|warn).*Ignoring HA message.*vote.*not in our membership list",
                r"pengine.*Attempting recovery of resource",
                r"is taking more than 2x its timeout",
                r"Confirm not received from",
                r"Welcome reply not received from",
                r"Attempting to schedule .* after a stop",
                r"Resource .* was active at shutdown",
                r"duplicate entries for call_id",
                r"Search terminated:",
                r":global_timer_callback",
                r"Faking parameter digest creation",
                r"Parameters to .* action changed:",
                r"Parameters to .* changed",
                r"Child process .* terminated with signal",
                r"Executing .* fencing operation",
                r"LogActions: Recover",
                r"rsyslogd.* imuxsock lost .* messages from pid .* due to rate-limiting",
                r"Peer is not part of our cluster",
                r"We appear to be in an election loop",
                r"Unknown node -> we will not deliver message",
                r"crm_write_blackbox",
                r"pacemakerd.*Could not connect to Cluster Configuration Database API",

                #r"crm_ipc_send:.*Request .* failed",
                #r"crm_ipc_send:.*Sending to .* is disabled until pending reply is recieved",

                # Not inherently bad, but worth tracking
                #r"No need to invoke the TE",
                #r"ping.*: DEBUG: Updated connected = 0",
                #r"Digest mis-match:",
                r"te_graph_trigger: Transition failed: terminated",
                r"fence_pcmk.* Call to fence",
                # NOTE(review): this pattern already matches everything the
                # more specific "fence_pcmk.* Call to fence" entry matches.
                r"fence_pcmk",
                r"cman killed by node",
            ),
        })
Example #6
0
    def __init__(self, Environment, randseed=None, name=None):
        """Initialise through crm_lha, defaulting the name to "crm-ais".

        Parameters:
            Environment: forwarded unchanged to crm_lha.__init__.
            randseed: forwarded unchanged to crm_lha.__init__ (default None).
            name: forwarded to crm_lha.__init__ when truthy; otherwise
                "crm-ais" is forwarded instead.
        """
        cluster_name = name if name else "crm-ais"
        crm_lha.__init__(
            self, Environment, randseed=randseed, name=cluster_name
        )

        self.fullcomplist = {}
        # self.name is read here, so it is presumably set by crm_lha.__init__
        # -- TODO confirm.
        self.templates = PatternSelector(self.name)