/usr/share/check_mk/checks/heartbeat_crm is in check-mk-server 1.1.12-1ubuntu1.
This file is owned by root:root, with mode 0o755.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 | #!/usr/bin/python
# -*- encoding: utf-8; py-indent-offset: 4 -*-
# +------------------------------------------------------------------+
# | ____ _ _ __ __ _ __ |
# | / ___| |__ ___ ___| | __ | \/ | |/ / |
# | | | | '_ \ / _ \/ __| |/ / | |\/| | ' / |
# | | |___| | | | __/ (__| < | | | | . \ |
# | \____|_| |_|\___|\___|_|\_\___|_| |_|_|\_\ |
# | |
# | Copyright Mathias Kettner 2010 mk@mathias-kettner.de |
# +------------------------------------------------------------------+
#
# This file is part of Check_MK.
# The official homepage is at http://mathias-kettner.de/check_mk.
#
# check_mk is free software; you can redistribute it and/or modify it
# under the terms of the GNU General Public License as published by
# the Free Software Foundation in version 2. check_mk is distributed
# in the hope that it will be useful, but WITHOUT ANY WARRANTY; with-
# out even the implied warranty of MERCHANTABILITY or FITNESS FOR A
# PARTICULAR PURPOSE. See the GNU General Public License for more de-
# ails. You should have received a copy of the GNU General Public
# License along with GNU Make; see the file COPYING. If not, write
# to the Free Software Foundation, Inc., 51 Franklin St, Fifth Floor,
# Boston, MA 02110-1301 USA.
# Author: Lars Michelsen <lm@mathias-kettner.de>
# Example outputs from agent:
# <<<heartbeat_crm>>>
# ============
# Last updated: Thu Jul 1 07:48:19 2010
# Current DC: mwp (118cc1e7-bbf3-4550-b820-cac372885be1)
# 2 Nodes configured.
# 2 Resources configured.
# ============
# Node: smwp (2395453b-d647-48ff-a908-a7cd76062265): online
# Node: mwp (118cc1e7-bbf3-4550-b820-cac372885be1): online
# Full list of resources:
# Resource Group: group_slapmaster
# resource_virtip1 (ocf::heartbeat:IPaddr): Started mwp
# resource_virtip2 (ocf::heartbeat:IPaddr): Started mwp
# resource_pingnodes (ocf::heartbeat:pingd): Started mwp
# resource_slapmaster (ocf::heartbeat:OpenLDAP): Started mwp
# resource_slapslave (ocf::heartbeat:OpenLDAP): Started smwp
import time, datetime
# Nails down the DC to the node which is the DC during inventory. The check
# will report CRITICAL when another node becomes the DC during later checks.
# If set to "False" the check will be passed.
heartbeat_crm_naildown = True
# Max age of "last updated"
heartbeat_crm_default_max_age = 60
# Naildown the resources to the nodes which care about the resources during
# the inventory run
heartbeat_crm_resources_naildown = True
def heartbeat_crm_parse_general(info, dc = '', numNodes = -1, numResources = -1):
for line in info:
if ' '.join(line[0:2]) == 'Last updated:':
lastUpdated = ' '.join(line[2:])
elif dc == '' and ' '.join(line[0:2]) == 'Current DC:' and heartbeat_crm_naildown:
dc = line[2]
elif numNodes == -1 and ' '.join(line[1:3]) == 'Nodes configured.':
numNodes = int(line[0])
elif numResources == -1 and ' '.join(line[1:3]) == 'Resources configured.':
numResources = int(line[0])
return (lastUpdated, dc, numNodes, numResources)
def inventory_heartbeat_crm(info):
# Use these lines to gather the inventory and perform this check:
# ============
# Last updated: Thu Jul 1 07:48:19 2010
# Current DC: mwp (118cc1e7-bbf3-4550-b820-cac372885be1)
# 2 Nodes configured.
# 2 Resources configured.
# ============
#
# - Naildown the DC or not.
# - Check the number of nodes/resources
# - Check the age of "last updated"
if len(info) > 0:
lastUpdated, dc, numNodes, numResources = heartbeat_crm_parse_general(info)
if not heartbeat_crm_naildown:
dc = None # Ignore DC on check
return [(None, '(heartbeat_crm_default_max_age, %r, %d, %d)' % (dc, numNodes, numResources))]
def check_heartbeat_crm(item, params, info):
if len(info) > 0:
lastUpdated, dc, numNodes, numResources = heartbeat_crm_parse_general(info)
param_max_age, param_dc, param_nodes, param_ressources = params
# Check the freshness of the crm_mon output and terminate with CRITICAL
# when too old information are found
dt = int(datetime.datetime(*time.strptime(lastUpdated, '%a %b %d %H:%M:%S %Y')[0:5]).strftime("%s"))
now = time.time()
delta = now - dt
if delta > param_max_age:
return (2, 'CRIT - Status output too old: %d secs' % delta)
output = ''
status = 0
# Check for correct DC when enabled
if param_dc:
if dc == param_dc:
output += 'DC: %s, ' % dc
else:
output += 'DC: %s (Expected %s), ' % (dc, param_dc)
status = 2
# Check for number of nodes when enabled
if param_nodes != -1:
if numNodes == param_nodes:
output += 'Nodes: %d, ' % numNodes
else:
output += 'Nodes: %d (Expected %d), ' % (numNodes, param_nodes)
status = 2
# Check for number of resources when enabled
if param_ressources != -1:
if numResources == param_ressources:
output += 'Resources: %d, ' % numResources
else:
output += 'Resources: %d (Expected %d), ' % (numResources, param_ressources)
status = 2
return (status, '%s - %s' % (nagios_state_names[status], output.rstrip(', ')))
return (3, "UNKNOWN - Empty output from agent")
def heartbeat_crm_parse_resources(info):
blockStart = False
resources = {}
resource = ''
for line in info:
if not blockStart and ' '.join(line) == 'Full list of resources:':
blockStart = True
elif blockStart:
if ' '.join(line[0:2]) == 'Resource Group:':
# Resource group
resources[line[-1]] = []
resource = line[-1]
elif line[0] == '_':
# Resource group member
resources[resource].append(line[1:])
else:
# Single resource
resources[line[0]] = [ line ]
return resources
def inventory_heartbeat_crm_resources(info):
# Full list of resources:
# Resource Group: group_slapmaster
# resource_virtip1 (ocf::heartbeat:IPaddr): Started mwp
# resource_virtip2 (ocf::heartbeat:IPaddr): Started mwp
# resource_pingnodes (ocf::heartbeat:pingd): Started mwp
# resource_slapmaster (ocf::heartbeat:OpenLDAP): Started mwp
# resource_slapslave (ocf::heartbeat:OpenLDAP): Started smwp
inventory = []
if len(info) > 0:
for name, resources in heartbeat_crm_parse_resources(info).iteritems():
# In naildown mode only resources which are started somewhere can be
# inventorized
if heartbeat_crm_resources_naildown and resources[0][2] != 'Stopped':
inventory.append((name, '"%s"' % resources[0][3]))
else:
inventory.append((name, None))
return inventory
def check_heartbeat_crm_resources(item, target_node, info):
output = ''
status = 0
for resource in [ resources for name, resources in heartbeat_crm_parse_resources(info).iteritems() if name == item ][0]:
output += ' '.join(resource)
if len(resource) == 3 or resource[2] != 'Started':
status = 2
output += ' (CRITICAL: Resource is in state "%s")' % resource[2]
elif target_node and target_node != resource[3]:
status = 2
output += ' (CRITICAL: Expected node: %s)' % target_node
output += ', '
return (status, '%s - %s' % (nagios_state_names[status], output.rstrip(', ')))
check_info['heartbeat_crm'] = (check_heartbeat_crm, "Heartbeat CRM General", 0, inventory_heartbeat_crm)
check_info['heartbeat_crm.resources'] = (check_heartbeat_crm_resources, "Heartbeat CRM %s", 0, inventory_heartbeat_crm_resources)
check_config_variables.append("heartbeat_crm_naildown")
check_config_variables.append("heartbeat_crm_resources_naildown")
|