/usr/share/check_mk/checks/smart is in check-mk-server 1.2.2p3-1.
This file is owned by root:root, with mode 0o755.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 | #!/usr/bin/python
# -*- encoding: utf-8; py-indent-offset: 4 -*-
# +------------------------------------------------------------------+
# | ____ _ _ __ __ _ __ |
# | / ___| |__ ___ ___| | __ | \/ | |/ / |
# | | | | '_ \ / _ \/ __| |/ / | |\/| | ' / |
# | | |___| | | | __/ (__| < | | | | . \ |
# | \____|_| |_|\___|\___|_|\_\___|_| |_|_|\_\ |
# | |
# | Copyright Mathias Kettner 2013 mk@mathias-kettner.de |
# +------------------------------------------------------------------+
#
# This file is part of Check_MK.
# The official homepage is at http://mathias-kettner.de/check_mk.
#
# check_mk is free software; you can redistribute it and/or modify it
# under the terms of the GNU General Public License as published by
# the Free Software Foundation in version 2. check_mk is distributed
# in the hope that it will be useful, but WITHOUT ANY WARRANTY; with-
# out even the implied warranty of MERCHANTABILITY or FITNESS FOR A
# PARTICULAR PURPOSE. See the GNU General Public License for more de-
# ails. You should have received a copy of the GNU General Public
# License along with GNU Make; see the file COPYING. If not, write
# to the Free Software Foundation, Inc., 51 Franklin St, Fifth Floor,
# Boston, MA 02110-1301 USA.
# Author: Lars Michelsen <lm@mathias-kettner.de>
# EXAMPLE DATA FROM: WDC SSC-D0128SC-2100
#<<<smart>>>
#/dev/sda ATA WDC_SSC-D0128SC- 1 Raw_Read_Error_Rate 0x000b 100 100 050 Pre-fail Always - 16777215
#/dev/sda ATA WDC_SSC-D0128SC- 3 Spin_Up_Time 0x0007 100 100 050 Pre-fail Always - 0
#/dev/sda ATA WDC_SSC-D0128SC- 5 Reallocated_Sector_Ct 0x0013 100 100 050 Pre-fail Always - 0
#/dev/sda ATA WDC_SSC-D0128SC- 7 Seek_Error_Rate 0x000b 100 100 050 Pre-fail Always - 0
#/dev/sda ATA WDC_SSC-D0128SC- 9 Power_On_Hours 0x0012 100 100 000 Old_age Always - 1408
#/dev/sda ATA WDC_SSC-D0128SC- 10 Spin_Retry_Count 0x0013 100 100 050 Pre-fail Always - 0
#/dev/sda ATA WDC_SSC-D0128SC- 12 Power_Cycle_Count 0x0012 100 100 000 Old_age Always - 523
#/dev/sda ATA WDC_SSC-D0128SC- 168 Unknown_Attribute 0x0012 100 100 000 Old_age Always - 1
#/dev/sda ATA WDC_SSC-D0128SC- 175 Program_Fail_Count_Chip 0x0003 100 100 010 Pre-fail Always - 0
#/dev/sda ATA WDC_SSC-D0128SC- 192 Power-Off_Retract_Count 0x0012 100 100 000 Old_age Always - 0
#/dev/sda ATA WDC_SSC-D0128SC- 194 Temperature_Celsius 0x0022 040 100 000 Old_age Always - 40 (Lifetime Min/Max 30/60)
#/dev/sda ATA WDC_SSC-D0128SC- 197 Current_Pending_Sector 0x0012 100 100 000 Old_age Always - 0
#/dev/sda ATA WDC_SSC-D0128SC- 240 Head_Flying_Hours 0x0013 100 100 050 Pre-fail Always - 0
#/dev/sda ATA WDC_SSC-D0128SC- 170 Unknown_Attribute 0x0003 100 100 010 Pre-fail Always - 1769478
#/dev/sda ATA WDC_SSC-D0128SC- 173 Unknown_Attribute 0x0012 100 100 000 Old_age Always - 4217788040605
smart_temp_default_levels = (35, 40)
smart_stats_default_levels = {
'realloc_events': (1, 1),
'realloc_sectors': (1, 1),
'spin_retries': (1, 1),
'pending_retries': (1, 1),
'pending_sectors': (1, 1),
'cmd_timeouts': (5, 10),
'e2e_errs': (1, 1),
'uncorr_errs': (1, 1),
'udma_crcs': (1, 1),
}
def inventory_smart(check_type, info):
inventory = []
for line in info:
if len(line) < 13:
continue
if check_type == 'smart.stats' \
and line[4] in [ 'Power_On_Hours', 'Power_Cycle_Count',
'Reallocated_Sector_Ct', 'Spin_Retry_Count',
'Reallocated_Event_Count', 'Current_Pending_Sector',
'Command_Timeout', 'End-to-End_Error',
'Reported_Uncorrect', 'UDMA_CRC_Error_Count', ] \
and not (line[0], None) in inventory:
inventory.append((line[0], None, 'smart_stats_default_levels'))
elif check_type == 'smart.temp' and line[4] == 'Temperature_Celsius':
inventory.append((line[0], None, 'smart_temp_default_levels'))
return inventory
def check_smart_stats(item, params, info):
status = 0
output = []
perfdata = []
for line in info:
if len(line) != 13 or line[0] != item:
continue
for uom, lab, txt, thresh in [
(' hours', 'Power_On_Hours', 'Powered on', None),
('', 'Power_Cycle_Count', 'Power cycles', None),
('', 'Reallocated_Sector_Ct', 'Reallocated sectors', 'realloc_sectors'),
('', 'Reallocated_Event_Count', 'Reallocated events', 'realloc_events'),
('', 'Spin_Retry_Count', 'Spin retries', 'spin_retries'),
('', 'Current_Pending_Sector', 'Pending sectors', 'pending_sectors'),
('', 'Command_Timeout', 'Command timeouts', 'cmd_timeouts'),
('', 'End-to-End_Error', 'End-to-End errors', 'e2e_errs'),
('', 'Reported_Uncorrect', 'Uncorrectable errors', 'uncorr_errs'),
('', 'UDMA_CRC_Error_Count', 'UDMA CRC errors', 'udma_crcs'),
]:
if line[4] == lab:
value = int(line[12].split("/", 1)[0])
warn, crit, cur_status, thresh_out = None, None, 0, ''
if thresh in params and value >= params[thresh][1]:
cur_status = 2
thresh_out = '(!!)'
elif thresh in params and value >= params[thresh][0]:
cur_status = 1
thresh_out = '(!)'
perfdata.append((lab, value, thresh and params[thresh][0] or None, thresh and params[thresh][1] or None))
output.append('%s: %d%s%s' % (txt, value, uom, thresh_out))
status = max(status, cur_status)
if not output:
return (3, 'UNKNOWN - Found no info in agent outout')
return (status, '%s - %s' % (nagios_state_names[status], ', '.join(output)), perfdata)
# Written by Benjamin Odenthal
# http://exchange.check-mk.org/index.php?option=com_remository&Itemid=53&func=fileinfo&id=1
def check_smart_temp(item, params, info):
warn, crit = params
for line in info:
if len(line) >= 13 and line[0] == item and line[4] == "Temperature_Celsius":
celsius = int(line[12])
perfdata = [ ( "temp", celsius, warn, crit ) ]
if celsius >= crit:
return (2, "CRIT - Temperature is %dC" % celsius, perfdata)
elif celsius >= warn:
return (1, "WARN - Temperature is %dC" % celsius, perfdata)
else:
return (0, "OK - Temperature is %dC" % celsius, perfdata)
return (3, "UNKNOWN - Temperature_Celsius not found in agent output for disk %s" % item)
check_info["smart.stats"] = {
'check_function': check_smart_stats,
'inventory_function': lambda info: inventory_smart("smart.stats", info),
'service_description': 'SMART %s Stats',
'has_perfdata': True,
}
check_info["smart.temp"] = {
'check_function': check_smart_temp,
'inventory_function': lambda info: inventory_smart("smart.temp", info),
'service_description': 'Temperature SMART %s',
'group': 'disk_temperature',
'has_perfdata': True,
}
|