1
0
mirror of https://github.com/opinkerfi/nagios-plugins.git synced 2024-11-25 03:43:46 +01:00
nagios-plugins/check_storwize/check_storwize.py

206 lines
7.2 KiB
Python
Raw Normal View History

#!/usr/bin/env python
from pynag.Plugins import PluginHelper, ok, warning, critical, unknown
from pynag.Utils import runCommand
from collections import namedtuple
2013-12-06 14:58:44 +01:00
# Space-separated names of every query that -Q accepts (printed by -L)
valid_queries = "lsarray lsdrive lsenclosurebattery lsenclosurecanister lsenclosurepsu lsenclosureslot lsenclosure lsmdiskgrp lsmdskgrp lsmgrp lsrcrelationship lsvdisk"

# Declare the command line interface of the plugin
p = PluginHelper()
p.add_option(
    "-H", "--hostname", '-M',
    help="Hostname or ip address",
    dest="hostname",
)
p.add_option(
    "-U", "--user",
    help="Log in as this user to storwize",
    dest="user",
    default="nagios",
)
p.add_option(
    "-Q", "--query",
    help="Query to send to storwize (see also -L)",
    dest="query",
    default="lsarray",
)
p.add_option(
    "-L", "--list-queries",
    help="List of valid queries",
    dest="list_queries",
    action="store_true",
)
p.add_option(
    "--test",
    help="Run this plugin in test mode",
    dest="test",
    action="store_true",
)
p.parse_arguments()

query = p.options.query

# -L is answered through the parser's error channel, which also ends the run
if p.options.list_queries is True:
    p.parser.error("Valid Queries: %s" % valid_queries)

# A target host is mandatory
if not p.options.hostname:
    p.parser.error("Required options -H is missing")

# Refuse anything that is not in the list of known queries
if query not in valid_queries.split():
    p.parser.error("%s does not look like a valid query. Use -L for a list of valid queries" % query)
2013-11-19 16:59:36 +01:00
# Connect to remote storwize and run a query
2013-11-19 16:59:36 +01:00
def _parse_rows(output):
    """Turn colon-delimited command output into a list of Row namedtuples.

    The first non-blank line supplies the field names; every following
    non-blank line becomes one Row. Returns an empty list when the output
    contains no non-blank lines at all.
    """
    # Blank lines carry no data; dropping them keeps empty output and stray
    # newlines from raising IndexError/TypeError further down.
    lines = [line.strip() for line in output.splitlines() if line.strip()]
    if not lines:
        return []

    headers = lines[0].split(':')
    Row = namedtuple('Row', ' '.join(headers))
    return [Row(*line.split(':')) for line in lines[1:]]


def run_query():
    """Run the selected query and return its output as a list of rows.

    The query in ``p.options.query`` is sent over ssh to
    ``p.options.user@p.options.hostname`` with ``-delim ':'``. When
    ``p.options.test`` is set, the output is read with ``cat`` from
    ``<query>.txt`` instead.

    If the command returns a non-zero code or writes anything to stderr,
    the plugin status is set to unknown, the details are added to the
    plugin output and ``p.exit()`` is called.

    Returns:
        A list of ``Row`` namedtuples whose fields are named after the
        columns of the header line; an empty list if nothing was printed.
    """
    # shlex.quote is the Python 3 name, pipes.quote the Python 2 one.
    try:
        from shlex import quote
    except ImportError:
        from pipes import quote

    # User and host come from the command line and end up in a shell command
    # string, so quote them. Values without shell metacharacters are
    # returned unchanged by quote().
    command = "ssh %s@%s %s -delim ':'" % (
        quote(p.options.user),
        quote(p.options.hostname),
        p.options.query,
    )
    if p.options.test:
        command = "cat %s.txt" % (p.options.query)

    return_code, stdout, stderr = runCommand(command)

    if return_code != 0:
        p.status(unknown)
        p.add_summary("Got error %s when trying to log into remote storwize box" % return_code)
        p.add_long_output("\ncommand:\n===============\n%s" % command)
        p.add_long_output("\nStandard output:\n==============\n%s" % (stdout))
        p.add_long_output("\nStandard stderr:\n==============\n%s" % (stderr))
        p.exit()
    if stderr:
        p.status(unknown)
        p.add_summary("Error when connecting to storwize: %s" % stderr)
        p.exit()

    # Parse the output of the query and return a list of "rows"
    return _parse_rows(stdout)
def check_lsmdiskgrp():
    """Evaluate lsmdiskgrp rows.

    Adds the number of groups to the summary and metrics, sets status
    critical for every group whose status is not 'online', and records
    used/total capacity of each group as long output and as a metric.
    """
    group_count = len(rows)
    p.add_summary("%s diskgroups found" % group_count)
    p.add_metric("number of groups", group_count)

    for group in rows:
        if group.status != 'online':
            p.status(critical)
            p.add_summary("group %s is %s." % (group.name, group.status))

        used, total = group.used_capacity, group.capacity
        p.add_long_output("%s: used: %s out of %s" % (group.name, used, total))

        # One performance metric per group, with the capacity as its maximum
        p.add_metric("%s_capacity" % group.name, value=used, max=total)
def check_lsdrive():
    """Evaluate lsdrive rows.

    Adds the number of drives to the summary and metrics and sets status
    critical for every drive whose status is not 'online'.
    """
    drive_count = len(rows)
    p.add_summary("%s drives found" % drive_count)
    p.add_metric("number of drives", drive_count)

    for drive in rows:
        if drive.status == 'online':
            continue
        p.status(critical)
        p.add_summary("drive %s is %s" % (drive.id, drive.status))
2013-12-06 16:48:55 +01:00
def check_lsmgrp():
    """Evaluate lsmgrp rows.

    Adds the number of groups to the summary and metrics and sets status
    critical for every group whose status is not 'online'.
    """
    total = len(rows)
    p.add_summary("%s groups found" % total)
    p.add_metric("number of groups", total)

    # Only groups that are not online need reporting
    for group in (entry for entry in rows if entry.status != 'online'):
        p.status(critical)
        p.add_summary("group %s is %s" % (group.name, group.status))
2013-12-06 14:58:44 +01:00
def check_lsenclosurebattery():
    """Evaluate lsenclosurebattery rows.

    Adds the number of batteries to the summary and metrics and sets status
    critical for every battery whose status is not 'online'.
    """
    battery_count = len(rows)
    p.add_summary("%s batteries found" % battery_count)
    p.add_metric("number of batteries", battery_count)

    for battery in rows:
        state = battery.status
        if state == 'online':
            continue
        p.status(critical)
        # Batteries are identified as <enclosure id>:<battery id>
        location = (battery.enclosure_id, battery.battery_id)
        p.add_summary("battery %s:%s is %s" % (location + (state,)))
2013-12-06 15:16:57 +01:00
def check_lsenclosurecanister():
    """Evaluate lsenclosurecanister rows.

    Adds the number of canisters to the summary and metrics and sets status
    critical for every canister whose status is not 'online'.
    """
    canister_count = len(rows)
    p.add_summary("%s canisters found" % canister_count)
    p.add_metric("number of canisters", canister_count)

    # Only canisters that are not online need reporting
    for canister in (entry for entry in rows if entry.status != 'online'):
        p.status(critical)
        p.add_summary(
            "canister %s:%s is %s"
            % (canister.enclosure_id, canister.canister_id, canister.status)
        )
2013-12-06 15:18:15 +01:00
def check_lsenclosurepsu():
    """Evaluate lsenclosurepsu rows.

    Adds the number of power supplies to the summary and metrics and sets
    status critical for every PSU whose status is not 'online'.
    """
    psu_count = len(rows)
    p.add_summary("%s psu found" % psu_count)
    p.add_metric("number of psu", psu_count)

    for psu in rows:
        if psu.status == 'online':
            continue
        p.status(critical)
        p.add_summary("psu %s:%s is %s" % (psu.enclosure_id, psu.PSU_id, psu.status))
def check_lsenclosure():
    """Evaluate lsenclosure rows.

    Adds the number of enclosures to the summary and metrics and sets status
    critical for every enclosure whose status is not 'online'.
    """
    enclosure_count = len(rows)
    p.add_summary("%s enclosures found" % enclosure_count)
    p.add_metric("number of enclosures", enclosure_count)

    # Only enclosures that are not online need reporting
    for enclosure in (entry for entry in rows if entry.status != 'online'):
        p.status(critical)
        p.add_summary("enclosure %s is %s" % (enclosure.id, enclosure.status))
2013-12-06 16:48:55 +01:00
def check_lsenclosureslot():
    """Evaluate lsenclosureslot rows.

    Adds the number of slots to the summary and metrics and sets status
    critical for every slot port (port 1 and port 2 are checked separately)
    whose status is not 'online'.
    """
    slot_count = len(rows)
    p.add_summary("%s slots found" % slot_count)
    p.add_metric("number of slots", slot_count)

    for slot in rows:
        first_port = slot.port_1_status
        if first_port != 'online':
            p.status(critical)
            p.add_summary("port1 on slot %s:%s is %s" % (slot.enclosure_id, slot.slot_id, first_port))

        second_port = slot.port_2_status
        if second_port != 'online':
            p.status(critical)
            p.add_summary("port2 on slot %s:%s is %s" % (slot.enclosure_id, slot.slot_id, second_port))
2013-12-06 15:18:15 +01:00
def check_lsrcrelationship():
    """Evaluate lsrcrelationship rows.

    Adds the number of relationships to the summary and metrics and sets
    status critical for every relationship whose state is not
    'consistent_synchronized'.
    """
    relationship_count = len(rows)
    p.add_summary("%s cluster relationships found" % relationship_count)
    p.add_metric("number of relationships", relationship_count)

    for relationship in rows:
        state = relationship.state
        if state == 'consistent_synchronized':
            continue
        p.status(critical)
        p.add_summary("%s is %s" % (relationship.consistency_group_name, state))
2013-12-06 15:16:57 +01:00
def check_lsvdisk():
    """Evaluate lsvdisk rows.

    Adds the number of disks to the summary and metrics and sets status
    critical for every disk whose status is not 'online'.
    """
    disk_count = len(rows)
    p.add_summary("%s disks found" % disk_count)
    p.add_metric("number of disks", disk_count)

    for disk in rows:
        if disk.status == 'online':
            continue
        p.status(critical)
        p.add_summary("disk %s is %s" % (disk.name, disk.status))
2013-11-19 16:59:36 +01:00
def check_lsarray():
    """Evaluate lsarray rows.

    Adds the number of arrays to the summary and metrics, sets status
    critical for every array whose status or raid_status is not 'online',
    and records the capacity of each array as a metric.
    """
    array_count = len(rows)
    p.add_summary("%s arrays found" % array_count)
    p.add_metric("number of arrays", array_count)

    for array in rows:
        # The array itself and its raid state are judged independently
        if array.status != 'online':
            p.add_summary("array %s is %s." % (array.mdisk_name, array.status))
            p.status(critical)
        if array.raid_status != 'online':
            p.add_summary("array %s has raid status %s." % (array.mdisk_name, array.raid_status))
            p.status(critical)

        # Capacity of every array goes out as a performance metric
        p.add_metric(array.mdisk_name + "_capacity", value=array.capacity)
# Run our given query, and parse the output
rows = run_query()

# Every supported query mapped onto the function that evaluates its rows
handlers = {
    'lsmdiskgrp': check_lsmdiskgrp,
    'lsarray': check_lsarray,
    'lsdrive': check_lsdrive,
    'lsvdisk': check_lsvdisk,
    'lsmgrp': check_lsmgrp,
    'lsenclosure': check_lsenclosure,
    'lsenclosurebattery': check_lsenclosurebattery,
    'lsenclosurecanister': check_lsenclosurecanister,
    'lsenclosurepsu': check_lsenclosurepsu,
    'lsrcrelationship': check_lsrcrelationship,
    'lsenclosureslot': check_lsenclosureslot,
}

handler = handlers.get(query)
if handler is None:
    # The query passed validation but has no check implemented for it
    p.status(unknown)
    p.add_summary("unsupported query: %s. See -L for list of valid queries" % query)
    p.exit()
else:
    handler()

# Check metrics and exit
p.check_all_metrics()
p.exit()