summaryrefslogtreecommitdiffstats
path: root/plugins/check_cluster_vol_usage.py
diff options
context:
space:
mode:
authorSahina Bose <sabose@redhat.com>2014-03-14 12:49:59 +0530
committerBala.FA <barumuga@redhat.com>2014-04-29 10:21:36 +0530
commitad004f45088ee81723b2a2420b3bce01f0bd845b (patch)
tree126104f6a84140b5f459b44d641e94ae4376d3d9 /plugins/check_cluster_vol_usage.py
parent998e1f9ef43f8fd6e2a7a3722bfd4f3f734c450d (diff)
plugins: Plugin to check the cluster utilization
This plugin sums up the volume utilization outputs in a cluster Added a utils livestatus for common code related to mk_livestatus Added constants for livestatussocket path Change-Id: Id665ad3aaa1140e54c831d721ee874421ae84fa3 Signed-off-by: Sahina Bose <sabose@redhat.com> Reviewed-on: https://cuckoo.blr.redhat.com:8443/10 Reviewed-by: Bala FA <barumuga@redhat.com>
Diffstat (limited to 'plugins/check_cluster_vol_usage.py')
-rwxr-xr-xplugins/check_cluster_vol_usage.py105
1 files changed, 105 insertions, 0 deletions
diff --git a/plugins/check_cluster_vol_usage.py b/plugins/check_cluster_vol_usage.py
new file mode 100755
index 0000000..2225634
--- /dev/null
+++ b/plugins/check_cluster_vol_usage.py
@@ -0,0 +1,105 @@
+#!/usr/bin/python
+#
+# check_cluster_vol_usage
+# Aggregated cluster capacity utilization for a
+# gluster cluster
+# The plugin reads status data using mk-livestatus
+# Assumptions:
+# - Volume utilization service names begin with "Volume-"
+# - Host name associated is cluster name
+# - All volume utilization output is of form
+# "used=<val>;warn;crit;min;max"
+#
+# Copyright (C) 2014 Red Hat Inc
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA
+#
+
+import sys
+import re
+from argparse import ArgumentParser
+from plugins import livestatus
+
+
+def checkVolumePerfData(clusterName):
+
+ # Write command to socket
+ cmd = "GET services\nColumns: description host_name " \
+ "perf_data custom_variables\nFilter: " \
+ "description ~~ %s\n" % 'Volume-'
+ table = livestatus.readLiveStatus(cmd)
+ totalUsed = 0.0
+ totalAvail = 0.0
+ for row in table:
+ if len(row) <= 3:
+ return 0.0, 0.0
+ host = row[1]
+ perf_data = row[2]
+ if len(perf_data) > 2:
+ perf_arr = perf_data.split(' ')
+ used = perf_arr[2].split('=')[1]
+ avail = perf_arr[1].split('=')[1]
+ if host == clusterName:
+ totalUsed += float(re.match(r'\d*\.?\d+', used).group())
+ totalAvail += float(re.match(r'\d*\.?\d+', avail).group())
+ return totalUsed, totalAvail
+
+# Main method
+if __name__ == "__main__":
+
+ parser = ArgumentParser(description=
+ "Calculate the aggregate "
+ "capacity usage in cluster")
+ parser.add_argument('-w', '--warning',
+ action='store',
+ type=int,
+ dest='warn',
+ help='Warning in %',
+ default=70)
+ parser.add_argument('-c', '--critical',
+ action='store',
+ type=int,
+ dest='crit',
+ help='Critical threshold Warning in %',
+ default=95)
+ parser.add_argument('-hg', '--host-group',
+ action='store',
+ type=str,
+ dest='hostgroup',
+ help='Name of cluster or hostgroup',
+ required=True)
+ args = parser.parse_args()
+ # Check the various performance statuses for the host
+ used, avail = checkVolumePerfData(args.hostgroup)
+ statusstr = "OK"
+ exitstatus = 0
+ if used == 0 and avail == 0:
+ statusstr = "UNKNOWN"
+ exitstatus = 3
+ else:
+ warn = int((args.warn * avail) / 100.0)
+ crit = int((args.crit * avail) / 100.0)
+ usedpercent = int((used/avail) * 100.0)
+ if (usedpercent >= args.warn):
+ statusstr = "WARNING"
+ exitstatus = 1
+ if (usedpercent >= args.crit):
+ statusstr = "CRITICAL"
+ exitstatus = 2
+
+ print ("%s - used %s%% of available %s|used=%s;%s;%s;0;%s;"
+ % (statusstr, usedpercent,
+ avail, usedpercent, args.warn, args.crit, 100))
+ sys.exit(exitstatus)