This repository has been archived by the owner on Nov 8, 2023. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 4
/
check_purefa_perf.py
executable file
·156 lines (136 loc) · 6.42 KB
/
check_purefa_perf.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
#!/usr/bin/env python
# Copyright (c) 2018, 2019, 2020, 2022 Pure Storage, Inc.
#
# * Overview
#
# This simple Nagios/Icinga plugin code can be used to monitor Pure Storage FlashArrays.
# The Pure Storage Python REST Client is used to query the FlashArray performance counters. An optional parameter
# allow to check a single volume instead than the whole flasharray
#
# * Installation
#
# The script should be copied to the Nagios plugins directory on the machine hosting the Nagios server or the NRPE
# for example the /usr/lib/nagios/plugins folder.
# Change the execution rights of the program to allow the execution to 'all' (usually chmod 0755).
#
"""Pure Storage FlashArray performance indicators
Nagios plugin to retrieve the six (6) basic KPIs from a Pure Storage FlashArray.
Bandwidth counters (read/write), IOPs counters (read/write) and latency (read/write) are collected from the
target FA using the REST call.
The plugin has two mandatory arguments: 'endpoint', which specifies the target FA and 'apitoken', which
specifies the autentication token for the REST call session. A third optional parameter, 'volname' can
be used to check a specific named volume.
The plugin accepts multiple warning and critical threshold parameters in a positional fashion:
1st threshold refers to write latency
2nd threshold refers to read latency
3rd threshold refers to write bandwidth
4th threshold refers to read bandwidth
5th threshold refers to write IOPS
6th threshold refers to read IOPS
"""
import sys
if not sys.warnoptions:
import warnings
warnings.simplefilter("ignore")
import argparse
import logging
import logging.handlers
import nagiosplugin
from pypureclient import flasharray, PureError
# Disable warnings using urllib3 embedded in requests or directly
try:
import requests
from requests.packages.urllib3.exceptions import InsecureRequestWarning
requests.packages.urllib3.disable_warnings(InsecureRequestWarning)
except:
import urllib3
urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning)
class PureFAperf(nagiosplugin.Resource):
"""Pure Storage FlashArray performance indicators
Get the six global KPIs of the flasharray and stores them in the
metric objects
"""
def __init__(self, endpoint, apitoken, volname=None):
self.endpoint = endpoint
self.apitoken = apitoken
self.volname = volname
self.logger = logging.getLogger(self.name)
handler = logging.handlers.SysLogHandler(address = '/dev/log')
handler.setLevel(logging.ERROR)
formatter = logging.Formatter('%(asctime)s - %(name)s - %(levelname)s - %(message)s')
handler.setFormatter(formatter)
self.logger.addHandler(handler)
@property
def name(self):
if (self.volname is None):
return 'PURE_FA_PERF'
else:
return 'PURE_FA_VOL_PERF'
def get_perf(self):
"""Get performance counters from flasharray."""
fainfo = {}
try:
client = flasharray.Client(target=self.endpoint,
api_token=self.apitoken,
user_agent='Pure_Nagios_plugin/0.2.0')
if (self.volname is None):
res = client.get_arrays_performance()
else:
res = client.get_volumes_performance(names=[self.volname])
if isinstance(res, flasharray.ValidResponse):
fainfo = res.items.next()
except Exception as e:
raise nagiosplugin.CheckError('FA REST call returned "{}"'.format(e))
return(fainfo)
def probe(self):
fainfo = self.get_perf()
if not fainfo:
return []
wlat = int(fainfo.usec_per_write_op)
rlat = int(fainfo.usec_per_read_op)
wbw = int(fainfo.write_bytes_per_sec)
rbw = int(fainfo.read_bytes_per_sec)
wiops = int(fainfo.writes_per_sec)
riops = int(fainfo.reads_per_sec)
if (self.volname is None):
mlabel = 'FA_'
else:
mlabel = self.volname + '_'
metrics = [
nagiosplugin.Metric(mlabel + 'wlat', wlat, 'us', min=0, context='wlat'),
nagiosplugin.Metric(mlabel + 'rlat', rlat, 'us', min=0, context='rlat'),
nagiosplugin.Metric(mlabel + 'wbw', wbw, min=0, context='wbw'),
nagiosplugin.Metric(mlabel + 'rbw', rbw, min=0, context='rbw'),
nagiosplugin.Metric(mlabel + 'wiops', wiops, min=0, context='wiops'),
nagiosplugin.Metric(mlabel + 'riops', riops, min=0, context='riops')
]
return metrics
def parse_args():
argp = argparse.ArgumentParser()
argp.add_argument('endpoint', help="FA hostname or ip address")
argp.add_argument('apitoken', help="FA api_token")
argp.add_argument('--vol', help="FA volme. If omitted the whole FA performance counters are checked")
argp.add_argument('--tw', '--ttot-warning', metavar='RANGE[,RANGE,...]',
type=nagiosplugin.MultiArg, default='',
help="positional thresholds: write_latency, read_latency, write_bandwidth, read_bandwidth, write_iops, read_iops")
argp.add_argument('--tc', '--ttot-critical', metavar='RANGE[,RANGE,...]',
type=nagiosplugin.MultiArg, default='',
help="positional thresholds: write_latency, read_latency, write_bandwidth, read_bandwidth, write_iops, read_iops")
argp.add_argument('-v', '--verbose', action='count', default=0,
help='increase output verbosity (use up to 3 times)')
argp.add_argument('-t', '--timeout', default=30,
help='abort execution after TIMEOUT seconds')
return argp.parse_args()
@nagiosplugin.guarded
def main():
args = parse_args()
check = nagiosplugin.Check( PureFAperf(args.endpoint, args.apitoken, args.vol) )
check.add(nagiosplugin.ScalarContext('wlat', args.tw[0], args.tc[0]))
check.add(nagiosplugin.ScalarContext('rlat', args.tw[1], args.tc[1]))
check.add(nagiosplugin.ScalarContext('wbw', args.tw[2], args.tc[2]))
check.add(nagiosplugin.ScalarContext('rbw', args.tw[3], args.tc[3]))
check.add(nagiosplugin.ScalarContext('wiops', args.tw[4], args.tc[4]))
check.add(nagiosplugin.ScalarContext('riops', args.tw[5], args.tc[5]))
check.main(args.verbose, args.timeout)
if __name__ == '__main__':
main()