check_naf.py 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380
  1. #!/usr/bin/env python
  2. # -*- encoding: utf-8 -*-
  3. #####################################################################
  4. # (c) 2006-2010 by Sven Velt and team(ix) GmbH, Nuernberg, Germany #
  5. # sv@teamix.net #
  6. # #
  7. # This file is part of check_naf (FKA check_netappfiler) #
  8. # #
  9. # check_naf is free software: you can redistribute it and/or modify #
  10. # it under the terms of the GNU General Public License as published #
  11. # by the Free Software Foundation, either version 2 of the License, #
  12. # or (at your option) any later version. #
  13. # #
  14. # check_naf is distributed in the hope that it will be useful, but #
  15. # WITHOUT ANY WARRANTY; without even the implied warranty of #
  16. # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the #
  17. # GNU General Public License for more details. #
  18. # #
  19. # You should have received a copy of the GNU General Public License #
  20. # along with check_naf. If not, see <http://www.gnu.org/licenses/>. #
  21. #####################################################################
  22. from monitoringplugin import SNMPMonitoringPlugin
  23. class CheckNAF(SNMPMonitoringPlugin):
  24. OID = {
  25. 'CPU_Arch': '.1.3.6.1.4.1.789.1.1.11.0',
  26. 'CPU_Time_Busy': '.1.3.6.1.4.1.789.1.2.1.3.0',
  27. 'CPU_Time_Idle': '.1.3.6.1.4.1.789.1.2.1.5.0',
  28. 'CPU_Context_Switches': '.1.3.6.1.4.1.789.1.2.1.8.0',
  29. 'Disks_Total': '.1.3.6.1.4.1.789.1.6.4.1.0',
  30. 'Disks_Active': '.1.3.6.1.4.1.789.1.6.4.2.0',
  31. 'Disks_Reconstructing': '.1.3.6.1.4.1.789.1.6.4.3.0',
  32. 'Disks_ReconstParity': '.1.3.6.1.4.1.789.1.6.4.4.0',
  33. 'Disks_Scrubbing': '.1.3.6.1.4.1.789.1.6.4.6.0',
  34. 'Disks_Failed': '.1.3.6.1.4.1.789.1.6.4.7.0',
  35. 'Disks_Spare': '.1.3.6.1.4.1.789.1.6.4.8.0',
  36. 'Disks_ZeroDisks': '.1.3.6.1.4.1.789.1.6.4.9.0',
  37. 'Disks_Failed_Descr': '.1.3.6.1.4.1.789.1.6.4.10.0',
  38. 'Global_Status': '.1.3.6.1.4.1.789.1.2.2.4.0',
  39. 'Global_Status_Message': '.1.3.6.1.4.1.789.1.2.2.25.0',
  40. 'NVRAM_Status': '.1.3.6.1.4.1.789.1.2.5.1.0',
  41. 'Model': '.1.3.6.1.4.1.789.1.1.5.0',
  42. 'ONTAP_Version': '.1.3.6.1.4.1.789.1.1.2.0',
  43. 'df_FS_Index': '.1.3.6.1.4.1.789.1.5.4.1.1',
  44. 'df_FS_Name': '.1.3.6.1.4.1.789.1.5.4.1.2',
  45. 'df_FS_Mounted_On': '.1.3.6.1.4.1.789.1.5.4.1.10',
  46. 'df_FS_Status': '.1.3.6.1.4.1.789.1.5.4.1.20',
  47. 'df_FS_Type': '.1.3.6.1.4.1.789.1.5.4.1.23',
  48. 'df_FS_kBTotal': ['.1.3.6.1.4.1.789.1.5.4.1.29', '.1.3.6.1.4.1.789.1.5.4.1.15', '.1.3.6.1.4.1.789.1.5.4.1.14',],
  49. 'df_FS_kBUsed': ['.1.3.6.1.4.1.789.1.5.4.1.30', '.1.3.6.1.4.1.789.1.5.4.1.17', '.1.3.6.1.4.1.789.1.5.4.1.16',],
  50. 'df_FS_kBAvail': ['.1.3.6.1.4.1.789.1.5.4.1.31', '.1.3.6.1.4.1.789.1.5.4.1.19', '.1.3.6.1.4.1.789.1.5.4.1.18',],
  51. 'df_FS_INodeUsed': '.1.3.6.1.4.1.789.1.5.4.1.7',
  52. 'df_FS_INodeFree': '.1.3.6.1.4.1.789.1.5.4.1.8',
  53. 'df_FS_MaxFilesAvail': '.1.3.6.1.4.1.789.1.5.4.1.11',
  54. 'df_FS_MaxFilesUsed': '.1.3.6.1.4.1.789.1.5.4.1.12',
  55. 'df_FS_MaxFilesPossible': '.1.3.6.1.4.1.789.1.5.4.1.13',
  56. }
  57. OWC = {
  58. 'Global_Status': ( (3,), (4,), (5,6), ),
  59. 'NVRAM_Status': ( (1,9), (2,5,8), (3,4,6), ),
  60. }
  61. Status2String = {
  62. 'CPU_Arch' : { '1' : 'x86', '2' : 'alpha', '3' : 'mips', '4' : 'sparc', '5' : 'amd64', },
  63. 'NVRAM_Status' : { '1' : 'ok', '2' : 'partiallyDischarged', '3' : 'fullyDischarged', '4' : 'notPresent', '5' : 'nearEndOfLife', '6' : 'atEndOfLife', '7' : 'unknown', '8' : 'overCharged', '9' : 'fullyCharged', },
  64. 'df_FS_Status' : { '1' : 'unmounted', '2' : 'mounted', '3' : 'frozen', '4' : 'destroying', '5' : 'creating', '6' : 'mounting', '7' : 'unmounting', '8' : 'nofsinfo', '9' : 'replaying', '10': 'replayed', },
  65. 'df_FS_Type' : { '1' : 'traditionalVolume', '2' : 'flexibleVolume', '3' : 'aggregate', },
  66. }
  67. def map_status_to_returncode(self, value, mapping):
  68. for returncode in xrange(0,3):
  69. if value in mapping[returncode]:
  70. return returncode
  71. return 3
  72. def check_cpu(self, warn='', crit=''):
  73. cpu_arch = self.SNMPGET(self.OID['CPU_Arch'])
  74. cpu_timebusy = int(self.SNMPGET(self.OID['CPU_Time_Busy']))
  75. # cputimeidle = int(self.SNMPGET(self.OID['CPU_Time_Idle']))
  76. cpu_cs = self.SNMPGET(self.OID['CPU_Context_Switches'])
  77. if '%' in warn:
  78. warn = warn[:-1]
  79. if '%' in crit:
  80. crit = crit[:-1]
  81. returncode = self.value_wc_to_returncode(cpu_timebusy, warn, crit)
  82. output = 'CPU ' + str(cpu_timebusy) + '% busy, CPU architecture: ' + self.Status2String['CPU_Arch'].get(cpu_arch)
  83. perfdata = []
  84. pd = {'label':'nacpu', 'value':cpu_timebusy, 'unit':'%', 'min':0, 'max':100}
  85. if warn:
  86. pd['warn'] = warn
  87. if crit:
  88. pd['crit'] = crit
  89. perfdata.append(pd)
  90. perfdata.append({'label':'nacs', 'value':cpu_cs, 'unit':'c'})
  91. return self.remember_check('cpu', returncode, output, perfdata=perfdata)
  92. def check_disk(self, target='failed', warn='', crit=''):
  93. di_total = int(self.SNMPGET(self.OID['Disks_Total']))
  94. di_active = int(self.SNMPGET(self.OID['Disks_Active']))
  95. di_reconstructing = int(self.SNMPGET(self.OID['Disks_Reconstructing']))
  96. di_reconstparity = int(self.SNMPGET(self.OID['Disks_ReconstParity']))
  97. # di_scrubbing = int(self.SNMPGET(self.OID['Disks_Scrubbing']))
  98. di_failed = int(self.SNMPGET(self.OID['Disks_Failed']))
  99. di_spare = int(self.SNMPGET(self.OID['Disks_Spare']))
  100. # di_zerodisks = int(self.SNMPGET(self.OID['Disks_ZeroDisks']))
  101. di_reconstr = di_reconstructing + di_reconstparity
  102. if target == 'spare':
  103. returncode = self.value_wc_to_returncode(di_spare, warn, crit)
  104. output = str(di_spare) + ' spare disk'
  105. if di_spare > 1:
  106. output += 's'
  107. else:
  108. target = 'failed' # Set to defined value
  109. returncode = self.value_wc_to_returncode(di_failed, warn, crit)
  110. if returncode == 0:
  111. output = 'No failed disks'
  112. else:
  113. output = self.SNMPGET(self.OID['Disks_Failed_Descr'])
  114. perfdata = []
  115. perfdata.append({'label':'nadisk_total', 'value':di_total, 'unit':'', 'min':0})
  116. perfdata.append({'label':'nadisk_active', 'value':di_active, 'unit':'', 'min':0})
  117. pd = {'label':'nadisk_spare', 'value':di_spare, 'unit':'', 'min':0}
  118. if warn and target=='spare':
  119. pd['warn'] = warn
  120. if crit and target=='spare':
  121. pd['crit'] = crit
  122. perfdata.append(pd)
  123. pd = {'label':'nadisk_failed', 'value':di_failed, 'unit':'', 'min':0}
  124. if warn and target=='failed':
  125. pd['warn'] = warn
  126. if crit and target=='failed':
  127. pd['crit'] = crit
  128. perfdata.append(pd)
  129. return self.remember_check('disk', returncode, output, perfdata=perfdata, target=target)
  130. def check_global(self):
  131. model = self.SNMPGET(self.OID['Model'])
  132. globalstatus = int(self.SNMPGET(self.OID['Global_Status']))
  133. globalstatusmsg = self.SNMPGET(self.OID['Global_Status_Message'])[:255]
  134. returncode = self.map_status_to_returncode(globalstatus, self.OWC['Global_Status'])
  135. output = model + ': ' + globalstatusmsg
  136. return self.remember_check('global', returncode, output)
  137. def check_nvram(self):
  138. nvramstatus = int(self.SNMPGET(self.OID['NVRAM_Status']))
  139. returncode = self.map_status_to_returncode(nvramstatus, self.OWC['NVRAM_Status'])
  140. output = 'NVRAM battery status is "' + self.Status2String['NVRAM_Status'].get(str(nvramstatus)) + '"'
  141. return self.remember_check('nvram', returncode, output)
  142. def check_version(self):
  143. model = self.SNMPGET(self.OID['Model'])
  144. ontapversion = self.SNMPGET(self.OID['ONTAP_Version'])
  145. return self.remember_check('version', 0, model + ': ' + ontapversion)
  146. def common_vol_idx(self, volume):
  147. if volume.endswith('.snapshot'):
  148. return None
  149. idx = str(self.find_in_table(self.OID['df_FS_Index'], self.OID['df_FS_Name'] , volume))
  150. sn_idx = int(idx) + 1
  151. return (idx, sn_idx)
  152. def check_vol_data(self, volume, warn, crit):
  153. (idx, sn_idx) = self.common_vol_idx(volume)
  154. fs_total = long(self.SNMPGET(self.OID['df_FS_kBTotal'], idx)) * 1024L
  155. fs_used = long(self.SNMPGET(self.OID['df_FS_kBUsed'], idx)) * 1024L
  156. # fs_avail = long(self.SNMPGET(self.OID['df_FS_kBAvail'], idx)) * 1024L
  157. sn_total = long(self.SNMPGET(self.OID['df_FS_kBTotal'], sn_idx)) * 1024L
  158. sn_used = long(self.SNMPGET(self.OID['df_FS_kBUsed'], sn_idx)) * 1024L
  159. # sn_avail = long(self.SNMPGET(self.OID['df_FS_kBAvail'], sn_idx)) * 1024L
  160. mountedon = self.SNMPGET(self.OID['df_FS_Mounted_On'] + "." + idx)
  161. status = self.Status2String['df_FS_Status'].get(self.SNMPGET(self.OID['df_FS_Status'] + "." + idx))
  162. fstype = self.Status2String['df_FS_Type'].get(self.SNMPGET(self.OID['df_FS_Type'] + "." + idx))
  163. fs_pctused = float(fs_used) / float(fs_total) * 100.0
  164. warn = self.range_dehumanize(warn, fs_total)
  165. crit = self.range_dehumanize(crit, fs_total)
  166. returncode = self.value_wc_to_returncode(fs_used, warn, crit)
  167. output = volume + ': Used ' + self.value_to_human_binary(fs_used, 'B')
  168. output += ' (' + '%3.1f' % fs_pctused + '%)'+ ' out of ' + self.value_to_human_binary(fs_total, 'B')
  169. target = volume.replace('/vol/', '')[:-1]
  170. perfdata = []
  171. perfdata.append({'label':'navdu_' + target, 'value':fs_used, 'unit':'B', 'warn':warn, 'crit':crit, 'min':0})
  172. perfdata.append({'label':'navdt_' + target, 'value':fs_total, 'unit':'B'})
  173. perfdata.append({'label':'navsu_' + target, 'value':sn_used, 'unit':'B', 'min':0})
  174. perfdata.append({'label':'navst_' + target, 'value':sn_total, 'unit':'B'})
  175. return self.remember_check('vol_data', returncode, output, perfdata=perfdata, target=target)
  176. def check_vol_snap(self, volume, warn, crit):
  177. (idx, sn_idx) = self.common_vol_idx(volume)
  178. # fs_total = long(self.SNMPGET(self.OID['df_FS_kBTotal'], idx)) * 1024L
  179. # fs_used = long(self.SNMPGET(self.OID['df_FS_kBUsed'], idx)) * 1024L
  180. # fs_avail = long(self.SNMPGET(self.OID['df_FS_kBAvail'], idx)) * 1024L
  181. sn_total = long(self.SNMPGET(self.OID['df_FS_kBTotal'], sn_idx)) * 1024L
  182. sn_used = long(self.SNMPGET(self.OID['df_FS_kBUsed'], sn_idx)) * 1024L
  183. # sn_avail = long(self.SNMPGET(self.OID['df_FS_kBAvail'], sn_idx)) * 1024L
  184. sn_pctused = float(sn_used) / float(sn_total) * 100.0
  185. warn = self.range_dehumanize(warn, sn_total)
  186. crit = self.range_dehumanize(crit, sn_total)
  187. returncode = self.value_wc_to_returncode(sn_used, warn, crit)
  188. output = volume + '.snapshot: Used ' + self.value_to_human_binary(sn_used, 'B')
  189. output += ' (' + '%3.1f' % sn_pctused + '%)'+ ' out of ' + self.value_to_human_binary(sn_total, 'B')
  190. target = volume.replace('/vol/', '')[:-1]
  191. perfdata = []
  192. perfdata.append({'label':'navsu_' + target, 'value':sn_used, 'unit':'B', 'warn':warn, 'crit':crit, 'min':0})
  193. perfdata.append({'label':'navst_' + target, 'value':sn_total, 'unit':'B'})
  194. return self.remember_check('vol_snap', returncode, output, perfdata=perfdata, target=target)
  195. def check_vol_inode(self, volume, warn, crit):
  196. (idx, sn_idx) = self.common_vol_idx(volume)
  197. in_used = long(self.SNMPGET(self.OID['df_FS_INodeUsed'] + '.' + idx))
  198. in_free = long(self.SNMPGET(self.OID['df_FS_INodeFree'] + '.' + idx))
  199. in_total = in_used + in_free
  200. in_pctused = float(in_used) / float(in_total) * 100.0
  201. warn = self.range_dehumanize(warn, in_total)
  202. crit = self.range_dehumanize(crit, in_total)
  203. returncode = self.value_wc_to_returncode(in_used, warn, crit)
  204. output = volume + ': Used inodes ' + self.value_to_human_si(in_used)
  205. output += ' (' + '%3.1f' % in_pctused + '%)'+ ' out of ' + self.value_to_human_si(in_total)
  206. target = volume.replace('/vol/', '')[:-1]
  207. perfdata = []
  208. perfdata.append({'label':'naviu_' + target, 'value':in_used, 'unit':None, 'warn':warn, 'crit':crit, 'min':0})
  209. perfdata.append({'label':'navit_' + target, 'value':in_total, 'unit':None})
  210. return self.remember_check('vol_inode', returncode, output, perfdata=perfdata, target=target)
  211. def check_vol_files(self, volume, warn, crit):
  212. (idx, sn_idx) = self.common_vol_idx(volume)
  213. fi_avail = long(self.SNMPGET(self.OID['df_FS_MaxFilesAvail'] + '.' + idx))
  214. fi_used = long(self.SNMPGET(self.OID['df_FS_MaxFilesUsed'] + '.' + idx))
  215. fi_possible = long(self.SNMPGET(self.OID['df_FS_MaxFilesPossible'] + '.' + idx))
  216. fi_total = fi_used + fi_avail
  217. fi_pctused = float(fi_used) / float(fi_total) * 100.0
  218. warn = self.range_dehumanize(warn, fi_total)
  219. crit = self.range_dehumanize(crit, fi_total)
  220. returncode = self.value_wc_to_returncode(fi_used, warn, crit)
  221. output = volume + ': Used files ' + self.value_to_human_si(fi_used)
  222. output += ' (' + '%3.1f' % fi_pctused + '%)'+ ' out of ' + self.value_to_human_si(fi_total)
  223. output += ', may raised to ' + self.value_to_human_si(fi_possible)
  224. target = volume.replace('/vol/', '')[:-1]
  225. perfdata = []
  226. perfdata.append({'label':'navfu_' + target, 'value':fi_used, 'unit':None, 'warn':warn, 'crit':crit, 'min':0})
  227. perfdata.append({'label':'navft_' + target, 'value':fi_total, 'unit':None})
  228. return self.remember_check('vol_files', returncode, output, perfdata=perfdata, target=target)
  229. def main():
  230. plugin = CheckNAF(pluginname='check_naf', tagforstatusline='NAF', description=u'Monitoring NetApp™ FAS systems', version='0.9')
  231. plugin.add_cmdlineoption('', '--check', 'check', 'OBSOLETE - use new syntax!', default='')
  232. plugin.add_cmdlineoption('', '--target', 'target', 'OBSOLETE - use new syntax!', default='')
  233. plugin.add_cmdlineoption('-w', '', 'warn', 'OBSOLETE - use new syntax!', default='')
  234. plugin.add_cmdlineoption('-c', '', 'crit', 'OBSOLETE - use new syntax!', default='')
  235. plugin.parse_cmdlineoptions()
  236. plugin.prepare_snmp()
  237. if plugin.options.check or plugin.options.target:
  238. import sys
  239. arguments = plugin.options.check
  240. for s in [plugin.options.target, plugin.options.warn, plugin.options.crit]:
  241. arguments += ':' + s
  242. plugin.back2nagios(3, 'Obsolete syntax - please use new syntax: "%s %s"' % (sys.argv[0], arguments))
  243. checks = []
  244. for quad in plugin.args:
  245. quad = quad.split(':')
  246. quad = (quad + ['', '', ''])[:4] # Fix length to 4, fill with ''
  247. # Convert list of checks to list
  248. if ',' in quad[0]:
  249. quad[0] = quad[0].split(',')
  250. else:
  251. quad[0] = [quad[0],]
  252. # Convert list of targets to list
  253. if ',' in quad[1]:
  254. quad[1] = quad[1].split(',')
  255. else:
  256. quad[1] = [quad[1],]
  257. for target in quad[1]:
  258. for check in quad[0]:
  259. checks.append(tuple([check, target, quad[2], quad[3]]))
  260. if len(checks) == 0:
  261. plugin.back2nagios(3, 'No check specified!')
  262. for quad in checks:
  263. (check, target, warn, crit) = tuple(quad)
  264. if check == 'global':
  265. result = plugin.check_global()
  266. elif check == 'cpu':
  267. result = plugin.check_cpu(warn=warn, crit=crit)
  268. elif check == 'disk':
  269. result = plugin.check_disk(target=target, warn=warn, crit=crit)
  270. elif check == 'nvram':
  271. result = plugin.check_nvram()
  272. elif check == 'version':
  273. result = plugin.check_version()
  274. elif check == 'vol_data':
  275. result = plugin.check_vol_data(volume=target, warn=warn, crit=crit)
  276. elif check == 'vol_snap':
  277. result = plugin.check_vol_snap(volume=target, warn=warn, crit=crit)
  278. elif check =='vol_inode':
  279. result = plugin.check_vol_inode(volume=target, warn=warn, crit=crit)
  280. elif check =='vol_files':
  281. result = plugin.check_vol_files(volume=target, warn=warn, crit=crit)
  282. # from pprint import pprint
  283. # pprint(plugin.dump_brain())
  284. plugin.brain2output()
  285. plugin.exit()
  286. if __name__ == '__main__':
  287. main()
  288. #vim: ts=4 sw=4 foldmethod=indent