858 lines
33 KiB
Python
Executable File
858 lines
33 KiB
Python
Executable File
#!/usr/bin/env python3
|
|
"""SNMP based Synology DMS / DMS UC checks"""
|
|
"""dependencys:
|
|
- pip3 install nagiosplugin
|
|
- pip3 install argparse
|
|
- pip3 install easysnmp
|
|
- https://easysnmp.readthedocs.io/en/latest/index.html
|
|
- https://easysnmp.readthedocs.io/en/latest/session_api.html
|
|
"""
|
|
|
|
__version__ = '0.13.1'
|
|
__author__ = 'anima'
|
|
|
|
# imports
|
|
import logging
|
|
import argparse
|
|
import nagiosplugin
|
|
from easysnmp import Session
|
|
|
|
# log settings
|
|
logging.basicConfig(format='[%(asctime)s] %(levelname)s %(message)s', level=logging.INFO)
|
|
|
|
def init_snmp_session(hostname: str = 'localhost', snmp_version: str | int = '2', snmp_community: str = 'public',
|
|
snmp_security_level: str = 'auth_with_privacy', snmp_security_username: str = 'monitoring',
|
|
snmp_auth_protocol: str = 'SHA256', snmp_auth_password: str | None = None,
|
|
snmp_privacy_protocol: str = 'AES', snmp_privacy_password: str | None = None
|
|
) -> Session:
|
|
"""init a easysnmp session
|
|
|
|
Args:
|
|
hostname (str, optional): hostname or ip of host. Defaults to 'localhost'.
|
|
snmp_version (str, optional): version of snmp (1, 2, 3). Defaults to 2.
|
|
snmp_community (str, only need for v1 & v2): snmp community if snmp v1 or v2 used (any). Defaults to 'public'.
|
|
snmp_security_level (str, only need for v3): security level (no_auth_or_privacy, auth_without_privacy or auth_with_privacy). Defaults to 'auth_with_privacy'.
|
|
snmp_security_username (str, only need for v3): security name (any). Defaults to 'monitoring'.
|
|
snmp_auth_protocol (str, only need for v3): authentication protocol (MD5, SHA256, SHA512). Defaults to 'SHA256'.
|
|
snmp_auth_password (str, only need for v3): authentication passphrase (any). Defaults to None.
|
|
snmp_privacy_protocol (str, only need for v3): privacy protocol (AES, DES). Defaults to 'AES'.
|
|
snmp_privacy_password (str, only need for v3): privacy passphrase (any). Defaults to None.
|
|
|
|
Return:
|
|
easysnmp.Session: session for get or walk actions
|
|
"""
|
|
# check if snmp version an valid str or int and saves as int
|
|
valid_versions: list[str, int] = ['1','2','3', 1, 2, 3]
|
|
if snmp_version not in valid_versions:
|
|
raise ValueError(f'{snmp_version=} non of {valid_versions=}')
|
|
else:
|
|
snmp_version = int(snmp_version)
|
|
|
|
if snmp_version == '3':
|
|
# check if snmp security level valid
|
|
valid_security_levels: list[str] = ['no_auth_or_privacy', 'auth_without_privacy', 'auth_with_privacy']
|
|
if snmp_security_level not in valid_security_levels:
|
|
raise ValueError(f'{snmp_security_level=} is non of {valid_security_levels=}')
|
|
|
|
# check if auth protocol valid
|
|
if snmp_security_level.startswith('auth'):
|
|
valid_auth_protocols: list[str] = ['MD5', 'SHA', 'SHA256', 'SHA512']
|
|
if snmp_auth_protocol not in valid_auth_protocols:
|
|
raise ValueError(f'{snmp_auth_protocol=} is non of {valid_auth_protocols=}')
|
|
|
|
if snmp_auth_password is None:
|
|
raise ValueError(f'{snmp_auth_password=} is not set')
|
|
|
|
# check if privacy protocol valid
|
|
if not snmp_security_level.startswith('no'):
|
|
valid_privacy_protocols: list[str] = ['AES', 'DES']
|
|
if snmp_privacy_protocol not in valid_privacy_protocols:
|
|
raise ValueError(f'{snmp_privacy_protocol=} is non of {valid_privacy_protocols=}')
|
|
|
|
if snmp_privacy_password is None:
|
|
raise ValueError(f'{snmp_privacy_password=} is not set')
|
|
|
|
|
|
if snmp_version == 3: # 2025-01-02: only 'auth_with_privacy' is tested
|
|
session = Session(hostname=hostname, version=snmp_version,
|
|
security_level=snmp_security_level, security_username=snmp_security_username,
|
|
privacy_protocol=snmp_privacy_protocol, privacy_password=snmp_privacy_password,
|
|
auth_protocol=snmp_auth_protocol, auth_password=snmp_auth_password)
|
|
else:
|
|
session = Session(hostname=hostname, version=snmp_version, community=snmp_community)
|
|
return session
|
|
|
|
|
|
#
|
|
# Synology [DSM & DSM UC] Checks disk staus (baseclass)
|
|
#
|
|
class SNMPSynologyDisk():
|
|
def __init__(self, session):
|
|
self.session = session
|
|
|
|
def get_disks(self):
|
|
disks = list()
|
|
baseoid = '.1.3.6.1.4.1.6574.2.1.1'
|
|
oids = dict()
|
|
oids['index'] = '1'
|
|
oids['id'] = '2'
|
|
oids['model'] = '3'
|
|
oids['type'] = '4'
|
|
oids['status'] = '5'
|
|
oids['temp'] = '6'
|
|
oids['role'] = '7'
|
|
oids['retry'] = '8'
|
|
oids['badSectors'] = '9'
|
|
oids['identFail'] = '10'
|
|
oids['remainLife'] = '11'
|
|
oids['name'] = '12'
|
|
oids['health'] = '13'
|
|
|
|
disk_ids = list()
|
|
results = self.session.walk(baseoid)
|
|
for result in results:
|
|
if '6574.2.1.1.1.' in result.oid:
|
|
disk_ids.append(result.value)
|
|
|
|
for disk in disk_ids:
|
|
tmp_disk = dict()
|
|
for result in results:
|
|
for name, oid in oids.items():
|
|
if '6574.2.1.1.' + oid + '.' + disk in result.oid:
|
|
tmp_disk[name] = result.value
|
|
break
|
|
disks.append(tmp_disk)
|
|
|
|
return disks
|
|
|
|
|
|
#
|
|
# Synology [DSM & DSM UC] Checks raids (baseclass)
|
|
#
|
|
class SNMPSynologyRaid():
|
|
def __init__(self, session):
|
|
self.session = session
|
|
|
|
def get_raids(self):
|
|
raids = list()
|
|
baseoid = '.1.3.6.1.4.1.6574.3'
|
|
oids = dict()
|
|
oids['index'] = '1'
|
|
oids['name'] = '2'
|
|
oids['status'] = '3'
|
|
oids['free'] = '4'
|
|
oids['total'] = '5'
|
|
oids['hotspare'] = '6'
|
|
|
|
raid_ids = list()
|
|
results = self.session.walk(baseoid)
|
|
for result in results:
|
|
if '6574.3.1.1.1.' in result.oid:
|
|
raid_ids.append(result.value)
|
|
|
|
for raid in raid_ids:
|
|
tmp_raid = dict()
|
|
for result in results:
|
|
for name, oid in oids.items():
|
|
if '6574.3.1.1.' + oid + '.' + raid in result.oid:
|
|
tmp_raid[name] = result.value
|
|
break
|
|
raids.append(tmp_raid)
|
|
|
|
return raids
|
|
|
|
|
|
#
|
|
# Synology General Summary
|
|
#
|
|
|
|
class SNMPSynologySummary(nagiosplugin.Summary):
|
|
def verbose(self, results):
|
|
result_str = ''
|
|
for result in results:
|
|
result_str += f'{str(result)}\n'
|
|
return result_str
|
|
|
|
def ok(self, results):
|
|
return
|
|
|
|
def problem(self, results):
|
|
return
|
|
|
|
|
|
|
|
|
|
#
|
|
# Synology [DSM & DSM UC] System partition status.
|
|
#
|
|
class SNMPSynologySystemResource(nagiosplugin.Resource):
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
def probe(self) -> list:
|
|
"""check system status (normal or failed)
|
|
|
|
Returns:
|
|
nagiosplugin.Metric: single metric element (return)
|
|
"""
|
|
baseoid = '.1.3.6.1.4.1.6574.1'
|
|
oids = dict()
|
|
oids['status'] = '.1.0'
|
|
oids['model'] = '.5.1.0'
|
|
oids['sn'] = '.5.2.0'
|
|
# oids['hostname'] = '.1.0'
|
|
|
|
result = dict()
|
|
for key, oid in oids.items():
|
|
result[key] = self.session.get(baseoid + oid).value
|
|
return nagiosplugin.Metric(name='status', value=result, context='system_context')
|
|
|
|
|
|
class SNMPSynologySystemContext(nagiosplugin.Context):
|
|
def __init__(self, name):
|
|
super().__init__(name, fmt_metric='{name} is', result_cls=SNMPSynologySystemResult)
|
|
|
|
def evaluate(self, metric, resource):
|
|
if metric.value['status'] == '2':
|
|
return self.result_cls(nagiosplugin.Critical, "critical", metric)
|
|
elif metric.value['status'] == '1':
|
|
return self.result_cls(nagiosplugin.Ok, "ok", metric)
|
|
return self.result_cls(nagiosplugin.Unknown, "unknown", metric)
|
|
|
|
|
|
class SNMPSynologySystemResult(nagiosplugin.Result):
|
|
def __str__(self):
|
|
if self.metric.value['status'] == '1': status = 'normal'
|
|
else: status = 'failed'
|
|
return f'{self.metric.value["model"]} (SN: {self.metric.value["sn"]}) is in status {status}!'
|
|
|
|
|
|
#
|
|
# Synology [DSM & DSM UC] Temperature of NAS
|
|
#
|
|
class SNMPSynologyTemperatureResource(nagiosplugin.Resource, SNMPSynologyDisk):
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
def probe(self) -> list:
|
|
"""check system temperature in °C
|
|
|
|
Returns:
|
|
nagiosplugin.Metric: single metric element (return)
|
|
"""
|
|
baseoid = '.1.3.6.1.4.1.6574.1'
|
|
oids = dict()
|
|
result = self.session.get(baseoid + '.2.0').value
|
|
yield nagiosplugin.Metric(name='temp_system', value=int(result), uom='°C', context='temperature_scalar_context')
|
|
disks = self.get_disks()
|
|
for disk in disks:
|
|
yield nagiosplugin.Metric(name='temp_' + disk['id'].lower().replace(' ', '_'), value=int(disk['temp']), uom='°C', context='temperature_scalar_context')
|
|
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
|
|
#
|
|
# Synology [DSM & DSM UC] Returns error if power supplies fail
|
|
#
|
|
class SNMPSynologyPowerSupplyResource(nagiosplugin.Resource):
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
def probe(self) -> list:
|
|
"""check power supply status (normal or failed)
|
|
|
|
Returns:
|
|
nagiosplugin.Metric: single metric element (return)
|
|
"""
|
|
baseoid = '.1.3.6.1.4.1.6574.1'
|
|
result = self.session.get(baseoid + '.3.0').value
|
|
return nagiosplugin.Metric(name='status', value=result, context='powersupply_context')
|
|
|
|
|
|
class SNMPSynologyPowerSupplyContext(nagiosplugin.Context):
|
|
def __init__(self, name):
|
|
super().__init__(name, fmt_metric='{name} is', result_cls=SNMPSynologyPowerSupplyResult)
|
|
|
|
def evaluate(self, metric, resource):
|
|
if metric.value == '2':
|
|
return self.result_cls(nagiosplugin.Critical, "critical", metric)
|
|
elif metric.value == '1':
|
|
return self.result_cls(nagiosplugin.Ok, "ok", metric)
|
|
return self.result_cls(nagiosplugin.Unknown, "unknown", metric)
|
|
|
|
|
|
class SNMPSynologyPowerSupplyResult(nagiosplugin.Result):
|
|
def __str__(self):
|
|
if self.metric.value == '1': status = 'normal'
|
|
else: status = 'failed'
|
|
return f'Power Supply is in status {status}!'
|
|
|
|
|
|
#
|
|
# Synology [DSM & DSM UC] returns error if system fan fails
|
|
#
|
|
class SNMPSynologyFansResource(nagiosplugin.Resource):
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
def probe(self) -> list:
|
|
"""check fans status (normal or failed)
|
|
|
|
Returns:
|
|
Generator[nagisplugin.Metric]: multiple metric elements (yield)
|
|
"""
|
|
baseoid = '.1.3.6.1.4.1.6574.1'
|
|
fans = dict()
|
|
fans['system'] = '.4.1.0'
|
|
fans['cpu'] = '.4.2.0'
|
|
|
|
for fan, oid in fans.items():
|
|
result = self.session.get(baseoid + oid).value
|
|
yield nagiosplugin.Metric(name=fan, value=result, context='fan_context')
|
|
|
|
|
|
class SNMPSynologyFansContext(nagiosplugin.Context):
|
|
def __init__(self, name):
|
|
super().__init__(name, fmt_metric='{name} is', result_cls=SNMPSynologyFansResult)
|
|
|
|
def evaluate(self, metric, resource):
|
|
if metric.value == '2':
|
|
return self.result_cls(nagiosplugin.Critical, "critical", metric)
|
|
elif metric.value == '1':
|
|
return self.result_cls(nagiosplugin.Ok, "ok", metric)
|
|
return self.result_cls(nagiosplugin.Unknown, "unknown", metric)
|
|
|
|
|
|
class SNMPSynologyFansResult(nagiosplugin.Result):
|
|
def __str__(self):
|
|
if self.metric.value == '1': status = 'normal'
|
|
else: status = 'failed'
|
|
return f'{self.metric.name} fan is in status {status}!'
|
|
|
|
|
|
#
|
|
# Synology [DSM & DSM UC] Checks whether a new version or update of DSM is available
|
|
#
|
|
class SNMPSynologyFirmwareResource(nagiosplugin.Resource):
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
def probe(self) -> list:
|
|
"""check if firmware update available
|
|
|
|
Returns:
|
|
nagiosplugin.Metric: single metric element (return)
|
|
"""
|
|
baseoid = '.1.3.6.1.4.1.6574.1'
|
|
oids = dict()
|
|
oids['version'] = '.5.3.0'
|
|
oids['status'] = '.5.4.0'
|
|
oids['model'] = '.5.1.0'
|
|
oids['sn'] = '.5.2.0'
|
|
|
|
result = dict()
|
|
for key, oid in oids.items():
|
|
result[key] = self.session.get(baseoid + oid).value
|
|
return nagiosplugin.Metric(name='status', value=result, context='firmware_context')
|
|
|
|
|
|
class SNMPSynologyFirmwareContext(nagiosplugin.Context):
|
|
def __init__(self, name):
|
|
super().__init__(name, fmt_metric='{name} is', result_cls=SNMPSynologyFirmwareResult)
|
|
|
|
def evaluate(self, metric, resource):
|
|
if metric.value['status'] == '1':
|
|
return self.result_cls(nagiosplugin.Critical, "critical", metric)
|
|
elif metric.value['status'] == '2':
|
|
return self.result_cls(nagiosplugin.Ok, "ok", metric)
|
|
elif metric.value['status'] in ['3', '4']:
|
|
return self.result_cls(nagiosplugin.Warn, "warning", metric)
|
|
return self.result_cls(nagiosplugin.Unknown, "unknown", metric)
|
|
|
|
|
|
class SNMPSynologyFirmwareResult(nagiosplugin.Result):
|
|
def __str__(self):
|
|
if self.metric.value['status'] == '1': status = 'available'
|
|
elif self.metric.value['status'] == '2': status = 'up2date'
|
|
elif self.metric.value['status'] == '3': status = 'connecting'
|
|
elif self.metric.value['status'] == '4': status = 'disconnected'
|
|
else: status = 'unknown'
|
|
return f'Firmware of {self.metric.value["model"]} (SN: {self.metric.value["sn"]}; Version: {self.metric.value["version"]}) is in status {status}!'
|
|
|
|
|
|
#
|
|
# Synology [DSM] Utilization % is the sum of user and system CPU usage
|
|
#
|
|
class SNMPSynologyCPUResource(nagiosplugin.Resource):
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
def probe(self) -> list:
|
|
"""check cpu usage %
|
|
|
|
Returns:
|
|
nagiosplugin.Metric: single metric element (return)
|
|
"""
|
|
baseoid = '.1.3.6.1.4.1.6574.1'
|
|
result = self.session.get(baseoid + '.7.1.0').value
|
|
return nagiosplugin.Metric(name='cpu', value=int(result), uom='%', context='cpu_scalar_context')
|
|
|
|
|
|
#
|
|
# Synology [DSM] Utilization % is the sum of user and system CPU usage
|
|
#
|
|
class SNMPSynologyMemoryResource(nagiosplugin.Resource):
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
def probe(self) -> list:
|
|
"""check memory usage in %
|
|
|
|
Returns:
|
|
nagiosplugin.Metric: single metric element (return)
|
|
"""
|
|
baseoid = '.1.3.6.1.4.1.6574.1'
|
|
result = self.session.get(baseoid + '.7.2.0').value
|
|
return nagiosplugin.Metric(name='memory', value=int(result), uom='%', context='memory_scalar_context')
|
|
|
|
|
|
#
|
|
# Synology [DSM & DSM UC] Checks disks
|
|
#
|
|
class SNMPSynologyDiskRetryResource(nagiosplugin.Resource, SNMPSynologyDisk):
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
def probe(self) -> list:
|
|
"""check staus and health of all disks
|
|
|
|
Returns:
|
|
Generator[nagisplugin.Metric]: multiple metric elements (yield)
|
|
"""
|
|
disks = self.get_disks()
|
|
for disk in disks:
|
|
yield nagiosplugin.Metric(name=disk['id'], value=int(disk['retry']), uom=' retrys', context='disk_retry_scalar_context')
|
|
|
|
|
|
class SNMPSynologyDiskIdentResource(nagiosplugin.Resource, SNMPSynologyDisk):
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
def probe(self) -> list:
|
|
"""check staus and health of all disks
|
|
|
|
Returns:
|
|
Generator[nagisplugin.Metric]: multiple metric elements (yield)
|
|
"""
|
|
disks = self.get_disks()
|
|
for disk in disks:
|
|
yield nagiosplugin.Metric(name=disk['id'], value=int(disk['identFail']), uom=' fails', context='disk_ident_scalar_context')
|
|
|
|
|
|
class SNMPSynologyDiskLifeResource(nagiosplugin.Resource, SNMPSynologyDisk):
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
def probe(self) -> list:
|
|
"""check staus and health of all disks
|
|
|
|
Returns:
|
|
Generator[nagisplugin.Metric]: multiple metric elements (yield)
|
|
"""
|
|
disks = self.get_disks()
|
|
for disk in disks:
|
|
yield nagiosplugin.Metric(name=disk['id'], value=int(disk['remainLife']), uom=' remaining life', context='disk_life_scalar_context')
|
|
|
|
|
|
class SNMPSynologyDiskSectorsResource(nagiosplugin.Resource, SNMPSynologyDisk):
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
def probe(self) -> list:
|
|
"""check staus and health of all disks
|
|
|
|
Returns:
|
|
Generator[nagisplugin.Metric]: multiple metric elements (yield)
|
|
"""
|
|
disks = self.get_disks()
|
|
for disk in disks:
|
|
yield nagiosplugin.Metric(name=disk['id'], value=int(disk['badSectors']), uom=' bad sectors', context='disk_sectors_scalar_context')
|
|
|
|
|
|
class SNMPSynologyDiskHealthResource(nagiosplugin.Resource, SNMPSynologyDisk):
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
def probe(self) -> list:
|
|
"""check staus and health of all disks
|
|
|
|
Returns:
|
|
Generator[nagisplugin.Metric]: multiple metric elements (yield)
|
|
"""
|
|
disks = self.get_disks()
|
|
for disk in disks:
|
|
yield nagiosplugin.Metric(name=disk['id'], value=disk, context='disk_status_context')
|
|
yield nagiosplugin.Metric(name=disk['id'], value=disk, context='disk_health_context')
|
|
|
|
|
|
|
|
class SNMPSynologyDiskStatusContext(nagiosplugin.Context):
|
|
def __init__(self, name):
|
|
super().__init__(name, fmt_metric='{name} is', result_cls=SNMPSynologyDiskStatusResult)
|
|
|
|
def evaluate(self, metric, resource):
|
|
if metric.value['status'] in ['4', '5']:
|
|
return self.result_cls(nagiosplugin.Critical, "critical", metric)
|
|
elif metric.value['status'] in ['2', '3']:
|
|
return self.result_cls(nagiosplugin.Warn, "warning", metric)
|
|
elif metric.value['status'] == '1':
|
|
return self.result_cls(nagiosplugin.Ok, "ok", metric)
|
|
return self.result_cls(nagiosplugin.Unknown, "unknown", metric)
|
|
|
|
|
|
class SNMPSynologyDiskStatusResult(nagiosplugin.Result):
|
|
def __str__(self):
|
|
if self.metric.value['status'] == '1': status = 'Normal'
|
|
elif self.metric.value['status'] == '2': status = 'Initialized'
|
|
elif self.metric.value['status'] == '3': status = 'NotInitialized'
|
|
elif self.metric.value['status'] == '4': status = 'SystemPartitionFailed'
|
|
elif self.metric.value['status'] == '5': status = 'Crashed'
|
|
else: status = 'unknown'
|
|
return f'{self.metric.name} (model: {self.metric.value["model"]} - {self.metric.value["type"]}) (role: {self.metric.value["role"]}) is in status {status}!'
|
|
|
|
|
|
class SNMPSynologyDiskHealthContext(nagiosplugin.Context):
|
|
def __init__(self, name):
|
|
super().__init__(name, fmt_metric='{name} is', result_cls=SNMPSynologyDiskHealthResult)
|
|
|
|
def evaluate(self, metric, resource):
|
|
if metric.value['health'] in ['3', '4']:
|
|
return self.result_cls(nagiosplugin.Critical, "critical", metric)
|
|
elif metric.value['health'] == '2':
|
|
return self.result_cls(nagiosplugin.Warn, "warning", metric)
|
|
elif metric.value['health'] == '1':
|
|
return self.result_cls(nagiosplugin.Ok, "ok", metric)
|
|
return self.result_cls(nagiosplugin.Unknown, "unknown", metric)
|
|
|
|
|
|
class SNMPSynologyDiskHealthResult(nagiosplugin.Result):
|
|
def __str__(self):
|
|
if self.metric.value['health'] == '1': status = 'Normal'
|
|
elif self.metric.value['health'] == '2': status = 'Warning'
|
|
elif self.metric.value['health'] == '3': status = 'Critical'
|
|
elif self.metric.value['health'] == '4': status = 'Failing'
|
|
else: status = 'unknown'
|
|
return f'Health of {self.metric.name} is in status {status}!'
|
|
|
|
|
|
#
|
|
# Synology [DSM & DSM UC] Checks RAID status
|
|
#
|
|
class SNMPSynologyRaidSpaceResource(nagiosplugin.Resource, SNMPSynologyRaid):
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
def probe(self) -> list:
|
|
"""check memory usage in %
|
|
|
|
Returns:
|
|
Generator[nagisplugin.Metric]: multiple metric elements (yield)
|
|
"""
|
|
raids = self.get_raids()
|
|
for raid in raids:
|
|
# skip storage pools because they already full of there volumes
|
|
# works only with default naming maybe as argument ?
|
|
if raid['name'].startswith('Storage Pool'):
|
|
continue
|
|
used_space_in_percent = 100 - int(int(raid['free']) / int(raid['total']) * 100)
|
|
yield nagiosplugin.Metric(name='raid_' + raid["name"].lower().replace(' ', '_'), value=used_space_in_percent, uom='%', context='raid_space_scalar_context')
|
|
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
|
|
class SNMPSynologyRaidStatusResource(nagiosplugin.Resource, SNMPSynologyRaid):
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
def probe(self) -> list:
|
|
"""check staus and health of all raids
|
|
|
|
Returns:
|
|
Generator[nagisplugin.Metric]: multiple metric elements (yield)
|
|
"""
|
|
raids = self.get_raids()
|
|
for raid in raids:
|
|
yield nagiosplugin.Metric(name=raid['name'], value=raid, context='raid_status_context')
|
|
|
|
|
|
|
|
class SNMPSynologyRaidStatusContext(nagiosplugin.Context):
|
|
def __init__(self, name):
|
|
super().__init__(name, fmt_metric='{name} is', result_cls=SNMPSynologyRaidStatusResult)
|
|
|
|
def evaluate(self, metric, resource):
|
|
if metric.value['status'] in ['12', '18']:
|
|
return self.result_cls(nagiosplugin.Critical, "critical", metric)
|
|
elif 2 <= int(metric.value['status']) <= 21:
|
|
return self.result_cls(nagiosplugin.Warn, "warning", metric)
|
|
elif metric.value['status'] == '1':
|
|
return self.result_cls(nagiosplugin.Ok, "ok", metric)
|
|
return self.result_cls(nagiosplugin.Unknown, "unknown", metric)
|
|
|
|
|
|
class SNMPSynologyRaidStatusResult(nagiosplugin.Result):
|
|
def __str__(self):
|
|
if self.metric.value['status'] == '1': status = 'Normal'
|
|
elif self.metric.value['status'] == '2': status = 'Repairing'
|
|
elif self.metric.value['status'] == '3': status = 'Migrating'
|
|
elif self.metric.value['status'] == '4': status = 'Expanding'
|
|
elif self.metric.value['status'] == '5': status = 'Deleting'
|
|
elif self.metric.value['status'] == '6': status = 'Creating'
|
|
elif self.metric.value['status'] == '7': status = 'RaidSyncing'
|
|
elif self.metric.value['status'] == '8': status = 'RaidParityChecking'
|
|
elif self.metric.value['status'] == '9': status = 'RaidAssembling'
|
|
elif self.metric.value['status'] == '10': status = 'Canceling'
|
|
elif self.metric.value['status'] == '11': status = 'Degrade'
|
|
elif self.metric.value['status'] == '12': status = 'Crashed'
|
|
elif self.metric.value['status'] == '13': status = 'DataScrubbing'
|
|
elif self.metric.value['status'] == '14': status = 'RaidDeploying'
|
|
elif self.metric.value['status'] == '15': status = 'RaidUnDeploying'
|
|
elif self.metric.value['status'] == '16': status = 'RaidMountCache'
|
|
elif self.metric.value['status'] == '17': status = 'RaidUnmountCache'
|
|
elif self.metric.value['status'] == '18': status = 'RaidExpandingUnnishedSHR'
|
|
elif self.metric.value['status'] == '19': status = 'RaidConvertSHRToPool'
|
|
elif self.metric.value['status'] == '20': status = 'RaidMigrateSHR1ToSHR2'
|
|
elif self.metric.value['status'] == '21': status = 'RaidUnknownStatus'
|
|
else: status = 'unknown'
|
|
return f'{self.metric.name} is in status {status}!'
|
|
|
|
|
|
#
|
|
# Synology [DSM & DSM UC] UPS staus (paused, not done)
|
|
#
|
|
class SNMPSynologyUPSResource(nagiosplugin.Resource):
|
|
def __init__(self, session) -> None:
|
|
self.session = session
|
|
|
|
def probe(self) -> list:
|
|
"""check ups status
|
|
|
|
Returns:
|
|
nagiosplugin.Metric: single metric element (return)
|
|
"""
|
|
baseoid = '1.3.6.1.4.1.6574.4'
|
|
# data = self.session.walk(baseoid)
|
|
# not sure if this value time remaining ...
|
|
time_until_empty = self.session.get(baseoid + '.3.6.1.0').value
|
|
# not shure what (for my ups) satus 'OL' says, maybe "online" ?
|
|
ups = dict()
|
|
|
|
ups['status'] = self.session.get(baseoid + '.2.1.0').value
|
|
ups['model'] = self.session.get(baseoid + '.1.1.0').value
|
|
ups['serial'] = self.session.get(baseoid + '.1.3.0').value
|
|
return nagiosplugin.Metric(name='ups_' + ups["model"].lower().replace(' ', '_'), value=ups, context='ups_context')
|
|
|
|
|
|
|
|
class SNMPSynologyUPSContext(nagiosplugin.Context):
|
|
def __init__(self, name):
|
|
super().__init__(name, fmt_metric='{name} is', result_cls=SNMPSynologyUPSResult)
|
|
|
|
def evaluate(self, metric, resource):
|
|
if metric.value['status'] == '?':
|
|
return self.result_cls(nagiosplugin.Critical, "critical", metric)
|
|
elif metric.value['status'] == '?':
|
|
return self.result_cls(nagiosplugin.Warn, "warning", metric)
|
|
elif metric.value['status'] == 'OL':
|
|
return self.result_cls(nagiosplugin.Ok, "ok", metric)
|
|
return self.result_cls(nagiosplugin.Unknown, "unknown", metric)
|
|
|
|
|
|
class SNMPSynologyUPSResult(nagiosplugin.Result):
|
|
def __str__(self):
|
|
if self.metric.value['status'] == 'OL': status = 'Online' # ?
|
|
else: status = 'unknown'
|
|
return f'{self.metric.name} is in status {status}!'
|
|
|
|
|
|
#
|
|
# Arguments
|
|
#
|
|
def parse_args() -> argparse.Namespace:
|
|
"""evaluates given arguments
|
|
|
|
Returns:
|
|
argsparse.Namespace: Namespace Object with all arguments insert (use: args.long_name_of_argument)
|
|
"""
|
|
argp = argparse.ArgumentParser(description=__doc__)
|
|
# Default args
|
|
argp.add_argument('-v', '--verbose', action='count', default=0,
|
|
help='increase output verbosity (use up to 3 times)')
|
|
argp.add_argument('-H', '--hostname', default='localhost',
|
|
help='IP address or hostname of device to query')
|
|
argp.add_argument('-t', '--timeout', default=30,
|
|
help='abort execution after TIMEOUT seconds')
|
|
# TEMPLATE TODO: edit choices
|
|
argp.add_argument('-m', '--check_mode',
|
|
choices=[
|
|
'system',
|
|
'temperature',
|
|
'powersupply',
|
|
'fans',
|
|
'firmware',
|
|
'cpu',
|
|
'memory',
|
|
'disk',
|
|
'disk_retry',
|
|
'disk_ident',
|
|
'disk_life',
|
|
'disk_sectors',
|
|
'raid',
|
|
'raid_space',
|
|
'ups',
|
|
'smart',
|
|
],
|
|
help='check mode to run')
|
|
|
|
# Nagios args / see https://nagios-plugins.org/doc/guidelines.html#THRESHOLDFORMAT
|
|
argp.add_argument('-w', '--warning', default=':80',
|
|
help='warning threshold')
|
|
argp.add_argument('-c', '--critical', default=':90',
|
|
help='critical threshold')
|
|
|
|
# SNMP args (same -* as snmpwalk / snmpget linux command; exept -C/-c & -V /-v because already used (see above))
|
|
argp.add_argument('-V', '--snmp-version', default='2',
|
|
help='Used SNMP Version. (1, 2, 3)')
|
|
argp.add_argument('-C', '--snmp_community', default='public',
|
|
help='SNMP community if snmp v1 or v2 used (any).')
|
|
argp.add_argument('-l', '--snmp-security-level', default='auth_with_privacy',
|
|
help='Security level (no_auth_or_privacy, auth_without_privacy or auth_with_privacy)')
|
|
argp.add_argument('-u', '--snmp-security-username', default='monitoring',
|
|
help='Security name (any)')
|
|
argp.add_argument('-a', '--snmp-auth-protocol', default='SHA256',
|
|
help='Authentication protocol (MD5, SHA256, SHA512)')
|
|
argp.add_argument('-A', '--snmp-auth-pass', default=None,
|
|
help='Authentication passphrase (any)')
|
|
argp.add_argument('-x', '--snmp-privacy-protocol', default='AES',
|
|
help='Privacy protocol (AES, DES)')
|
|
argp.add_argument('-X', '--snmp-privacy-pass', default=None,
|
|
help='Privacy passphrase (any)')
|
|
|
|
args = argp.parse_args()
|
|
return args
|
|
|
|
#
|
|
# init
|
|
#
|
|
def main():
|
|
args = parse_args()
|
|
if args.verbose >= 3:
|
|
logging.getLogger().setLevel(logging.DEBUG)
|
|
|
|
session = init_snmp_session(hostname=args.hostname, snmp_version=args.snmp_version, snmp_community=args.snmp_community,
|
|
snmp_security_level=args.snmp_security_level, snmp_security_username=args.snmp_security_username,
|
|
snmp_auth_protocol=args.snmp_auth_protocol, snmp_auth_password=args.snmp_auth_pass,
|
|
snmp_privacy_protocol=args.snmp_privacy_protocol, snmp_privacy_password=args.snmp_privacy_pass)
|
|
|
|
# dice which check will be run bases on check_mode
|
|
match args.check_mode:
|
|
case 'system':
|
|
check = nagiosplugin.Check(
|
|
SNMPSynologySystemResource(session=session),
|
|
SNMPSynologySystemContext(name='system_context'),
|
|
nagiosplugin.Summary())
|
|
check.name = "System Status"
|
|
case 'temperature':
|
|
check = nagiosplugin.Check(
|
|
SNMPSynologyTemperatureResource(session=session),
|
|
nagiosplugin.ScalarContext(name='temperature_scalar_context', warning=args.warning, critical=args.critical),
|
|
nagiosplugin.Summary())
|
|
check.name = "System Temperature"
|
|
case 'powersupply':
|
|
check = nagiosplugin.Check(
|
|
SNMPSynologyPowerSupplyResource(session=session),
|
|
SNMPSynologyPowerSupplyContext(name='powersupply_context'),
|
|
nagiosplugin.Summary())
|
|
check.name = "Power Supply Status"
|
|
case 'fans':
|
|
check = nagiosplugin.Check(
|
|
SNMPSynologyFansResource(session=session),
|
|
SNMPSynologyFansContext(name='fan_context'),
|
|
SNMPSynologySummary())
|
|
check.name = "Fans Status"
|
|
case 'firmware':
|
|
check = nagiosplugin.Check(
|
|
SNMPSynologyFirmwareResource(session=session),
|
|
SNMPSynologyFirmwareContext(name='firmware_context'),
|
|
nagiosplugin.Summary())
|
|
check.name = "Firmware"
|
|
case 'cpu':
|
|
check = nagiosplugin.Check(
|
|
SNMPSynologyCPUResource(session=session),
|
|
nagiosplugin.ScalarContext(name='cpu_scalar_context', warning=args.warning, critical=args.critical),
|
|
nagiosplugin.Summary())
|
|
check.name = "CPU Usage"
|
|
case 'memory':
|
|
check = nagiosplugin.Check(
|
|
SNMPSynologyMemoryResource(session=session),
|
|
nagiosplugin.ScalarContext(name='memory_scalar_context', warning=args.warning, critical=args.critical),
|
|
nagiosplugin.Summary())
|
|
check.name = "Memory Usage"
|
|
case 'disk':
|
|
check = nagiosplugin.Check(
|
|
SNMPSynologyDiskHealthResource(session=session),
|
|
SNMPSynologyDiskHealthContext(name='disk_health_context'),
|
|
SNMPSynologyDiskStatusContext(name='disk_status_context'),
|
|
SNMPSynologySummary())
|
|
check.name = "Disk Health"
|
|
case 'disk_retry':
|
|
check = nagiosplugin.Check(
|
|
SNMPSynologyDiskRetryResource(session=session),
|
|
nagiosplugin.ScalarContext(name='disk_retry_scalar_context', warning=args.warning, critical=args.critical),
|
|
nagiosplugin.Summary())
|
|
check.name = "Disk Connection Retrys"
|
|
case 'disk_life':
|
|
check = nagiosplugin.Check(
|
|
SNMPSynologyDiskLifeResource(session=session),
|
|
nagiosplugin.ScalarContext(name='disk_life_scalar_context', warning=args.warning, critical=args.critical),
|
|
nagiosplugin.Summary())
|
|
check.name = "Disk Remaining Life"
|
|
case 'disk_ident':
|
|
check = nagiosplugin.Check(
|
|
SNMPSynologyDiskIdentResource(session=session),
|
|
nagiosplugin.ScalarContext(name='disk_ident_scalar_context', warning=args.warning, critical=args.critical),
|
|
nagiosplugin.Summary())
|
|
check.name = "Disk IdentFail"
|
|
case 'disk_sectors':
|
|
check = nagiosplugin.Check(
|
|
SNMPSynologyDiskSectorsResource(session=session),
|
|
nagiosplugin.ScalarContext(name='disk_sectors_scalar_context', warning=args.warning, critical=args.critical),
|
|
nagiosplugin.Summary())
|
|
check.name = "Disk BadSectors"
|
|
case 'raid':
|
|
check = nagiosplugin.Check(
|
|
SNMPSynologyRaidStatusResource(session=session),
|
|
SNMPSynologyRaidStatusContext(name='raid_status_context'),
|
|
SNMPSynologySummary())
|
|
check.name = "Raid status"
|
|
case 'raid_space':
|
|
check = nagiosplugin.Check(
|
|
SNMPSynologyRaidSpaceResource(session=session),
|
|
nagiosplugin.ScalarContext(name='raid_space_scalar_context', warning=args.warning, critical=args.critical),
|
|
nagiosplugin.Summary())
|
|
check.name = "Raid space usage"
|
|
case 'ups':
|
|
check = nagiosplugin.Check(
|
|
SNMPSynologyUPSResource(session=session),
|
|
SNMPSynologyUPSContext(name='ups_context'),
|
|
SNMPSynologySummary())
|
|
check.name = "UPS status"
|
|
case _:
|
|
raise nagiosplugin.CheckError(f'Unknown check mode: {args.check_mode}')
|
|
|
|
check.main(args.verbose, args.timeout)
|
|
|
|
if __name__ == '__main__':
|
|
main() |