docker-storcli-prometheus/storcli.py

179 lines
6.7 KiB
Python
Raw Normal View History

2018-05-21 10:55:24 -06:00
#!/usr/bin/env python
"""
Based on storcli.py example from node_exporter, with substantial changes.
https://github.com/prometheus/node_exporter/blob/master/text_collector_examples/storcli.py
All metrics carry an additional cmd label (basename of the StorCLI binary).
megaraid_scrape_duration_seconds=gauge
megaraid_controllers{controller,model}=1
megaraid_controller_memory_errors{controller,correctable=y|n}=counter
megaraid_controller_bbu{controller}=0|1
megaraid_roc_temp_celcius{controller}=gauge
megaraid_virtual_drives{controller,vd,type,state=optimal|partially|degraded|offline}=1
megaraid_vd_size_bytes{controller,vd}=gauge
megaraid_physical_drives{controller,enclosure,slot,vd,state=online|offline|ugood|ubad|ghs|dhs}=1
megaraid_pd_size_bytes{controller,enclosure,slot}=gauge
"""
from __future__ import print_function
import argparse
import json
import os
import subprocess
import re
2018-06-21 12:18:38 -06:00
import time
2018-05-21 10:55:24 -06:00
from decimal import Decimal
DESCRIPTION = """Parses StorCLI's JSON output and exposes MegaRAID health as
Prometheus metrics."""
VERSION = '0.0.1'
def parse_size(size):
    """Convert a StorCLI size string such as '558.406 GB' into bytes.

    The numeric part may be an integer or a decimal number. The unit is
    ``B`` on its own or ``B`` preceded by one of the prefixes K, M, G, T,
    P, E; each prefix step is a factor of 1024.

    Returns the size as an int, truncating any fractional byte.

    Raises RuntimeError if the string does not have the expected form or
    uses an unsupported unit prefix.
    """
    match = re.match(r'(\d+(?:\.\d+)?) ([A-Z]?)B$', size)
    if match is None:
        # Fail with a readable message instead of an AttributeError on None.
        raise RuntimeError('unparseable size: {!r}'.format(size))
    number, prefix = match.groups()

    prefixes = 'KMGTPE'
    if prefix and prefix not in prefixes:
        raise RuntimeError('unsupported size unit')
    # No prefix means plain bytes (1024 ** 0); 'K' is 1024 ** 1, and so on.
    exponent = prefixes.index(prefix) + 1 if prefix else 0
    # Decimal keeps the multiplication exact before truncating to int.
    return int(Decimal(number) * 1024 ** exponent)
def _parse_controller(resp):
    """Turn one controller's 'Response Data' dict into metric records.

    Returns a ``(controller, vds, pds)`` tuple: one dict describing the
    controller, a list of dicts for its virtual drives and a list of dicts
    for its physical drives.
    """
    basics = resp['Basics']
    status = resp['Status']
    hwcfg = resp['HwCfg']
    ctrl_id = int(basics['Controller'])
    controller = {
        'controller': ctrl_id,
        'model': basics['Model'],
        'errors_correctable': int(status['Memory Correctable Errors']),
        'errors_uncorrectable': int(status['Memory Uncorrectable Errors']),
        'bbu': int(hwcfg['BBU'] != 'Absent'),
        # Reported as 0 when the controller exposes no ROC temperature.
        'roc_temp': int(hwcfg.get('ROC temperature(Degree Celsius)', 0)),
    }

    # Maps a drive group to its virtual drive so that each physical drive can
    # be labelled with the VD it belongs to. The '-' placeholder maps to None
    # (presumably StorCLI's marker for a drive outside any drive group).
    dg_vd_map = {'-': None}

    vds = []
    # A missing 'VD LIST' is treated as "no virtual drives".
    for vd in resp.get('VD LIST') or []:
        dg, vd_id = map(int, vd['DG/VD'].split('/'))
        # Keyed by drive group: this is what pd['DG'] is looked up with below.
        dg_vd_map[dg] = vd_id
        vds.append({
            'controller': ctrl_id,
            'vd': vd_id,
            'type': vd['TYPE'],
            'state': vd['State'].lower(),
            'size': parse_size(vd['Size']),
        })

    pds = []
    # A missing 'PD LIST' is treated as "no physical drives".
    for pd in resp.get('PD LIST') or []:
        enc, slot = map(int, pd['EID:Slt'].split(':'))
        pds.append({
            'controller': ctrl_id,
            'enclosure': enc,
            'slot': slot,
            # None (rendered as "None") when the drive group is unknown.
            'vd': dg_vd_map.get(pd['DG']),
            'state': pd['State'].lower(),
            'size': parse_size(pd['Size']),
        })

    return controller, vds, pds


def _print_metric(name, help_text, metric_type, template, rows, cmd):
    """Print the HELP/TYPE header of one metric and one sample per row.

    ``template`` is the label set plus value, formatted with ``cmd`` and the
    keys of each row dict.
    """
    print('# HELP {} {}'.format(name, help_text))
    print('# TYPE {} {}'.format(name, metric_type))
    for row in rows:
        print(name + template.format(cmd=cmd, **row))


def main(args):
    """Query StorCLI and print MegaRAID metrics in Prometheus text format.

    ``args`` must provide ``storcli_path``, the path to the StorCLI binary.
    Its basename is attached to every sample as the ``cmd`` label.
    Controllers without a 'Response Data' section are skipped, so only the
    HELP/TYPE headers and the scrape duration are printed when StorCLI is
    unavailable.
    """
    controllers = []
    vds = []
    pds = []

    # Time only the StorCLI invocation and JSON decoding.
    start = time.time()
    data = json.loads(get_storcli_json(args.storcli_path))
    end = time.time()

    cmd = os.path.split(args.storcli_path)[-1]

    for ctrl in data['Controllers']:
        resp = ctrl.get('Response Data')
        if not resp:
            continue
        controller, ctrl_vds, ctrl_pds = _parse_controller(resp)
        controllers.append(controller)
        vds.extend(ctrl_vds)
        pds.extend(ctrl_pds)

    # Two samples per controller: correctable first, then uncorrectable.
    memory_errors = []
    for ctrl in controllers:
        memory_errors.append({'controller': ctrl['controller'],
                              'correctable': 'y',
                              'value': ctrl['errors_correctable']})
        memory_errors.append({'controller': ctrl['controller'],
                              'correctable': 'n',
                              'value': ctrl['errors_uncorrectable']})

    _print_metric('megaraid_scrape_duration_seconds', 'Scrape duration', 'gauge',
                  '{{cmd="{cmd}"}} {duration:f}',
                  [{'duration': end - start}], cmd)
    _print_metric('megaraid_controllers', 'MegaRAID controllers', 'gauge',
                  '{{cmd="{cmd}",controller="{controller}",model="{model}"}} 1',
                  controllers, cmd)
    _print_metric('megaraid_controller_memory_errors',
                  'MegaRAID controller memory errors', 'counter',
                  '{{cmd="{cmd}",controller="{controller}",correctable="{correctable}"}} '
                  '{value}',
                  memory_errors, cmd)
    _print_metric('megaraid_controller_bbu', 'MegaRAID controller BBU presence', 'gauge',
                  '{{cmd="{cmd}",controller="{controller}"}} {bbu}',
                  controllers, cmd)
    _print_metric('megaraid_roc_temp_celcius', 'MegaRAID controller ROC temperature', 'gauge',
                  '{{cmd="{cmd}",controller="{controller}"}} {roc_temp}',
                  controllers, cmd)
    _print_metric('megaraid_virtual_drives', 'MegaRAID virtual drives', 'gauge',
                  '{{cmd="{cmd}",controller="{controller}",vd="{vd}",'
                  'type="{type}",state="{state}"}} 1',
                  vds, cmd)
    _print_metric('megaraid_vd_size_bytes', 'MegaRAID virtual drive size', 'gauge',
                  '{{cmd="{cmd}",controller="{controller}",vd="{vd}"}} {size}',
                  vds, cmd)
    _print_metric('megaraid_physical_drives', 'MegaRAID physical drives', 'gauge',
                  '{{cmd="{cmd}",controller="{controller}",enclosure="{enclosure}",'
                  'slot="{slot}",vd="{vd}",state="{state}"}} 1',
                  pds, cmd)
    _print_metric('megaraid_pd_size_bytes', 'MegaRAID physical drive size', 'gauge',
                  '{{cmd="{cmd}",controller="{controller}",enclosure="{enclosure}",'
                  'slot="{slot}"}} {size}',
                  pds, cmd)
2018-05-21 10:55:24 -06:00
def get_storcli_json(storcli_path):
    """Run ``<storcli_path> /call show all J`` and return its output as text.

    If ``storcli_path`` is not an executable file, a canned JSON document
    describing a "No Controller found" failure is returned instead, so the
    caller can always parse the result.

    The returned text has every control character and every non-ASCII
    character removed.
    """
    # Check if storcli is installed
    if os.path.isfile(storcli_path) and os.access(storcli_path, os.X_OK):
        storcli_cmd = [storcli_path, '/call', 'show', 'all', 'J']
        proc = subprocess.Popen(storcli_cmd, shell=False,
                                stdout=subprocess.PIPE, stderr=subprocess.PIPE)
        output_json = proc.communicate()[0]
    else:
        output_json = (
            '{"Controllers":[{"Command Status": {"Status": "Failure", '
            '"Description": "No Controller found"}}]}'
        )

    # communicate() yields bytes on Python 3, which cannot be matched against
    # the str pattern below. latin-1 maps each byte to one code point in
    # \x00-\xff, so the trim still removes every non-ASCII byte.
    if isinstance(output_json, bytes):
        output_json = output_json.decode('latin-1')

    # Strip control characters and anything outside printable ASCII.
    return re.sub(r'[\x00-\x1f\x7f-\xff]', '', output_json)
if __name__ == "__main__":
    # Command-line entry point: build the parser, then hand the parsed
    # options straight to main(). Defaults are shown in the --help output.
    PARSER = argparse.ArgumentParser(
        formatter_class=argparse.ArgumentDefaultsHelpFormatter,
        description=DESCRIPTION,
    )
    PARSER.add_argument(
        '--storcli_path',
        help='path to StorCLi binary',
        default='/usr/sbin/storcli',
    )
    PARSER.add_argument(
        '--version',
        version='%(prog)s {}'.format(VERSION),
        action='version',
    )
    main(PARSER.parse_args())