2014-07-08 07:24:29 -07:00
|
|
|
// +build megacli
|
|
|
|
|
|
|
|
package collector
|
|
|
|
|
|
|
|
import (
|
|
|
|
"bufio"
|
|
|
|
"io"
|
|
|
|
"os/exec"
|
|
|
|
"strconv"
|
|
|
|
"strings"
|
|
|
|
|
|
|
|
"github.com/prometheus/client_golang/prometheus"
|
|
|
|
)
|
|
|
|
|
|
|
|
// defaultMegaCli is the megacli executable name used when the collector
// configuration does not provide a "megacli_command" entry.
const defaultMegaCli = "megacli"

// adapterHeaderSep is the separator line parseMegaCliAdapter looks for in the
// adapter report: the (trimmed) line preceding it is used as a section name.
const adapterHeaderSep = "================"
|
|
|
|
|
|
|
|
var (
|
|
|
|
driveTemperature = prometheus.NewGaugeVec(prometheus.GaugeOpts{
|
|
|
|
Namespace: Namespace,
|
2014-07-09 09:47:17 -07:00
|
|
|
Name: "megacli_drive_temperature_celsius",
|
2014-07-08 07:24:29 -07:00
|
|
|
Help: "megacli: drive temperature",
|
|
|
|
}, []string{"enclosure", "slot"})
|
|
|
|
|
|
|
|
driveCounters = prometheus.NewCounterVec(prometheus.CounterOpts{
|
|
|
|
Namespace: Namespace,
|
2014-07-09 09:47:17 -07:00
|
|
|
Name: "megacli_drive_count",
|
2014-07-08 07:24:29 -07:00
|
|
|
Help: "megacli: drive error and event counters",
|
|
|
|
}, []string{"enclosure", "slot", "type"})
|
|
|
|
|
|
|
|
drivePresence = prometheus.NewGaugeVec(prometheus.GaugeOpts{
|
|
|
|
Namespace: Namespace,
|
2014-07-09 09:47:17 -07:00
|
|
|
Name: "megacli_adapter_disk_presence",
|
2014-07-08 07:24:29 -07:00
|
|
|
Help: "megacli: disk presence per adapter",
|
|
|
|
}, []string{"type"})
|
|
|
|
|
|
|
|
counters = []string{"Media Error Count", "Other Error Count", "Predictive Failure Count"}
|
|
|
|
)
|
|
|
|
|
|
|
|
func init() {
|
|
|
|
Factories["megacli"] = NewMegaCliCollector
|
|
|
|
}
|
|
|
|
|
|
|
|
// parseMegaCliDisks parses a physical-drive listing (the output that
// updateDisks obtains from `-PDList -aALL`) read from r.
//
// Only lines of the form "key: value" are considered. "Enclosure Device ID"
// and "Slot Number" lines select the current drive; every other pair is
// stored for that drive once both IDs have been seen. The result is keyed by
// enclosure ID, then slot number, then attribute name.
//
// r is always closed before returning. An error (and a nil map) is returned
// when an enclosure or slot ID is not an integer, or when reading from r
// fails.
func parseMegaCliDisks(r io.ReadCloser) (map[int]map[int]map[string]string, error) {
	defer r.Close()

	stats := map[int]map[int]map[string]string{}
	curEnc, curSlot := -1, -1

	scanner := bufio.NewScanner(r)
	for scanner.Scan() {
		parts := strings.SplitN(strings.TrimSpace(scanner.Text()), ":", 2)
		if len(parts) != 2 { // no "key: value" pair, e.g. "Adapter #X" or a blank line
			continue
		}
		key := strings.TrimSpace(parts[0])
		value := strings.TrimSpace(parts[1])

		var err error
		switch {
		case key == "Enclosure Device ID":
			if curEnc, err = strconv.Atoi(value); err != nil {
				return nil, err
			}
		case key == "Slot Number":
			if curSlot, err = strconv.Atoi(value); err != nil {
				return nil, err
			}
		case curSlot != -1 && curEnc != -1:
			// Create the nested maps lazily, the first time a drive is seen.
			slots, ok := stats[curEnc]
			if !ok {
				slots = map[int]map[string]string{}
				stats[curEnc] = slots
			}
			attrs, ok := slots[curSlot]
			if !ok {
				attrs = map[string]string{}
				slots[curSlot] = attrs
			}
			attrs[key] = value
		}
	}
	// Scan() returning false also covers read failures and over-long lines;
	// report them instead of handing back silently truncated statistics.
	if err := scanner.Err(); err != nil {
		return nil, err
	}
	return stats, nil
}
|
|
|
|
|
|
|
|
func parseMegaCliAdapter(r io.ReadCloser) (map[string]map[string]string, error) {
|
|
|
|
defer r.Close()
|
|
|
|
raidStats := map[string]map[string]string{}
|
|
|
|
scanner := bufio.NewScanner(r)
|
|
|
|
header := ""
|
|
|
|
last := ""
|
|
|
|
for scanner.Scan() {
|
|
|
|
text := strings.TrimSpace(scanner.Text())
|
|
|
|
if text == adapterHeaderSep {
|
|
|
|
header = last
|
|
|
|
raidStats[header] = map[string]string{}
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
last = text
|
|
|
|
if header == "" { // skip Adapter #X and separator
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
parts := strings.SplitN(text, ":", 2)
|
|
|
|
if len(parts) != 2 { // these section never include anything we are interested in
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
key := strings.TrimSpace(parts[0])
|
|
|
|
value := strings.TrimSpace(parts[1])
|
|
|
|
|
|
|
|
raidStats[header][key] = value
|
|
|
|
|
|
|
|
}
|
|
|
|
return raidStats, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
type megaCliCollector struct {
|
|
|
|
config Config
|
|
|
|
cli string
|
|
|
|
}
|
|
|
|
|
|
|
|
// Takes a config struct and prometheus registry and returns a new Collector exposing
|
|
|
|
// RAID status through megacli.
|
|
|
|
func NewMegaCliCollector(config Config) (Collector, error) {
|
|
|
|
cli := defaultMegaCli
|
|
|
|
if config.Config["megacli_command"] != "" {
|
|
|
|
cli = config.Config["megacli_command"]
|
|
|
|
}
|
|
|
|
|
|
|
|
c := megaCliCollector{
|
|
|
|
config: config,
|
|
|
|
cli: cli,
|
|
|
|
}
|
|
|
|
return &c, nil
|
|
|
|
}
|
|
|
|
|
2014-10-29 07:16:43 -07:00
|
|
|
func (c *megaCliCollector) Update(ch chan<- prometheus.Metric) (err error) {
|
|
|
|
err = c.updateAdapter()
|
2014-07-08 07:24:29 -07:00
|
|
|
if err != nil {
|
2014-10-29 07:16:43 -07:00
|
|
|
return err
|
2014-07-08 07:24:29 -07:00
|
|
|
}
|
2014-10-29 07:16:43 -07:00
|
|
|
err = c.updateDisks()
|
|
|
|
driveTemperature.Collect(ch)
|
|
|
|
driveCounters.Collect(ch)
|
|
|
|
drivePresence.Collect(ch)
|
|
|
|
return err
|
2014-07-08 07:24:29 -07:00
|
|
|
}
|
|
|
|
|
2014-10-29 07:16:43 -07:00
|
|
|
func (c *megaCliCollector) updateAdapter() error {
|
2014-07-08 07:24:29 -07:00
|
|
|
cmd := exec.Command(c.cli, "-AdpAllInfo", "-aALL")
|
|
|
|
pipe, err := cmd.StdoutPipe()
|
|
|
|
if err != nil {
|
2014-10-29 07:16:43 -07:00
|
|
|
return err
|
2014-07-08 07:24:29 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
if err := cmd.Start(); err != nil {
|
2014-10-29 07:16:43 -07:00
|
|
|
return err
|
2014-07-08 07:24:29 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
stats, err := parseMegaCliAdapter(pipe)
|
|
|
|
if err != nil {
|
2014-10-29 07:16:43 -07:00
|
|
|
return err
|
2014-07-08 07:24:29 -07:00
|
|
|
}
|
|
|
|
if err := cmd.Wait(); err != nil {
|
2014-10-29 07:16:43 -07:00
|
|
|
return err
|
2014-07-08 07:24:29 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
for k, v := range stats["Device Present"] {
|
|
|
|
value, err := strconv.ParseFloat(v, 64)
|
|
|
|
if err != nil {
|
2014-10-29 07:16:43 -07:00
|
|
|
return err
|
2014-07-08 07:24:29 -07:00
|
|
|
}
|
|
|
|
drivePresence.WithLabelValues(k).Set(value)
|
|
|
|
}
|
2014-10-29 07:16:43 -07:00
|
|
|
return nil
|
2014-07-08 07:24:29 -07:00
|
|
|
}
|
|
|
|
|
2014-10-29 07:16:43 -07:00
|
|
|
func (c *megaCliCollector) updateDisks() error {
|
2014-07-08 07:24:29 -07:00
|
|
|
cmd := exec.Command(c.cli, "-PDList", "-aALL")
|
|
|
|
pipe, err := cmd.StdoutPipe()
|
|
|
|
if err != nil {
|
2014-10-29 07:16:43 -07:00
|
|
|
return err
|
2014-07-08 07:24:29 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
if err := cmd.Start(); err != nil {
|
2014-10-29 07:16:43 -07:00
|
|
|
return err
|
2014-07-08 07:24:29 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
stats, err := parseMegaCliDisks(pipe)
|
|
|
|
if err != nil {
|
2014-10-29 07:16:43 -07:00
|
|
|
return err
|
2014-07-08 07:24:29 -07:00
|
|
|
}
|
|
|
|
if err := cmd.Wait(); err != nil {
|
2014-10-29 07:16:43 -07:00
|
|
|
return err
|
2014-07-08 07:24:29 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
for enc, encStats := range stats {
|
|
|
|
for slot, slotStats := range encStats {
|
|
|
|
tStr := slotStats["Drive Temperature"]
|
|
|
|
tStr = tStr[:strings.Index(tStr, "C")]
|
|
|
|
t, err := strconv.ParseFloat(tStr, 64)
|
|
|
|
if err != nil {
|
2014-10-29 07:16:43 -07:00
|
|
|
return err
|
2014-07-08 07:24:29 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
encStr := strconv.Itoa(enc)
|
|
|
|
slotStr := strconv.Itoa(slot)
|
|
|
|
|
|
|
|
driveTemperature.WithLabelValues(encStr, slotStr).Set(t)
|
|
|
|
|
|
|
|
for _, c := range counters {
|
|
|
|
counter, err := strconv.ParseFloat(slotStats[c], 64)
|
|
|
|
if err != nil {
|
2014-10-29 07:16:43 -07:00
|
|
|
return err
|
2014-07-08 07:24:29 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
driveCounters.WithLabelValues(encStr, slotStr, c).Set(counter)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2014-10-29 07:16:43 -07:00
|
|
|
return nil
|
2014-07-08 07:24:29 -07:00
|
|
|
}
|