2015-09-26 08:36:40 -07:00
|
|
|
// Copyright 2015 The Prometheus Authors
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
2014-11-24 14:15:13 -08:00
|
|
|
// +build !norunit
|
2014-02-07 08:09:39 -08:00
|
|
|
|
2014-02-18 03:35:11 -08:00
|
|
|
package collector
|
2013-07-25 06:30:35 -07:00
|
|
|
|
|
|
|
import (
|
|
|
|
"github.com/prometheus/client_golang/prometheus"
|
2015-10-30 13:20:06 -07:00
|
|
|
"github.com/prometheus/common/log"
|
2013-07-25 06:30:35 -07:00
|
|
|
"github.com/soundcloud/go-runit/runit"
|
2017-08-12 06:07:24 -07:00
|
|
|
"gopkg.in/alecthomas/kingpin.v2"
|
2013-07-25 06:30:35 -07:00
|
|
|
)
|
|
|
|
|
2017-08-12 06:07:24 -07:00
|
|
|
var runitServiceDir = kingpin.Flag("collector.runit.servicedir", "Path to runit service directory.").Default("/etc/service").String()
|
2016-12-19 04:10:38 -08:00
|
|
|
|
2013-07-25 06:30:35 -07:00
|
|
|
type runitCollector struct {
|
2016-12-28 06:21:31 -08:00
|
|
|
state, stateDesired, stateNormal, stateTimestamp typedDesc
|
2013-07-25 06:30:35 -07:00
|
|
|
}
|
|
|
|
|
2014-02-07 08:09:39 -08:00
|
|
|
func init() {
|
2017-09-28 06:06:26 -07:00
|
|
|
registerCollector("runit", defaultDisabled, NewRunitCollector)
|
2014-02-07 08:09:39 -08:00
|
|
|
}
|
|
|
|
|
2017-02-28 08:44:53 -08:00
|
|
|
// NewRunitCollector returns a new Collector exposing runit statistics.
|
2015-05-20 11:04:49 -07:00
|
|
|
func NewRunitCollector() (Collector, error) {
|
2014-11-24 14:15:13 -08:00
|
|
|
var (
|
|
|
|
subsystem = "service"
|
|
|
|
constLabels = prometheus.Labels{"supervisor": "runit"}
|
|
|
|
labelNames = []string{"service"}
|
|
|
|
)
|
2013-07-25 06:30:35 -07:00
|
|
|
|
2014-11-24 18:00:17 -08:00
|
|
|
return &runitCollector{
|
2016-12-28 06:21:31 -08:00
|
|
|
state: typedDesc{prometheus.NewDesc(
|
2017-09-28 06:06:26 -07:00
|
|
|
prometheus.BuildFQName(namespace, subsystem, "state"),
|
2016-12-28 06:21:31 -08:00
|
|
|
"State of runit service.",
|
|
|
|
labelNames, constLabels,
|
|
|
|
), prometheus.GaugeValue},
|
|
|
|
stateDesired: typedDesc{prometheus.NewDesc(
|
2017-09-28 06:06:26 -07:00
|
|
|
prometheus.BuildFQName(namespace, subsystem, "desired_state"),
|
2016-12-28 06:21:31 -08:00
|
|
|
"Desired state of runit service.",
|
|
|
|
labelNames, constLabels,
|
|
|
|
), prometheus.GaugeValue},
|
|
|
|
stateNormal: typedDesc{prometheus.NewDesc(
|
2017-09-28 06:06:26 -07:00
|
|
|
prometheus.BuildFQName(namespace, subsystem, "normal_state"),
|
2016-12-28 06:21:31 -08:00
|
|
|
"Normal state of runit service.",
|
|
|
|
labelNames, constLabels,
|
|
|
|
), prometheus.GaugeValue},
|
|
|
|
stateTimestamp: typedDesc{prometheus.NewDesc(
|
2017-09-28 06:06:26 -07:00
|
|
|
prometheus.BuildFQName(namespace, subsystem, "state_last_change_timestamp_seconds"),
|
2016-12-28 06:21:31 -08:00
|
|
|
"Unix timestamp of the last runit service state change.",
|
|
|
|
labelNames, constLabels,
|
|
|
|
), prometheus.GaugeValue},
|
2014-11-24 18:00:17 -08:00
|
|
|
}, nil
|
2013-07-25 06:30:35 -07:00
|
|
|
}
|
|
|
|
|
2014-11-24 18:00:17 -08:00
|
|
|
func (c *runitCollector) Update(ch chan<- prometheus.Metric) error {
|
2016-12-19 04:10:38 -08:00
|
|
|
services, err := runit.GetServices(*runitServiceDir)
|
2013-07-25 06:30:35 -07:00
|
|
|
if err != nil {
|
2014-10-29 07:16:43 -07:00
|
|
|
return err
|
2013-07-25 06:30:35 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
for _, service := range services {
|
|
|
|
status, err := service.Status()
|
|
|
|
if err != nil {
|
2015-05-28 12:21:44 -07:00
|
|
|
log.Debugf("Couldn't get status for %s: %s, skipping...", service.Name, err)
|
2013-07-30 07:08:54 -07:00
|
|
|
continue
|
2013-07-25 06:30:35 -07:00
|
|
|
}
|
2013-07-25 06:55:07 -07:00
|
|
|
|
2015-05-28 12:21:44 -07:00
|
|
|
log.Debugf("%s is %d on pid %d for %d seconds", service.Name, status.State, status.Pid, status.Duration)
|
2016-12-28 06:21:31 -08:00
|
|
|
ch <- c.state.mustNewConstMetric(float64(status.State), service.Name)
|
|
|
|
ch <- c.stateDesired.mustNewConstMetric(float64(status.Want), service.Name)
|
|
|
|
ch <- c.stateTimestamp.mustNewConstMetric(float64(status.Timestamp.Unix()), service.Name)
|
2013-07-25 06:30:35 -07:00
|
|
|
if status.NormallyUp {
|
2016-12-28 06:21:31 -08:00
|
|
|
ch <- c.stateNormal.mustNewConstMetric(1, service.Name)
|
2013-07-25 06:30:35 -07:00
|
|
|
} else {
|
2016-12-28 06:21:31 -08:00
|
|
|
ch <- c.stateNormal.mustNewConstMetric(0, service.Name)
|
2013-07-25 06:30:35 -07:00
|
|
|
}
|
|
|
|
}
|
2014-11-24 18:00:17 -08:00
|
|
|
return nil
|
2013-07-25 06:30:35 -07:00
|
|
|
}
|