mirror of
https://github.com/prometheus/node_exporter.git
synced 2025-01-15 16:03:03 -08:00
96eaff8c7e
This catches things like listen overflows, retransmits, and other events that are very useful for retroactive debugging, so I think it's justified to have it on by default.
162 lines
3.8 KiB
Go
162 lines
3.8 KiB
Go
package main
|
|
|
|
import (
|
|
"encoding/json"
|
|
"flag"
|
|
"fmt"
|
|
"io/ioutil"
|
|
"log"
|
|
"net/http"
|
|
"os"
|
|
"os/signal"
|
|
"runtime/pprof"
|
|
"strings"
|
|
"sync"
|
|
"syscall"
|
|
"time"
|
|
|
|
"github.com/golang/glog"
|
|
"github.com/prometheus/client_golang/prometheus"
|
|
"github.com/prometheus/node_exporter/collector"
|
|
)
|
|
|
|
const subsystem = "exporter"
|
|
|
|
var (
|
|
configFile = flag.String("config", "node_exporter.conf", "config file.")
|
|
memProfile = flag.String("memprofile", "", "write memory profile to this file")
|
|
listeningAddress = flag.String("listen", ":8080", "address to listen on")
|
|
enabledCollectors = flag.String("enabledCollectors", "attributes,diskstats,filesystem,loadavg,meminfo,stat,time,netdev,netstat", "comma-seperated list of collectors to use")
|
|
printCollectors = flag.Bool("printCollectors", false, "If true, print available collectors and exit")
|
|
|
|
collectorLabelNames = []string{"collector", "result"}
|
|
|
|
scrapeDurations = prometheus.NewSummaryVec(
|
|
prometheus.SummaryOpts{
|
|
Namespace: collector.Namespace,
|
|
Subsystem: subsystem,
|
|
Name: "scrape_duration_seconds",
|
|
Help: "node_exporter: Duration of a scrape job.",
|
|
},
|
|
collectorLabelNames,
|
|
)
|
|
)
|
|
|
|
// Implements Collector.
|
|
type NodeCollector struct {
|
|
collectors map[string]collector.Collector
|
|
}
|
|
|
|
// Implements Collector.
|
|
func (n NodeCollector) Describe(ch chan<- *prometheus.Desc) {
|
|
scrapeDurations.Describe(ch)
|
|
}
|
|
|
|
// Implements Collector.
|
|
func (n NodeCollector) Collect(ch chan<- prometheus.Metric) {
|
|
wg := sync.WaitGroup{}
|
|
wg.Add(len(n.collectors))
|
|
for name, c := range n.collectors {
|
|
go func(name string, c collector.Collector) {
|
|
Execute(name, c, ch)
|
|
wg.Done()
|
|
}(name, c)
|
|
}
|
|
wg.Wait()
|
|
scrapeDurations.Collect(ch)
|
|
}
|
|
|
|
func Execute(name string, c collector.Collector, ch chan<- prometheus.Metric) {
|
|
begin := time.Now()
|
|
err := c.Update(ch)
|
|
duration := time.Since(begin)
|
|
var result string
|
|
|
|
if err != nil {
|
|
glog.Infof("ERROR: %s failed after %fs: %s", name, duration.Seconds(), err)
|
|
result = "error"
|
|
} else {
|
|
glog.Infof("OK: %s success after %fs.", name, duration.Seconds())
|
|
result = "success"
|
|
}
|
|
scrapeDurations.WithLabelValues(name, result).Observe(duration.Seconds())
|
|
}
|
|
|
|
func getConfig(file string) (*collector.Config, error) {
|
|
config := &collector.Config{}
|
|
glog.Infof("Reading config %s", *configFile)
|
|
bytes, err := ioutil.ReadFile(*configFile)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return config, json.Unmarshal(bytes, &config)
|
|
}
|
|
|
|
func loadCollectors(file string) (map[string]collector.Collector, error) {
|
|
collectors := map[string]collector.Collector{}
|
|
config, err := getConfig(file)
|
|
if err != nil {
|
|
log.Fatalf("Couldn't read config %s: %s", file, err)
|
|
}
|
|
for _, name := range strings.Split(*enabledCollectors, ",") {
|
|
fn, ok := collector.Factories[name]
|
|
if !ok {
|
|
log.Fatalf("Collector '%s' not available", name)
|
|
}
|
|
c, err := fn(*config)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
collectors[name] = c
|
|
}
|
|
return collectors, nil
|
|
}
|
|
|
|
func main() {
|
|
flag.Parse()
|
|
if *printCollectors {
|
|
fmt.Printf("Available collectors:\n")
|
|
for n, _ := range collector.Factories {
|
|
fmt.Printf(" - %s\n", n)
|
|
}
|
|
return
|
|
}
|
|
collectors, err := loadCollectors(*configFile)
|
|
if err != nil {
|
|
log.Fatalf("Couldn't load config and collectors: %s", err)
|
|
}
|
|
|
|
glog.Infof("Enabled collectors:")
|
|
for n, _ := range collectors {
|
|
glog.Infof(" - %s", n)
|
|
}
|
|
|
|
nodeCollector := NodeCollector{collectors: collectors}
|
|
prometheus.MustRegister(nodeCollector)
|
|
|
|
sigUsr1 := make(chan os.Signal)
|
|
signal.Notify(sigUsr1, syscall.SIGUSR1)
|
|
|
|
go func() {
|
|
http.Handle("/metrics", prometheus.Handler())
|
|
http.ListenAndServe(*listeningAddress, nil)
|
|
}()
|
|
|
|
for {
|
|
select {
|
|
case <-sigUsr1:
|
|
glog.Infof("got signal")
|
|
if *memProfile != "" {
|
|
glog.Infof("Writing memory profile to %s", *memProfile)
|
|
f, err := os.Create(*memProfile)
|
|
if err != nil {
|
|
log.Fatal(err)
|
|
}
|
|
pprof.WriteHeapProfile(f)
|
|
f.Close()
|
|
}
|
|
}
|
|
}
|
|
|
|
}
|