2015-04-20 03:24:25 -07:00
|
|
|
// Copyright 2015 The Prometheus Authors
|
2013-06-11 13:59:27 -07:00
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
2015-04-20 03:24:25 -07:00
|
|
|
package discovery
|
2013-06-11 13:59:27 -07:00
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
2014-03-09 15:17:17 -07:00
|
|
|
"net"
|
2013-10-29 08:34:00 -07:00
|
|
|
"strings"
|
2015-04-20 03:24:25 -07:00
|
|
|
"sync"
|
2013-06-11 13:59:27 -07:00
|
|
|
"time"
|
|
|
|
|
2013-09-10 08:48:05 -07:00
|
|
|
"github.com/miekg/dns"
|
2014-06-18 10:43:15 -07:00
|
|
|
"github.com/prometheus/client_golang/prometheus"
|
2015-05-20 09:10:29 -07:00
|
|
|
"github.com/prometheus/log"
|
2013-09-10 08:48:05 -07:00
|
|
|
|
2013-06-25 05:02:27 -07:00
|
|
|
clientmodel "github.com/prometheus/client_golang/model"
|
2015-05-20 09:10:29 -07:00
|
|
|
|
2013-06-11 13:59:27 -07:00
|
|
|
"github.com/prometheus/prometheus/config"
|
|
|
|
)
|
|
|
|
|
2015-04-20 03:24:25 -07:00
|
|
|
const (
|
|
|
|
resolvConf = "/etc/resolv.conf"
|
|
|
|
|
2015-08-07 04:18:19 -07:00
|
|
|
DNSNameLabel = clientmodel.MetaLabelPrefix + "dns_srv_name"
|
2015-04-20 03:24:25 -07:00
|
|
|
|
|
|
|
// Constants for instrumentation.
|
|
|
|
namespace = "prometheus"
|
|
|
|
interval = "interval"
|
|
|
|
)
|
2013-09-10 08:48:05 -07:00
|
|
|
|
2014-06-18 10:43:15 -07:00
|
|
|
var (
|
2014-12-26 04:37:30 -08:00
|
|
|
dnsSDLookupsCount = prometheus.NewCounter(
|
2014-06-18 10:43:15 -07:00
|
|
|
prometheus.CounterOpts{
|
2014-07-23 10:55:33 -07:00
|
|
|
Namespace: namespace,
|
|
|
|
Name: "dns_sd_lookups_total",
|
2014-12-26 04:37:30 -08:00
|
|
|
Help: "The number of DNS-SD lookups.",
|
|
|
|
})
|
|
|
|
dnsSDLookupFailuresCount = prometheus.NewCounter(
|
|
|
|
prometheus.CounterOpts{
|
|
|
|
Namespace: namespace,
|
|
|
|
Name: "dns_sd_lookup_failures_total",
|
|
|
|
Help: "The number of DNS-SD lookup failures.",
|
|
|
|
})
|
2014-06-18 10:43:15 -07:00
|
|
|
)
|
|
|
|
|
|
|
|
func init() {
|
2014-12-26 04:37:30 -08:00
|
|
|
prometheus.MustRegister(dnsSDLookupFailuresCount)
|
2014-06-18 10:43:15 -07:00
|
|
|
prometheus.MustRegister(dnsSDLookupsCount)
|
|
|
|
}
|
|
|
|
|
2015-04-20 03:24:25 -07:00
|
|
|
// DNSDiscovery periodically performs DNS-SD requests. It implements
// the TargetProvider interface.
type DNSDiscovery struct {
	// names holds the DNS names that are looked up on every refresh.
	names []string

	// done is signalled by Stop to make Run return.
	done chan struct{}
	// ticker paces the periodic refreshes performed by Run.
	ticker *time.Ticker
	// m is not referenced by any method visible in this part of the file.
	m sync.RWMutex
	// port is combined with the addresses of A and AAAA answers, which carry
	// no port of their own.
	port int
	// qtype is the DNS record type (dns.TypeSRV, dns.TypeA or dns.TypeAAAA)
	// requested for every name.
	qtype uint16
}
|
2013-06-11 13:59:27 -07:00
|
|
|
|
2015-04-20 03:24:25 -07:00
|
|
|
// NewDNSDiscovery returns a new DNSDiscovery which periodically refreshes its targets.
|
2015-05-15 05:54:29 -07:00
|
|
|
func NewDNSDiscovery(conf *config.DNSSDConfig) *DNSDiscovery {
|
2015-07-30 01:56:48 -07:00
|
|
|
qtype := dns.TypeSRV
|
|
|
|
switch strings.ToUpper(conf.Type) {
|
|
|
|
case "A":
|
|
|
|
qtype = dns.TypeA
|
|
|
|
case "AAAA":
|
|
|
|
qtype = dns.TypeAAAA
|
|
|
|
case "SRV":
|
|
|
|
qtype = dns.TypeSRV
|
|
|
|
}
|
2015-04-20 03:24:25 -07:00
|
|
|
return &DNSDiscovery{
|
2015-05-15 05:54:29 -07:00
|
|
|
names: conf.Names,
|
2015-04-20 03:24:25 -07:00
|
|
|
done: make(chan struct{}),
|
2015-05-15 05:54:29 -07:00
|
|
|
ticker: time.NewTicker(time.Duration(conf.RefreshInterval)),
|
2015-07-30 01:56:48 -07:00
|
|
|
qtype: qtype,
|
|
|
|
port: conf.Port,
|
2015-04-20 03:24:25 -07:00
|
|
|
}
|
2013-06-11 13:59:27 -07:00
|
|
|
}
|
|
|
|
|
2015-04-20 03:24:25 -07:00
|
|
|
// Run implements the TargetProvider interface.
|
|
|
|
func (dd *DNSDiscovery) Run(ch chan<- *config.TargetGroup) {
|
|
|
|
defer close(ch)
|
|
|
|
|
|
|
|
// Get an initial set right away.
|
2015-04-25 03:59:05 -07:00
|
|
|
dd.refreshAll(ch)
|
2015-04-20 03:24:25 -07:00
|
|
|
|
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case <-dd.ticker.C:
|
2015-04-25 03:59:05 -07:00
|
|
|
dd.refreshAll(ch)
|
2015-04-20 03:24:25 -07:00
|
|
|
case <-dd.done:
|
|
|
|
return
|
|
|
|
}
|
2013-06-11 13:59:27 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-04-20 03:24:25 -07:00
|
|
|
// Stop implements the TargetProvider interface.
|
|
|
|
func (dd *DNSDiscovery) Stop() {
|
2015-05-20 09:10:29 -07:00
|
|
|
log.Debug("Stopping DNS discovery for %s...", dd.names)
|
2013-12-13 17:50:48 -08:00
|
|
|
|
2015-04-20 03:24:25 -07:00
|
|
|
dd.ticker.Stop()
|
|
|
|
dd.done <- struct{}{}
|
|
|
|
|
2015-05-20 09:10:29 -07:00
|
|
|
log.Debug("DNS discovery for %s stopped.", dd.names)
|
2015-04-20 03:24:25 -07:00
|
|
|
}
|
2013-06-11 13:59:27 -07:00
|
|
|
|
2015-04-20 03:24:25 -07:00
|
|
|
// Sources implements the TargetProvider interface.
|
|
|
|
func (dd *DNSDiscovery) Sources() []string {
|
2015-04-25 03:59:05 -07:00
|
|
|
var srcs []string
|
|
|
|
for _, name := range dd.names {
|
2015-08-07 04:18:19 -07:00
|
|
|
srcs = append(srcs, name)
|
2015-04-25 03:59:05 -07:00
|
|
|
}
|
|
|
|
return srcs
|
|
|
|
}
|
|
|
|
|
|
|
|
func (dd *DNSDiscovery) refreshAll(ch chan<- *config.TargetGroup) {
|
|
|
|
var wg sync.WaitGroup
|
|
|
|
wg.Add(len(dd.names))
|
|
|
|
for _, name := range dd.names {
|
|
|
|
go func(n string) {
|
|
|
|
if err := dd.refresh(n, ch); err != nil {
|
2015-05-20 09:10:29 -07:00
|
|
|
log.Errorf("Error refreshing DNS targets: %s", err)
|
2015-04-25 03:59:05 -07:00
|
|
|
}
|
|
|
|
wg.Done()
|
|
|
|
}(name)
|
|
|
|
}
|
|
|
|
wg.Wait()
|
2015-04-20 03:24:25 -07:00
|
|
|
}
|
2013-12-13 17:50:48 -08:00
|
|
|
|
2015-04-25 03:59:05 -07:00
|
|
|
func (dd *DNSDiscovery) refresh(name string, ch chan<- *config.TargetGroup) error {
|
2015-07-30 01:56:48 -07:00
|
|
|
response, err := lookupAll(name, dd.qtype)
|
2015-04-20 03:24:25 -07:00
|
|
|
dnsSDLookupsCount.Inc()
|
2013-06-11 13:59:27 -07:00
|
|
|
if err != nil {
|
2015-04-20 03:24:25 -07:00
|
|
|
dnsSDLookupFailuresCount.Inc()
|
|
|
|
return err
|
2015-03-14 19:36:15 -07:00
|
|
|
}
|
2013-06-11 13:59:27 -07:00
|
|
|
|
2015-04-20 03:24:25 -07:00
|
|
|
tg := &config.TargetGroup{}
|
2013-09-10 08:48:05 -07:00
|
|
|
for _, record := range response.Answer {
|
2015-07-30 01:56:48 -07:00
|
|
|
target := clientmodel.LabelValue("")
|
|
|
|
switch addr := record.(type) {
|
|
|
|
case *dns.SRV:
|
|
|
|
// Remove the final dot from rooted DNS names to make them look more usual.
|
|
|
|
addr.Target = strings.TrimRight(addr.Target, ".")
|
|
|
|
|
|
|
|
target = clientmodel.LabelValue(fmt.Sprintf("%s:%d", addr.Target, addr.Port))
|
|
|
|
case *dns.A:
|
|
|
|
target = clientmodel.LabelValue(fmt.Sprintf("%s:%d", addr.A, dd.port))
|
|
|
|
case *dns.AAAA:
|
|
|
|
target = clientmodel.LabelValue(fmt.Sprintf("%s:%d", addr.AAAA, dd.port))
|
|
|
|
default:
|
2015-05-20 09:10:29 -07:00
|
|
|
log.Warnf("%q is not a valid SRV record", record)
|
2013-09-10 08:48:05 -07:00
|
|
|
continue
|
2015-04-20 03:24:25 -07:00
|
|
|
|
2015-07-30 01:56:48 -07:00
|
|
|
}
|
2015-04-20 03:24:25 -07:00
|
|
|
tg.Targets = append(tg.Targets, clientmodel.LabelSet{
|
|
|
|
clientmodel.AddressLabel: target,
|
2015-04-28 15:08:58 -07:00
|
|
|
DNSNameLabel: clientmodel.LabelValue(name),
|
2015-04-20 03:24:25 -07:00
|
|
|
})
|
2013-06-11 13:59:27 -07:00
|
|
|
}
|
|
|
|
|
2015-08-07 04:18:19 -07:00
|
|
|
tg.Source = name
|
2015-04-20 03:24:25 -07:00
|
|
|
ch <- tg
|
|
|
|
|
|
|
|
return nil
|
2013-06-11 13:59:27 -07:00
|
|
|
}
|
2013-09-10 08:48:05 -07:00
|
|
|
|
2015-07-30 01:56:48 -07:00
|
|
|
func lookupAll(name string, qtype uint16) (*dns.Msg, error) {
|
2013-09-10 08:48:05 -07:00
|
|
|
conf, err := dns.ClientConfigFromFile(resolvConf)
|
|
|
|
if err != nil {
|
2015-04-20 03:24:25 -07:00
|
|
|
return nil, fmt.Errorf("could not load resolv.conf: %s", err)
|
2013-09-10 08:48:05 -07:00
|
|
|
}
|
|
|
|
|
2013-10-29 08:34:00 -07:00
|
|
|
client := &dns.Client{}
|
2013-09-10 08:48:05 -07:00
|
|
|
response := &dns.Msg{}
|
2013-10-29 08:34:00 -07:00
|
|
|
|
2013-09-10 08:48:05 -07:00
|
|
|
for _, server := range conf.Servers {
|
2014-03-09 15:17:17 -07:00
|
|
|
servAddr := net.JoinHostPort(server, conf.Port)
|
2013-10-29 08:34:00 -07:00
|
|
|
for _, suffix := range conf.Search {
|
2015-07-30 01:56:48 -07:00
|
|
|
response, err = lookup(name, qtype, client, servAddr, suffix, false)
|
2015-04-20 03:24:25 -07:00
|
|
|
if err != nil {
|
2015-05-20 09:10:29 -07:00
|
|
|
log.Warnf("resolving %s.%s failed: %s", name, suffix, err)
|
2015-04-20 03:24:25 -07:00
|
|
|
continue
|
|
|
|
}
|
|
|
|
if len(response.Answer) > 0 {
|
|
|
|
return response, nil
|
2013-10-29 08:34:00 -07:00
|
|
|
}
|
|
|
|
}
|
2015-07-30 01:56:48 -07:00
|
|
|
response, err = lookup(name, qtype, client, servAddr, "", false)
|
2013-09-10 08:48:05 -07:00
|
|
|
if err == nil {
|
|
|
|
return response, nil
|
|
|
|
}
|
|
|
|
}
|
2015-04-20 03:24:25 -07:00
|
|
|
return response, fmt.Errorf("could not resolve %s: No server responded", name)
|
2013-09-10 08:48:05 -07:00
|
|
|
}
|
|
|
|
|
2014-03-09 15:17:17 -07:00
|
|
|
func lookup(name string, queryType uint16, client *dns.Client, servAddr string, suffix string, edns bool) (*dns.Msg, error) {
|
2013-10-29 08:34:00 -07:00
|
|
|
msg := &dns.Msg{}
|
|
|
|
lname := strings.Join([]string{name, suffix}, ".")
|
|
|
|
msg.SetQuestion(dns.Fqdn(lname), queryType)
|
|
|
|
|
2013-09-10 08:48:05 -07:00
|
|
|
if edns {
|
|
|
|
opt := &dns.OPT{
|
|
|
|
Hdr: dns.RR_Header{
|
|
|
|
Name: ".",
|
|
|
|
Rrtype: dns.TypeOPT,
|
|
|
|
},
|
|
|
|
}
|
|
|
|
opt.SetUDPSize(dns.DefaultMsgSize)
|
|
|
|
msg.Extra = append(msg.Extra, opt)
|
|
|
|
}
|
|
|
|
|
2014-03-09 15:17:17 -07:00
|
|
|
response, _, err := client.Exchange(msg, servAddr)
|
2013-09-10 08:48:05 -07:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
if msg.Id != response.Id {
|
|
|
|
return nil, fmt.Errorf("DNS ID mismatch, request: %d, response: %d", msg.Id, response.Id)
|
|
|
|
}
|
|
|
|
|
|
|
|
if response.MsgHdr.Truncated {
|
|
|
|
if client.Net == "tcp" {
|
2014-12-10 07:16:49 -08:00
|
|
|
return nil, fmt.Errorf("got truncated message on tcp")
|
2013-09-10 08:48:05 -07:00
|
|
|
}
|
|
|
|
if edns { // Truncated even though EDNS is used
|
|
|
|
client.Net = "tcp"
|
|
|
|
}
|
2014-03-09 15:17:17 -07:00
|
|
|
return lookup(name, queryType, client, servAddr, suffix, !edns)
|
2013-09-10 08:48:05 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
return response, nil
|
|
|
|
}
|