Add stime metric and improve commenting
This commit is contained in:
parent
15c06c265e
commit
1a6a9190f3
51
dns.go
51
dns.go
@ -13,27 +13,36 @@ import (
|
|||||||
log "github.com/sirupsen/logrus"
|
log "github.com/sirupsen/logrus"
|
||||||
"math"
|
"math"
|
||||||
"strconv"
|
"strconv"
|
||||||
|
"time"
|
||||||
)
|
)
|
||||||
|
|
||||||
//////////////////////////////////////////////////////////////////////////
|
//////////////////////////////////////////////////////////////////////////
|
||||||
|
// data structures
|
||||||
|
|
||||||
|
// for holding the metrics
|
||||||
|
|
||||||
type DNSMetrics struct {
|
type DNSMetrics struct {
|
||||||
soa *prometheus.GaugeVec
|
soa *prometheus.GaugeVec
|
||||||
rtt *prometheus.GaugeVec
|
rtt *prometheus.GaugeVec
|
||||||
valid *prometheus.GaugeVec
|
valid *prometheus.GaugeVec
|
||||||
|
stime *prometheus.GaugeVec
|
||||||
label_map []prometheus.Labels
|
label_map []prometheus.Labels
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// for specifying DNS servers
|
||||||
|
|
||||||
type DNSServer struct {
|
type DNSServer struct {
|
||||||
role string
|
role string
|
||||||
name string
|
name string
|
||||||
ip uint8
|
ip uint8
|
||||||
addr string
|
addr string
|
||||||
soa uint
|
soa uint64
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// hardcoded :( list of DNS servers to query
|
||||||
|
|
||||||
var dns_servers = []*DNSServer{
|
var dns_servers = []*DNSServer{
|
||||||
&DNSServer{"master", "master.delegation-servers.dn42", 6, "[fd42:180:3de0:10:5054:ff:fe87:ea39]:53", 0},
|
&DNSServer{"master", "j.master.delegation-servers.dn42", 6, "[fd42:180:3de0:10:5054:ff:fe87:ea39]:53", 0},
|
||||||
&DNSServer{"delegation", "b.delegation-servers.dn42", 4, "172.20.129.1:53", 0},
|
&DNSServer{"delegation", "b.delegation-servers.dn42", 4, "172.20.129.1:53", 0},
|
||||||
&DNSServer{"delegation", "b.delegation-servers.dn42", 6, "[fd42:4242:2601:ac53::1]:53", 0},
|
&DNSServer{"delegation", "b.delegation-servers.dn42", 6, "[fd42:4242:2601:ac53::1]:53", 0},
|
||||||
&DNSServer{"delegation", "j.delegation-servers.dn42", 4, "172.20.1.18:53", 0},
|
&DNSServer{"delegation", "j.delegation-servers.dn42", 4, "172.20.1.18:53", 0},
|
||||||
@ -56,6 +65,7 @@ var dns_servers = []*DNSServer{
|
|||||||
}
|
}
|
||||||
|
|
||||||
//////////////////////////////////////////////////////////////////////////
|
//////////////////////////////////////////////////////////////////////////
|
||||||
|
// initialisation function to register metrics
|
||||||
|
|
||||||
func (m *DNSMetrics) Register() {
|
func (m *DNSMetrics) Register() {
|
||||||
|
|
||||||
@ -77,6 +87,12 @@ func (m *DNSMetrics) Register() {
|
|||||||
}, []string{"role", "name", "ip", "addr"})
|
}, []string{"role", "name", "ip", "addr"})
|
||||||
prometheus.MustRegister(m.valid)
|
prometheus.MustRegister(m.valid)
|
||||||
|
|
||||||
|
m.stime = prometheus.NewGaugeVec(prometheus.GaugeOpts{
|
||||||
|
Name: "dn42_dns_stime",
|
||||||
|
Help: "Returns the time between now and the SOA serial number",
|
||||||
|
}, []string{"role", "name", "ip", "addr"})
|
||||||
|
prometheus.MustRegister(m.stime)
|
||||||
|
|
||||||
// pre-populate the labels
|
// pre-populate the labels
|
||||||
m.label_map = make([]prometheus.Labels, len(dns_servers))
|
m.label_map = make([]prometheus.Labels, len(dns_servers))
|
||||||
|
|
||||||
@ -92,28 +108,53 @@ func (m *DNSMetrics) Register() {
|
|||||||
}
|
}
|
||||||
|
|
||||||
//////////////////////////////////////////////////////////////////////////
|
//////////////////////////////////////////////////////////////////////////
|
||||||
|
// collect metrics for all DNS servers
|
||||||
|
|
||||||
func (m *DNSMetrics) Collect() {
|
func (m *DNSMetrics) Collect() {
|
||||||
|
|
||||||
for ix, server := range dns_servers {
|
now := uint64(time.Now().Unix())
|
||||||
soa, rtt := server.Query()
|
|
||||||
server.soa = uint(soa)
|
|
||||||
|
|
||||||
|
// go through each server in turn
|
||||||
|
for ix, server := range dns_servers {
|
||||||
|
|
||||||
|
// query it
|
||||||
|
soa, rtt := server.Query()
|
||||||
|
server.soa = uint64(soa)
|
||||||
|
|
||||||
|
// SOA and RTT are direct metrics returned from the query
|
||||||
m.soa.With(m.label_map[ix]).Set(soa)
|
m.soa.With(m.label_map[ix]).Set(soa)
|
||||||
m.rtt.With(m.label_map[ix]).Set(rtt)
|
m.rtt.With(m.label_map[ix]).Set(rtt)
|
||||||
|
|
||||||
|
// check if the returned SOA matches j.master.delegation-servers.dn42
|
||||||
var valid uint = 0
|
var valid uint = 0
|
||||||
|
|
||||||
if server.soa == 0 {
|
if server.soa == 0 {
|
||||||
|
// didn't get a result, server issue
|
||||||
valid = 2
|
valid = 2
|
||||||
} else {
|
} else {
|
||||||
if server.soa != dns_servers[0].soa {
|
if server.soa != dns_servers[0].soa {
|
||||||
|
// SOA didn't match
|
||||||
valid = 1
|
valid = 1
|
||||||
} else {
|
} else {
|
||||||
valid = 0
|
valid = 0
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// before setting whether the server is valid, calculate the stime
|
||||||
|
// (difference in time between now and the SOA, to allow checking that
|
||||||
|
// it is not stale)
|
||||||
|
// it's possible that the SOA could be in the future if there is a
|
||||||
|
// clock mismatch between monitor and DNS server, in which case this
|
||||||
|
// is flagged as a server error
|
||||||
|
|
||||||
|
if server.soa > now {
|
||||||
|
// server error
|
||||||
|
valid = 2
|
||||||
|
} else {
|
||||||
|
m.stime.With(m.label_map[ix]).Set(float64(now - server.soa))
|
||||||
|
}
|
||||||
|
|
||||||
|
// finally set the valid status
|
||||||
m.valid.With(m.label_map[ix]).Set(float64(valid))
|
m.valid.With(m.label_map[ix]).Set(float64(valid))
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Loading…
x
Reference in New Issue
Block a user