mirror of
https://github.com/coredns/coredns.git
synced 2025-11-02 10:13:14 -05:00
Metrics: expand coredns_dns_responses_total with plugin label
This adds (somewhat hacky?) code to add a plugin label to the coredns_dns_responses_total metric. It's completely oblivious to the plugin as we just check who called the *recorder.WriteMsg method. We use runtime.Caller(1), runtime.Caller(2) and runtime.Caller(3) to get multiple levels of callers; this should be deep enough, but it depends on the dns.ResponseWriter wrapping that's occurring. The README.md of metrics is updated and a test is added in test/metrics_test.go to check for the label being set. I went through the plugins to see what metrics could be removed, but actually didn't find any; the plugins push out metrics that make sense. Due to the path fiddling to figure out the plugin name I doubt this works (out-of-the-box) for external plugins, but I haven't tested that. Signed-off-by: Miek Gieben <miek@miek.nl>
This commit is contained in:
@@ -328,7 +328,7 @@ func errorAndMetricsFunc(server string, w dns.ResponseWriter, r *dns.Msg, rc int
|
|||||||
answer.SetRcode(r, rc)
|
answer.SetRcode(r, rc)
|
||||||
state.SizeAndDo(answer)
|
state.SizeAndDo(answer)
|
||||||
|
|
||||||
vars.Report(server, state, vars.Dropped, rcode.ToString(rc), answer.Len(), time.Now())
|
vars.Report(server, state, vars.Dropped, rcode.ToString(rc), "", answer.Len(), time.Now())
|
||||||
|
|
||||||
w.WriteMsg(answer)
|
w.WriteMsg(answer)
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -17,7 +17,7 @@ The following metrics are exported:
|
|||||||
* `coredns_dns_request_size_bytes{server, zone, proto}` - size of the request in bytes.
|
* `coredns_dns_request_size_bytes{server, zone, proto}` - size of the request in bytes.
|
||||||
* `coredns_dns_do_requests_total{server, zone}` - queries that have the DO bit set
|
* `coredns_dns_do_requests_total{server, zone}` - queries that have the DO bit set
|
||||||
* `coredns_dns_response_size_bytes{server, zone, proto}` - response size in bytes.
|
* `coredns_dns_response_size_bytes{server, zone, proto}` - response size in bytes.
|
||||||
* `coredns_dns_responses_total{server, zone, rcode}` - response per zone and rcode.
|
* `coredns_dns_responses_total{server, zone, rcode, plugin}` - response per zone, rcode and plugin.
|
||||||
* `coredns_plugin_enabled{server, zone, name}` - indicates whether a plugin is enabled on per server and zone basis.
|
* `coredns_plugin_enabled{server, zone, name}` - indicates whether a plugin is enabled on per server and zone basis.
|
||||||
|
|
||||||
Each counter has a label `zone` which is the zonename used for the request/response.
|
Each counter has a label `zone` which is the zonename used for the request/response.
|
||||||
@@ -32,6 +32,8 @@ Extra labels used are:
|
|||||||
* `type` which holds the query type. It holds most common types (A, AAAA, MX, SOA, CNAME, PTR, TXT,
|
* `type` which holds the query type. It holds most common types (A, AAAA, MX, SOA, CNAME, PTR, TXT,
|
||||||
NS, SRV, DS, DNSKEY, RRSIG, NSEC, NSEC3, IXFR, AXFR and ANY) and "other" which lumps together all
|
NS, SRV, DS, DNSKEY, RRSIG, NSEC, NSEC3, IXFR, AXFR and ANY) and "other" which lumps together all
|
||||||
other types.
|
other types.
|
||||||
|
* the `plugin` label holds the name of the plugin that made the write to the client. If the server
|
||||||
|
did the write (on error for instance), the value is empty.
|
||||||
|
|
||||||
If monitoring is enabled, queries that do not enter the plugin chain are exported under the fake
|
If monitoring is enabled, queries that do not enter the plugin chain are exported under the fake
|
||||||
name "dropped" (without a closing dot - this is never a valid domain name).
|
name "dropped" (without a closing dot - this is never a valid domain name).
|
||||||
|
|||||||
@@ -2,6 +2,7 @@ package metrics
|
|||||||
|
|
||||||
import (
|
import (
|
||||||
"context"
|
"context"
|
||||||
|
"path/filepath"
|
||||||
|
|
||||||
"github.com/coredns/coredns/plugin"
|
"github.com/coredns/coredns/plugin"
|
||||||
"github.com/coredns/coredns/plugin/metrics/vars"
|
"github.com/coredns/coredns/plugin/metrics/vars"
|
||||||
@@ -33,10 +34,32 @@ func (m *Metrics) ServeDNS(ctx context.Context, w dns.ResponseWriter, r *dns.Msg
|
|||||||
// see https://github.com/coredns/coredns/blob/master/core/dnsserver/server.go#L318
|
// see https://github.com/coredns/coredns/blob/master/core/dnsserver/server.go#L318
|
||||||
rc = status
|
rc = status
|
||||||
}
|
}
|
||||||
vars.Report(WithServer(ctx), state, zone, rcode.ToString(rc), rw.Len, rw.Start)
|
plugin := m.authoritativePlugin(rw.Caller1, rw.Caller2, rw.Caller3)
|
||||||
|
vars.Report(WithServer(ctx), state, zone, rcode.ToString(rc), plugin, rw.Len, rw.Start)
|
||||||
|
|
||||||
return status, err
|
return status, err
|
||||||
}
|
}
|
||||||
|
|
||||||
// Name implements the Handler interface.
|
// Name implements the Handler interface.
|
||||||
func (m *Metrics) Name() string { return "prometheus" }
|
func (m *Metrics) Name() string { return "prometheus" }
|
||||||
|
|
||||||
|
// authoritativePlugin returns which of made the write, if none is found the empty string is returned.
|
||||||
|
func (m *Metrics) authoritativePlugin(a, b, c string) string {
|
||||||
|
// a b and c contain the full path of the caller, the plugin name 2nd last elements
|
||||||
|
// .../coredns/plugin/whoami/whoami.go --> whoami
|
||||||
|
// this is likely FS specific, so use filepath.
|
||||||
|
plug := filepath.Base(filepath.Dir(a))
|
||||||
|
if _, ok := m.plugins[plug]; ok {
|
||||||
|
return plug
|
||||||
|
}
|
||||||
|
plug = filepath.Base(filepath.Dir(b))
|
||||||
|
if _, ok := m.plugins[plug]; ok {
|
||||||
|
return plug
|
||||||
|
}
|
||||||
|
plug = filepath.Base(filepath.Dir(c))
|
||||||
|
if _, ok := m.plugins[plug]; ok {
|
||||||
|
return plug
|
||||||
|
}
|
||||||
|
|
||||||
|
return ""
|
||||||
|
}
|
||||||
|
|||||||
@@ -8,6 +8,7 @@ import (
|
|||||||
"sync"
|
"sync"
|
||||||
"time"
|
"time"
|
||||||
|
|
||||||
|
"github.com/coredns/caddy"
|
||||||
"github.com/coredns/coredns/plugin"
|
"github.com/coredns/coredns/plugin"
|
||||||
"github.com/coredns/coredns/plugin/pkg/reuseport"
|
"github.com/coredns/coredns/plugin/pkg/reuseport"
|
||||||
|
|
||||||
@@ -31,6 +32,8 @@ type Metrics struct {
|
|||||||
zoneNames []string
|
zoneNames []string
|
||||||
zoneMap map[string]struct{}
|
zoneMap map[string]struct{}
|
||||||
zoneMu sync.RWMutex
|
zoneMu sync.RWMutex
|
||||||
|
|
||||||
|
plugins map[string]struct{} // all available plugins, used to determine which plugin made the client write
|
||||||
}
|
}
|
||||||
|
|
||||||
// New returns a new instance of Metrics with the given address.
|
// New returns a new instance of Metrics with the given address.
|
||||||
@@ -39,6 +42,7 @@ func New(addr string) *Metrics {
|
|||||||
Addr: addr,
|
Addr: addr,
|
||||||
Reg: prometheus.DefaultRegisterer.(*prometheus.Registry),
|
Reg: prometheus.DefaultRegisterer.(*prometheus.Registry),
|
||||||
zoneMap: make(map[string]struct{}),
|
zoneMap: make(map[string]struct{}),
|
||||||
|
plugins: pluginList(caddy.ListPlugins()),
|
||||||
}
|
}
|
||||||
|
|
||||||
return met
|
return met
|
||||||
@@ -140,6 +144,19 @@ func keys(m map[string]struct{}) []string {
|
|||||||
return sx
|
return sx
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// pluginList builds a set of plugin names from the plugin map returned by caddy. Only the
// entries listed under the "others" key that start with the "dns." prefix are kept, and they
// are stored with that prefix removed. The returned map is never nil.
func pluginList(m map[string][]string) map[string]struct{} {
	const prefix = "dns."

	others := m["others"]
	pm := make(map[string]struct{}, len(others))
	for _, p := range others {
		// Only add 'dns.' plugins. Checking the prefix itself, rather than just the length,
		// keeps unrelated entries from being truncated into bogus plugin names; requiring at
		// least one character after the prefix avoids registering an empty name.
		if len(p) <= len(prefix) || p[:len(prefix)] != prefix {
			continue
		}
		pm[p[len(prefix):]] = struct{}{}
	}
	return pm
}
|
||||||
|
|
||||||
// ListenAddr is assigned the address of the prometheus listener. Its use is mainly in tests where
|
// ListenAddr is assigned the address of the prometheus listener. Its use is mainly in tests where
|
||||||
// we listen on "localhost:0" and need to retrieve the actual address.
|
// we listen on "localhost:0" and need to retrieve the actual address.
|
||||||
var ListenAddr string
|
var ListenAddr string
|
||||||
|
|||||||
@@ -9,7 +9,7 @@ import (
|
|||||||
// Report reports the metrics data associated with request. This function is exported because it is also
|
// Report reports the metrics data associated with request. This function is exported because it is also
|
||||||
// called from core/dnsserver to report requests hitting the server that should not be handled and are thus
|
// called from core/dnsserver to report requests hitting the server that should not be handled and are thus
|
||||||
// not sent down the plugin chain.
|
// not sent down the plugin chain.
|
||||||
func Report(server string, req request.Request, zone, rcode string, size int, start time.Time) {
|
func Report(server string, req request.Request, zone, rcode, plugin string, size int, start time.Time) {
|
||||||
// Proto and Family.
|
// Proto and Family.
|
||||||
net := req.Proto()
|
net := req.Proto()
|
||||||
fam := "1"
|
fam := "1"
|
||||||
@@ -29,5 +29,5 @@ func Report(server string, req request.Request, zone, rcode string, size int, st
|
|||||||
ResponseSize.WithLabelValues(server, zone, net).Observe(float64(size))
|
ResponseSize.WithLabelValues(server, zone, net).Observe(float64(size))
|
||||||
RequestSize.WithLabelValues(server, zone, net).Observe(float64(req.Len()))
|
RequestSize.WithLabelValues(server, zone, net).Observe(float64(req.Len()))
|
||||||
|
|
||||||
ResponseRcode.WithLabelValues(server, zone, rcode).Inc()
|
ResponseRcode.WithLabelValues(server, zone, rcode, plugin).Inc()
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -52,7 +52,7 @@ var (
|
|||||||
Subsystem: subsystem,
|
Subsystem: subsystem,
|
||||||
Name: "responses_total",
|
Name: "responses_total",
|
||||||
Help: "Counter of response status codes.",
|
Help: "Counter of response status codes.",
|
||||||
}, []string{"server", "zone", "rcode"})
|
}, []string{"server", "zone", "rcode", "plugin"})
|
||||||
|
|
||||||
Panic = promauto.NewCounter(prometheus.CounterOpts{
|
Panic = promauto.NewCounter(prometheus.CounterOpts{
|
||||||
Namespace: plugin.Namespace,
|
Namespace: plugin.Namespace,
|
||||||
|
|||||||
@@ -2,6 +2,7 @@
|
|||||||
package dnstest
|
package dnstest
|
||||||
|
|
||||||
import (
|
import (
|
||||||
|
"runtime"
|
||||||
"time"
|
"time"
|
||||||
|
|
||||||
"github.com/miekg/dns"
|
"github.com/miekg/dns"
|
||||||
@@ -19,6 +20,10 @@ type Recorder struct {
|
|||||||
Len int
|
Len int
|
||||||
Msg *dns.Msg
|
Msg *dns.Msg
|
||||||
Start time.Time
|
Start time.Time
|
||||||
|
// CallerN holds the file name returned by a call to runtime.Caller(N) made from WriteMsg.
|
||||||
|
Caller1 string
|
||||||
|
Caller2 string
|
||||||
|
Caller3 string
|
||||||
}
|
}
|
||||||
|
|
||||||
// NewRecorder makes and returns a new Recorder,
|
// NewRecorder makes and returns a new Recorder,
|
||||||
@@ -36,7 +41,9 @@ func NewRecorder(w dns.ResponseWriter) *Recorder {
|
|||||||
// WriteMsg records the status code and calls the
|
// WriteMsg records the status code and calls the
|
||||||
// underlying ResponseWriter's WriteMsg method.
|
// underlying ResponseWriter's WriteMsg method.
|
||||||
func (r *Recorder) WriteMsg(res *dns.Msg) error {
|
func (r *Recorder) WriteMsg(res *dns.Msg) error {
|
||||||
r.Rcode = res.Rcode
|
_, r.Caller1, _, _ = runtime.Caller(1)
|
||||||
|
_, r.Caller2, _, _ = runtime.Caller(2)
|
||||||
|
_, r.Caller3, _, _ = runtime.Caller(3)
|
||||||
// We may get called multiple times (axfr for instance).
|
// We may get called multiple times (axfr for instance).
|
||||||
// Save the last message, but add the sizes.
|
// Save the last message, but add the sizes.
|
||||||
r.Len += res.Len()
|
r.Len += res.Len()
|
||||||
|
|||||||
@@ -68,6 +68,34 @@ func TestMetricsRefused(t *testing.T) {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
func TestMetricsPlugin(t *testing.T) {
|
||||||
|
metricName := "coredns_dns_responses_total"
|
||||||
|
corefile := `example.org:0 {
|
||||||
|
whoami
|
||||||
|
prometheus localhost:0
|
||||||
|
}`
|
||||||
|
|
||||||
|
srv, udp, _, err := CoreDNSServerAndPorts(corefile)
|
||||||
|
if err != nil {
|
||||||
|
t.Fatalf("Could not get CoreDNS serving instance: %s", err)
|
||||||
|
}
|
||||||
|
defer srv.Stop()
|
||||||
|
|
||||||
|
m := new(dns.Msg)
|
||||||
|
m.SetQuestion("example.org.", dns.TypeA)
|
||||||
|
|
||||||
|
if _, err = dns.Exchange(m, udp); err != nil {
|
||||||
|
t.Fatalf("Could not send message: %s", err)
|
||||||
|
}
|
||||||
|
|
||||||
|
data := test.Scrape("http://" + metrics.ListenAddr + "/metrics")
|
||||||
|
_, labels := test.MetricValue(metricName, data)
|
||||||
|
|
||||||
|
if labels["plugin"] != "whoami" {
|
||||||
|
t.Errorf("Expected plugin value %s, but got %s", "whoami", labels["whoami"])
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
func TestMetricsAuto(t *testing.T) {
|
func TestMetricsAuto(t *testing.T) {
|
||||||
tmpdir, err := ioutil.TempDir(os.TempDir(), "coredns")
|
tmpdir, err := ioutil.TempDir(os.TempDir(), "coredns")
|
||||||
if err != nil {
|
if err != nil {
|
||||||
|
|||||||
Reference in New Issue
Block a user