Files
coredns/plugin/metrics/metrics_test.go

218 lines
5.4 KiB
Go
Raw Normal View History

package metrics
import (
"context"
"io"
"net"
"net/http"
"testing"
"time"
"github.com/coredns/coredns/plugin"
"github.com/coredns/coredns/plugin/pkg/dnstest"
"github.com/coredns/coredns/plugin/test"
"github.com/miekg/dns"
"github.com/prometheus/client_golang/prometheus"
"github.com/prometheus/client_golang/prometheus/promauto"
)
func TestMetrics(t *testing.T) {
met := New("localhost:0")
if err := met.OnStartup(); err != nil {
t.Fatalf("Failed to start metrics handler: %s", err)
}
reload: use OnRestart (#1709) * reload: use OnRestart Close the listener on OnRestart for health and metrics so the default setup function can setup the listener when the plugin is "starting up". Lightly test with some SIGUSR1-ing. Also checked the reload plugin with this, seems fine: .com.:1043 .:1043 2018/04/20 15:01:25 [INFO] CoreDNS-1.1.1 2018/04/20 15:01:25 [INFO] linux/amd64, go1.10, CoreDNS-1.1.1 linux/amd64, go1.10, 2018/04/20 15:01:25 [INFO] Running configuration MD5 = aa8b3f03946fb60546ca1f725d482714 2018/04/20 15:02:01 [INFO] Reloading 2018/04/20 15:02:01 [INFO] Running configuration MD5 = b34a96d99e01db4015a892212560155f 2018/04/20 15:02:01 [INFO] Reloading complete ^C2018/04/20 15:02:06 [INFO] SIGINT: Shutting down With this corefile: .com { proxy . 127.0.0.1:53 prometheus :9054 whoami reload } . { proxy . 127.0.0.1:53 prometheus :9054 whoami reload } The prometheus port was 9053, changed that to 54 so reload would pick it up. From a cursory look it seems this also fixes: Fixes #1604 #1618 #1686 #1492 * At least make it test * Use onfinalshutdown * reload: add reload test This test #1604 adn right now fails. * Address review comments * Add bug section explaining things a bit * compile tests * Fix tests * fixes * slightly less crazy * try to make prometheus setup less confusing * Use ephermal port for test * Don't use the listener * These are shared between goroutines, just use the boolean in the main structure. * Fix text in the reload README, * Set addr to TODO once stopping it * Morph fturb's comment into test, to test reload and scrape health and metric endpoint
2018-04-21 17:43:02 +01:00
defer met.OnFinalShutdown()
met.AddZone("example.org.")
tests := []struct {
next plugin.Handler
qname string
qtype uint16
metric string
expectedValue string
}{
// This all works because 1 bucket (1 zone, 1 type)
{
next: test.NextHandler(dns.RcodeSuccess, nil),
qname: "example.org.",
metric: "coredns_dns_requests_total",
expectedValue: "1",
},
{
next: test.NextHandler(dns.RcodeSuccess, nil),
qname: "example.org.",
metric: "coredns_dns_requests_total",
expectedValue: "2",
},
{
next: test.NextHandler(dns.RcodeSuccess, nil),
qname: "example.org.",
metric: "coredns_dns_requests_total",
expectedValue: "3",
},
{
next: test.NextHandler(dns.RcodeSuccess, nil),
qname: "example.org.",
metric: "coredns_dns_responses_total",
expectedValue: "4",
},
}
ctx := context.TODO()
for i, tc := range tests {
req := new(dns.Msg)
if tc.qtype == 0 {
tc.qtype = dns.TypeA
}
req.SetQuestion(tc.qname, tc.qtype)
met.Next = tc.next
rec := dnstest.NewRecorder(&test.ResponseWriter{})
_, err := met.ServeDNS(ctx, rec, req)
if err != nil {
t.Fatalf("Test %d: Expected no error, but got %s", i, err)
}
result := test.Scrape("http://" + ListenAddr + "/metrics")
if tc.expectedValue != "" {
got, _ := test.MetricValue(tc.metric, result)
if got != tc.expectedValue {
t.Errorf("Test %d: Expected value %s for metrics %s, but got %s", i, tc.expectedValue, tc.metric, got)
}
}
}
}
// TestMetricsHTTPTimeout opens a raw TCP connection to the metrics endpoint,
// sends request headers that announce a 100-byte body without ever sending the
// body, and then expects the blocked read on the connection to complete before
// a 10 second deadline. Failing to connect or to send the request is reported
// as a test failure rather than being mistaken for a server-side timeout.
func TestMetricsHTTPTimeout(t *testing.T) {
	met := New("localhost:0")
	if err := met.OnStartup(); err != nil {
		t.Fatalf("Failed to start metrics handler: %s", err)
	}
	defer met.OnFinalShutdown()

	// Use context with timeout to prevent test from hanging indefinitely
	ctx, cancel := context.WithTimeout(context.Background(), 10*time.Second)
	defer cancel()

	// Setup happens on the test goroutine so that a dial or write failure
	// fails the test instead of being counted as a successful timeout.
	var dialer net.Dialer
	conn, err := dialer.DialContext(ctx, "tcp", ListenAddr)
	if err != nil {
		t.Fatalf("Failed to connect to metrics server: %s", err)
	}
	// Closing the connection on return also unblocks the reader goroutine
	// below if the deadline fires first, so it never outlives the test.
	defer conn.Close()

	// Send partial HTTP request and then stop sending data.
	// The intent is for the server to give up on the connection by itself.
	partialRequest := "GET /metrics HTTP/1.1\r\nHost: " + ListenAddr + "\r\nContent-Length: 100\r\n\r\n"
	if _, err := conn.Write([]byte(partialRequest)); err != nil {
		t.Fatalf("Failed to send partial request: %s", err)
	}

	// Buffered so the reader can always deliver its result and exit, even
	// when nobody is receiving any more.
	done := make(chan error, 1)
	go func() {
		// Blocks until the server answers or drops the connection, or until
		// the deferred conn.Close above runs.
		buffer := make([]byte, 1024)
		_, err := conn.Read(buffer)
		done <- err
	}()

	select {
	case err := <-done:
		t.Logf("HTTP request timed out by server (read returned: %v)", err)
	case <-ctx.Done():
		t.Error("HTTP request did not time out")
	}
}
// TestMustRegister_DuplicateOK hands the same gauge vector to MustRegister
// twice on a fresh registry; the test passes as long as neither call panics.
func TestMustRegister_DuplicateOK(t *testing.T) {
	m := New("localhost:0")
	m.Reg = prometheus.NewRegistry()

	opts := prometheus.GaugeOpts{Namespace: "test", Name: "dup"}
	gauge := promauto.NewGaugeVec(opts, []string{"l"})

	// First pass registers the collector. The second pass repeats the call,
	// which is expected to hit AlreadyRegisteredError internally and be ignored.
	for attempt := 0; attempt < 2; attempt++ {
		m.MustRegister(gauge)
	}
}
// TestRemoveZone adds two zones, removes one of them, and fails if the removed
// zone is still listed by ZoneNames.
func TestRemoveZone(t *testing.T) {
	const removed = "example.net."

	m := New("localhost:0")
	m.AddZone("example.org.")
	m.AddZone(removed)
	m.RemoveZone(removed)

	for _, name := range m.ZoneNames() {
		if name != removed {
			continue
		}
		t.Fatalf("zone %q still present after RemoveZone", name)
	}
}
// TestOnRestartStopsServer checks that the metrics endpoint answers an HTTP GET
// after OnStartup and that a GET to the same address fails once OnRestart has
// returned.
func TestOnRestartStopsServer(t *testing.T) {
	met := New("localhost:0")
	if err := met.OnStartup(); err != nil {
		t.Fatalf("startup failed: %v", err)
	}

	// Build the URL once so both requests hit the address the server was
	// started on, regardless of what happens to ListenAddr during restart.
	endpoint := "http://" + ListenAddr + "/metrics"

	// A bounded client keeps a misbehaving server from hanging the test.
	client := &http.Client{Timeout: 10 * time.Second}

	// server should respond before restart
	resp, err := client.Get(endpoint)
	if err != nil {
		t.Fatalf("pre-restart GET failed: %v", err)
	}
	// Drain and close so the connection is released cleanly; the drain is
	// best-effort, the body content itself is not under test.
	io.Copy(io.Discard, resp.Body)
	resp.Body.Close()

	if err := met.OnRestart(); err != nil {
		t.Fatalf("restart failed: %v", err)
	}

	// after restart, the listener should be closed and request should fail
	resp, err = client.Get(endpoint)
	if err == nil {
		// Do not leak the body of the response that should not exist.
		resp.Body.Close()
		t.Fatalf("expected GET to fail after restart, but it succeeded")
	}
}
// TestRegistryGetOrSet checks that getOrSet returns the registry supplied on
// the first call for an address, and keeps returning that same registry when a
// different one is offered for the same address later.
func TestRegistryGetOrSet(t *testing.T) {
	const addr = "localhost:12345"
	reg := newReg()

	first := prometheus.NewRegistry()
	if got := reg.getOrSet(addr, first); got != first {
		t.Fatalf("first getOrSet should return provided registry")
	}

	// A second, distinct registry for the same address must not replace the
	// one already stored.
	second := prometheus.NewRegistry()
	if got := reg.getOrSet(addr, second); got != first {
		t.Fatalf("second getOrSet should return original registry, got different one")
	}
}
// TestOnRestartNoop calls OnRestart on a handler that was never started and
// expects it to return without an error.
func TestOnRestartNoop(t *testing.T) {
	m := New("localhost:0")

	// OnStartup is deliberately skipped, so there is nothing to restart.
	err := m.OnRestart()
	if err != nil {
		t.Fatalf("OnRestart returned error on no-op: %v", err)
	}
}
// TestContextHelpersEmpty checks that WithServer and WithView both return the
// empty string for a context that carries no values.
func TestContextHelpersEmpty(t *testing.T) {
	// context.TODO() is an empty, non-nil context; the failure messages name
	// it explicitly so they describe the call that was actually made.
	ctx := context.TODO()

	if got := WithServer(ctx); got != "" {
		t.Fatalf("WithServer(context.TODO()) = %q, want empty", got)
	}
	if got := WithView(ctx); got != "" {
		t.Fatalf("WithView(context.TODO()) = %q, want empty", got)
	}
}