Files
coredns/plugin/metrics/metrics_test.go
Ville Vesilehto ba7d5ff55a test(metrics): improve test coverage (#7538)
Add more unit tests for metrics plugin, around registration
deduplication, zone management, restart/shutdown behavior and
context helpers.

Increases test coverage from 54.8% to 76.1%.

Signed-off-by: Ville Vesilehto <ville@vesilehto.fi>
2025-09-13 15:15:25 -07:00

218 lines
5.4 KiB
Go

package metrics
import (
"context"
"io"
"net"
"net/http"
"testing"
"time"
"github.com/coredns/coredns/plugin"
"github.com/coredns/coredns/plugin/pkg/dnstest"
"github.com/coredns/coredns/plugin/test"
"github.com/miekg/dns"
"github.com/prometheus/client_golang/prometheus"
"github.com/prometheus/client_golang/prometheus/promauto"
)
func TestMetrics(t *testing.T) {
met := New("localhost:0")
if err := met.OnStartup(); err != nil {
t.Fatalf("Failed to start metrics handler: %s", err)
}
defer met.OnFinalShutdown()
met.AddZone("example.org.")
tests := []struct {
next plugin.Handler
qname string
qtype uint16
metric string
expectedValue string
}{
// This all works because 1 bucket (1 zone, 1 type)
{
next: test.NextHandler(dns.RcodeSuccess, nil),
qname: "example.org.",
metric: "coredns_dns_requests_total",
expectedValue: "1",
},
{
next: test.NextHandler(dns.RcodeSuccess, nil),
qname: "example.org.",
metric: "coredns_dns_requests_total",
expectedValue: "2",
},
{
next: test.NextHandler(dns.RcodeSuccess, nil),
qname: "example.org.",
metric: "coredns_dns_requests_total",
expectedValue: "3",
},
{
next: test.NextHandler(dns.RcodeSuccess, nil),
qname: "example.org.",
metric: "coredns_dns_responses_total",
expectedValue: "4",
},
}
ctx := context.TODO()
for i, tc := range tests {
req := new(dns.Msg)
if tc.qtype == 0 {
tc.qtype = dns.TypeA
}
req.SetQuestion(tc.qname, tc.qtype)
met.Next = tc.next
rec := dnstest.NewRecorder(&test.ResponseWriter{})
_, err := met.ServeDNS(ctx, rec, req)
if err != nil {
t.Fatalf("Test %d: Expected no error, but got %s", i, err)
}
result := test.Scrape("http://" + ListenAddr + "/metrics")
if tc.expectedValue != "" {
got, _ := test.MetricValue(tc.metric, result)
if got != tc.expectedValue {
t.Errorf("Test %d: Expected value %s for metrics %s, but got %s", i, tc.expectedValue, tc.metric, got)
}
}
}
}
func TestMetricsHTTPTimeout(t *testing.T) {
met := New("localhost:0")
if err := met.OnStartup(); err != nil {
t.Fatalf("Failed to start metrics handler: %s", err)
}
defer met.OnFinalShutdown()
// Use context with timeout to prevent test from hanging indefinitely
ctx, cancel := context.WithTimeout(context.Background(), 10*time.Second)
defer cancel()
done := make(chan error, 1)
go func() {
conn, err := net.Dial("tcp", ListenAddr)
if err != nil {
done <- err
return
}
defer conn.Close()
// Send partial HTTP request and then stop sending data
// This will cause the server to wait for more data and hit ReadTimeout
partialRequest := "GET /metrics HTTP/1.1\r\nHost: " + ListenAddr + "\r\nContent-Length: 100\r\n\r\n"
_, err = conn.Write([]byte(partialRequest))
if err != nil {
done <- err
return
}
// Now just wait - server should timeout trying to read the remaining data
// If server has no ReadTimeout, this will hang indefinitely
buffer := make([]byte, 1024)
_, err = conn.Read(buffer)
done <- err
}()
select {
case <-done:
t.Log("HTTP request timed out by server")
case <-ctx.Done():
t.Error("HTTP request did not time out")
}
}
func TestMustRegister_DuplicateOK(t *testing.T) {
met := New("localhost:0")
met.Reg = prometheus.NewRegistry()
g := promauto.NewGaugeVec(prometheus.GaugeOpts{Namespace: "test", Name: "dup"}, []string{"l"})
met.MustRegister(g)
// registering the same collector again should yield AlreadyRegisteredError internally and be ignored
met.MustRegister(g)
}
func TestRemoveZone(t *testing.T) {
met := New("localhost:0")
met.AddZone("example.org.")
met.AddZone("example.net.")
met.RemoveZone("example.net.")
zones := met.ZoneNames()
for _, z := range zones {
if z == "example.net." {
t.Fatalf("zone %q still present after RemoveZone", z)
}
}
}
func TestOnRestartStopsServer(t *testing.T) {
met := New("localhost:0")
if err := met.OnStartup(); err != nil {
t.Fatalf("startup failed: %v", err)
}
// server should respond before restart
resp, err := http.Get("http://" + ListenAddr + "/metrics")
if err != nil {
t.Fatalf("pre-restart GET failed: %v", err)
}
if resp != nil {
io.Copy(io.Discard, resp.Body)
resp.Body.Close()
}
if err := met.OnRestart(); err != nil {
t.Fatalf("restart failed: %v", err)
}
// after restart, the listener should be closed and request should fail
if _, err := http.Get("http://" + ListenAddr + "/metrics"); err == nil {
t.Fatalf("expected GET to fail after restart, but it succeeded")
}
}
func TestRegistryGetOrSet(t *testing.T) {
r := newReg()
addr := "localhost:12345"
pr1 := prometheus.NewRegistry()
got1 := r.getOrSet(addr, pr1)
if got1 != pr1 {
t.Fatalf("first getOrSet should return provided registry")
}
pr2 := prometheus.NewRegistry()
got2 := r.getOrSet(addr, pr2)
if got2 != pr1 {
t.Fatalf("second getOrSet should return original registry, got different one")
}
}
func TestOnRestartNoop(t *testing.T) {
met := New("localhost:0")
// without OnStartup, OnRestart should be a no-op
if err := met.OnRestart(); err != nil {
t.Fatalf("OnRestart returned error on no-op: %v", err)
}
}
func TestContextHelpersEmpty(t *testing.T) {
if got := WithServer(context.TODO()); got != "" {
t.Fatalf("WithServer(nil) = %q, want empty", got)
}
if got := WithView(context.TODO()); got != "" {
t.Fatalf("WithView(nil) = %q, want empty", got)
}
}