mirror of
https://github.com/coredns/coredns.git
synced 2025-10-28 00:34:24 -04:00
plugin/health: add lameduck mode (#1379)
* plugin/health: add lameduck mode Add a way to configure lameduck more, i.e. set health to false, stop polling plugins. Then wait for a duration before shutting down. As the health middleware is configured early on in the plugin list, it will hold up all other shutdown, meaning we still answer queries. * Add New * More tests * golint * remove confusing text
This commit is contained in:
@@ -21,6 +21,17 @@ a 503. *health* periodically (1s) polls plugin that exports health information.
|
|||||||
plugin signals that it is unhealthy, the server will go unhealthy too. Each plugin that
|
plugin signals that it is unhealthy, the server will go unhealthy too. Each plugin that
|
||||||
supports health checks has a section "Health" in their README.
|
supports health checks has a section "Health" in their README.
|
||||||
|
|
||||||
|
More options can be set with this extended syntax:
|
||||||
|
|
||||||
|
~~~
|
||||||
|
health [ADDRESS] {
|
||||||
|
lameduck DURATION
|
||||||
|
}
|
||||||
|
~~~
|
||||||
|
|
||||||
|
* Where `lameduck` will make the process unhealthy then *wait* for **DURATION** before the process
|
||||||
|
shuts down.
|
||||||
|
|
||||||
## Plugins
|
## Plugins
|
||||||
|
|
||||||
Any plugin that implements the Healther interface will be used to report health.
|
Any plugin that implements the Healther interface will be used to report health.
|
||||||
@@ -42,3 +53,13 @@ Run another health endpoint on http://localhost:8091.
|
|||||||
health localhost:8091
|
health localhost:8091
|
||||||
}
|
}
|
||||||
~~~
|
~~~
|
||||||
|
|
||||||
|
Set a lameduck duration of 1 second:
|
||||||
|
|
||||||
|
~~~ corefile
|
||||||
|
. {
|
||||||
|
health localhost:8091 {
|
||||||
|
lameduck 1s
|
||||||
|
}
|
||||||
|
}
|
||||||
|
~~~
|
||||||
|
|||||||
@@ -7,12 +7,15 @@ import (
|
|||||||
"net"
|
"net"
|
||||||
"net/http"
|
"net/http"
|
||||||
"sync"
|
"sync"
|
||||||
|
"time"
|
||||||
)
|
)
|
||||||
|
|
||||||
var once sync.Once
|
var once sync.Once
|
||||||
|
|
||||||
|
// Health implements healthchecks by polling plugins.
|
||||||
type health struct {
|
type health struct {
|
||||||
Addr string
|
Addr string
|
||||||
|
lameduck time.Duration
|
||||||
|
|
||||||
ln net.Listener
|
ln net.Listener
|
||||||
mux *http.ServeMux
|
mux *http.ServeMux
|
||||||
@@ -22,7 +25,13 @@ type health struct {
|
|||||||
sync.RWMutex
|
sync.RWMutex
|
||||||
ok bool // ok is the global boolean indicating an all healthy plugin stack
|
ok bool // ok is the global boolean indicating an all healthy plugin stack
|
||||||
|
|
||||||
stop chan bool
|
stop chan bool
|
||||||
|
pollstop chan bool
|
||||||
|
}
|
||||||
|
|
||||||
|
// newHealth returns a new initialized health.
|
||||||
|
func newHealth(addr string) *health {
|
||||||
|
return &health{Addr: addr, stop: make(chan bool), pollstop: make(chan bool)}
|
||||||
}
|
}
|
||||||
|
|
||||||
func (h *health) OnStartup() error {
|
func (h *health) OnStartup() error {
|
||||||
@@ -61,12 +70,21 @@ func (h *health) OnStartup() error {
|
|||||||
}
|
}
|
||||||
|
|
||||||
func (h *health) OnShutdown() error {
|
func (h *health) OnShutdown() error {
|
||||||
|
// Stop polling plugins
|
||||||
|
h.pollstop <- true
|
||||||
|
// NACK health
|
||||||
|
h.SetOk(false)
|
||||||
|
|
||||||
|
if h.lameduck > 0 {
|
||||||
|
log.Printf("[INFO] Going into lameduck mode for %s", h.lameduck)
|
||||||
|
time.Sleep(h.lameduck)
|
||||||
|
}
|
||||||
|
|
||||||
if h.ln != nil {
|
if h.ln != nil {
|
||||||
return h.ln.Close()
|
return h.ln.Close()
|
||||||
}
|
}
|
||||||
|
|
||||||
h.stop <- true
|
h.stop <- true
|
||||||
|
|
||||||
return nil
|
return nil
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|||||||
@@ -5,12 +5,13 @@ import (
|
|||||||
"io/ioutil"
|
"io/ioutil"
|
||||||
"net/http"
|
"net/http"
|
||||||
"testing"
|
"testing"
|
||||||
|
"time"
|
||||||
|
|
||||||
"github.com/coredns/coredns/plugin/erratic"
|
"github.com/coredns/coredns/plugin/erratic"
|
||||||
)
|
)
|
||||||
|
|
||||||
func TestHealth(t *testing.T) {
|
func TestHealth(t *testing.T) {
|
||||||
h := health{Addr: ":0"}
|
h := newHealth(":0")
|
||||||
h.h = append(h.h, &erratic.Erratic{})
|
h.h = append(h.h, &erratic.Erratic{})
|
||||||
|
|
||||||
if err := h.OnStartup(); err != nil {
|
if err := h.OnStartup(); err != nil {
|
||||||
@@ -18,6 +19,11 @@ func TestHealth(t *testing.T) {
|
|||||||
}
|
}
|
||||||
defer h.OnShutdown()
|
defer h.OnShutdown()
|
||||||
|
|
||||||
|
go func() {
|
||||||
|
<-h.pollstop
|
||||||
|
return
|
||||||
|
}()
|
||||||
|
|
||||||
// Reconstruct the http address based on the port allocated by operating system.
|
// Reconstruct the http address based on the port allocated by operating system.
|
||||||
address := fmt.Sprintf("http://%s%s", h.ln.Addr().String(), path)
|
address := fmt.Sprintf("http://%s%s", h.ln.Addr().String(), path)
|
||||||
|
|
||||||
@@ -50,3 +56,22 @@ func TestHealth(t *testing.T) {
|
|||||||
t.Errorf("Invalid response body: expecting 'OK', got '%s'", string(content))
|
t.Errorf("Invalid response body: expecting 'OK', got '%s'", string(content))
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
func TestHealthLameduck(t *testing.T) {
|
||||||
|
h := newHealth(":0")
|
||||||
|
h.lameduck = 250 * time.Millisecond
|
||||||
|
h.h = append(h.h, &erratic.Erratic{})
|
||||||
|
|
||||||
|
if err := h.OnStartup(); err != nil {
|
||||||
|
t.Fatalf("Unable to startup the health server: %v", err)
|
||||||
|
}
|
||||||
|
|
||||||
|
// Both these things are behind a sync.Once, fake reading from the channels.
|
||||||
|
go func() {
|
||||||
|
<-h.pollstop
|
||||||
|
<-h.stop
|
||||||
|
return
|
||||||
|
}()
|
||||||
|
|
||||||
|
h.OnShutdown()
|
||||||
|
}
|
||||||
|
|||||||
@@ -1,6 +1,7 @@
|
|||||||
package health
|
package health
|
||||||
|
|
||||||
import (
|
import (
|
||||||
|
"fmt"
|
||||||
"net"
|
"net"
|
||||||
"time"
|
"time"
|
||||||
|
|
||||||
@@ -19,12 +20,13 @@ func init() {
|
|||||||
}
|
}
|
||||||
|
|
||||||
func setup(c *caddy.Controller) error {
|
func setup(c *caddy.Controller) error {
|
||||||
addr, err := healthParse(c)
|
addr, lame, err := healthParse(c)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
return plugin.Error("health", err)
|
return plugin.Error("health", err)
|
||||||
}
|
}
|
||||||
|
|
||||||
h := &health{Addr: addr, stop: make(chan bool)}
|
h := newHealth(addr)
|
||||||
|
h.lameduck = lame
|
||||||
|
|
||||||
c.OnStartup(func() error {
|
c.OnStartup(func() error {
|
||||||
plugins := dnsserver.GetConfig(c).Handlers()
|
plugins := dnsserver.GetConfig(c).Handlers()
|
||||||
@@ -41,8 +43,12 @@ func setup(c *caddy.Controller) error {
|
|||||||
h.poll()
|
h.poll()
|
||||||
go func() {
|
go func() {
|
||||||
for {
|
for {
|
||||||
<-time.After(1 * time.Second)
|
select {
|
||||||
h.poll()
|
case <-time.After(1 * time.Second):
|
||||||
|
h.poll()
|
||||||
|
case <-h.pollstop:
|
||||||
|
return
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}()
|
}()
|
||||||
return nil
|
return nil
|
||||||
@@ -68,8 +74,9 @@ func setup(c *caddy.Controller) error {
|
|||||||
return nil
|
return nil
|
||||||
}
|
}
|
||||||
|
|
||||||
func healthParse(c *caddy.Controller) (string, error) {
|
func healthParse(c *caddy.Controller) (string, time.Duration, error) {
|
||||||
addr := ""
|
addr := ""
|
||||||
|
dur := time.Duration(0)
|
||||||
for c.Next() {
|
for c.Next() {
|
||||||
args := c.RemainingArgs()
|
args := c.RemainingArgs()
|
||||||
|
|
||||||
@@ -78,11 +85,28 @@ func healthParse(c *caddy.Controller) (string, error) {
|
|||||||
case 1:
|
case 1:
|
||||||
addr = args[0]
|
addr = args[0]
|
||||||
if _, _, e := net.SplitHostPort(addr); e != nil {
|
if _, _, e := net.SplitHostPort(addr); e != nil {
|
||||||
return "", e
|
return "", 0, e
|
||||||
}
|
}
|
||||||
default:
|
default:
|
||||||
return "", c.ArgErr()
|
return "", 0, c.ArgErr()
|
||||||
|
}
|
||||||
|
|
||||||
|
for c.NextBlock() {
|
||||||
|
switch c.Val() {
|
||||||
|
case "lameduck":
|
||||||
|
args := c.RemainingArgs()
|
||||||
|
if len(args) != 1 {
|
||||||
|
return "", 0, c.ArgErr()
|
||||||
|
}
|
||||||
|
l, err := time.ParseDuration(args[0])
|
||||||
|
if err != nil {
|
||||||
|
return "", 0, fmt.Errorf("unable to parse lameduck duration value: '%v' : %v", args[0], err)
|
||||||
|
}
|
||||||
|
dur = l
|
||||||
|
default:
|
||||||
|
return "", 0, c.ArgErr()
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
return addr, nil
|
return addr, dur, nil
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -13,17 +13,27 @@ func TestSetupHealth(t *testing.T) {
|
|||||||
}{
|
}{
|
||||||
{`health`, false},
|
{`health`, false},
|
||||||
{`health localhost:1234`, false},
|
{`health localhost:1234`, false},
|
||||||
|
{`health localhost:1234 {
|
||||||
|
lameduck 4s
|
||||||
|
}`, false},
|
||||||
{`health bla:a`, false},
|
{`health bla:a`, false},
|
||||||
|
|
||||||
{`health bla`, true},
|
{`health bla`, true},
|
||||||
{`health bla bla`, true},
|
{`health bla bla`, true},
|
||||||
|
{`health localhost:1234 {
|
||||||
|
lameduck a
|
||||||
|
}`, true},
|
||||||
|
{`health localhost:1234 {
|
||||||
|
lamedudk 4
|
||||||
|
} `, true},
|
||||||
}
|
}
|
||||||
|
|
||||||
for i, test := range tests {
|
for i, test := range tests {
|
||||||
c := caddy.NewTestController("dns", test.input)
|
c := caddy.NewTestController("dns", test.input)
|
||||||
_, err := healthParse(c)
|
_, _, err := healthParse(c)
|
||||||
|
|
||||||
if test.shouldErr && err == nil {
|
if test.shouldErr && err == nil {
|
||||||
t.Errorf("Test %d: Expected error but found %s for input %s", i, err, test.input)
|
t.Errorf("Test %d: Expected error but found none for input %s", i, test.input)
|
||||||
}
|
}
|
||||||
|
|
||||||
if err != nil {
|
if err != nil {
|
||||||
|
|||||||
Reference in New Issue
Block a user