2016-11-26 19:48:49 +01:00
|
|
|
package healthcheck
|
|
|
|
|
|
|
|
import (
|
2016-11-30 22:49:57 +01:00
|
|
|
"context"
|
2017-03-24 09:36:33 +01:00
|
|
|
"fmt"
|
2017-05-10 14:28:57 -04:00
|
|
|
"net"
|
2016-11-26 19:48:49 +01:00
|
|
|
"net/http"
|
|
|
|
"net/url"
|
2017-05-10 14:28:57 -04:00
|
|
|
"strconv"
|
2016-11-26 19:48:49 +01:00
|
|
|
"sync"
|
|
|
|
"time"
|
2017-01-31 22:55:02 +01:00
|
|
|
|
2018-01-26 11:58:03 +01:00
|
|
|
"github.com/go-kit/kit/metrics"
|
2020-09-16 15:46:04 +02:00
|
|
|
"github.com/traefik/traefik/v2/pkg/config/runtime"
|
|
|
|
"github.com/traefik/traefik/v2/pkg/log"
|
|
|
|
"github.com/traefik/traefik/v2/pkg/safe"
|
2017-01-31 22:55:02 +01:00
|
|
|
"github.com/vulcand/oxy/roundrobin"
|
2016-11-26 19:48:49 +01:00
|
|
|
)
|
|
|
|
|
2019-05-16 10:58:06 +02:00
|
|
|
const (
|
|
|
|
serverUp = "UP"
|
|
|
|
serverDown = "DOWN"
|
|
|
|
)
|
|
|
|
|
2020-07-07 14:42:03 +02:00
|
|
|
var (
|
|
|
|
singleton *HealthCheck
|
|
|
|
once sync.Once
|
|
|
|
)
|
2016-11-26 19:48:49 +01:00
|
|
|
|
2020-05-11 12:06:07 +02:00
|
|
|
// Balancer is the set of operations required to manage the list of servers in a load-balancer.
|
2019-11-29 12:40:05 +01:00
|
|
|
type Balancer interface {
|
2018-06-11 11:36:03 +02:00
|
|
|
Servers() []*url.URL
|
|
|
|
RemoveServer(u *url.URL) error
|
|
|
|
UpsertServer(u *url.URL, options ...roundrobin.ServerOption) error
|
|
|
|
}
|
|
|
|
|
2019-11-29 12:40:05 +01:00
|
|
|
// BalancerHandler includes functionality for load-balancing management.
|
|
|
|
type BalancerHandler interface {
|
|
|
|
ServeHTTP(w http.ResponseWriter, req *http.Request)
|
|
|
|
Balancer
|
|
|
|
}
|
|
|
|
|
2020-05-11 12:06:07 +02:00
|
|
|
// metricsRegistry is a local interface in the health check package,
|
|
|
|
// exposing only the required metrics necessary for the health check package.
|
|
|
|
// This makes it easier for the tests.
|
2018-06-11 11:36:03 +02:00
|
|
|
type metricsRegistry interface {
|
|
|
|
BackendServerUpGauge() metrics.Gauge
|
2016-11-26 19:48:49 +01:00
|
|
|
}
|
|
|
|
|
2017-03-15 19:16:06 +01:00
|
|
|
// Options are the public health check options.
|
|
|
|
type Options struct {
|
2020-02-26 17:28:04 +01:00
|
|
|
Headers map[string]string
|
|
|
|
Hostname string
|
|
|
|
Scheme string
|
|
|
|
Path string
|
|
|
|
Port int
|
|
|
|
FollowRedirects bool
|
|
|
|
Transport http.RoundTripper
|
|
|
|
Interval time.Duration
|
|
|
|
Timeout time.Duration
|
|
|
|
LB Balancer
|
2017-03-15 19:16:06 +01:00
|
|
|
}
|
|
|
|
|
2017-03-24 09:36:33 +01:00
|
|
|
func (opt Options) String() string {
|
2020-02-26 17:28:04 +01:00
|
|
|
return fmt.Sprintf("[Hostname: %s Headers: %v Path: %s Port: %d Interval: %s Timeout: %s FollowRedirects: %v]", opt.Hostname, opt.Headers, opt.Path, opt.Port, opt.Interval, opt.Timeout, opt.FollowRedirects)
|
2017-03-24 09:36:33 +01:00
|
|
|
}
|
|
|
|
|
2019-08-07 08:14:04 -07:00
|
|
|
type backendURL struct {
|
|
|
|
url *url.URL
|
|
|
|
weight int
|
|
|
|
}
|
|
|
|
|
2020-05-11 12:06:07 +02:00
|
|
|
// BackendConfig HealthCheck configuration for a backend.
|
2018-06-11 11:36:03 +02:00
|
|
|
type BackendConfig struct {
|
2017-03-15 19:16:06 +01:00
|
|
|
Options
|
2018-11-27 17:42:04 +01:00
|
|
|
name string
|
2019-08-07 08:14:04 -07:00
|
|
|
disabledURLs []backendURL
|
2016-11-26 19:48:49 +01:00
|
|
|
}
|
|
|
|
|
2018-06-11 11:36:03 +02:00
|
|
|
func (b *BackendConfig) newRequest(serverURL *url.URL) (*http.Request, error) {
|
2018-11-15 15:50:03 +01:00
|
|
|
u, err := serverURL.Parse(b.Path)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2016-11-26 19:48:49 +01:00
|
|
|
|
2018-06-11 11:36:03 +02:00
|
|
|
if len(b.Scheme) > 0 {
|
|
|
|
u.Scheme = b.Scheme
|
|
|
|
}
|
2016-11-26 19:48:49 +01:00
|
|
|
|
2018-06-11 11:36:03 +02:00
|
|
|
if b.Port != 0 {
|
|
|
|
u.Host = net.JoinHostPort(u.Hostname(), strconv.Itoa(b.Port))
|
2017-03-09 16:27:31 +01:00
|
|
|
}
|
2016-11-26 19:48:49 +01:00
|
|
|
|
2018-10-23 10:10:04 +02:00
|
|
|
return http.NewRequest(http.MethodGet, u.String(), http.NoBody)
|
2018-01-26 11:58:03 +01:00
|
|
|
}
|
|
|
|
|
2020-05-11 12:06:07 +02:00
|
|
|
// this function adds additional http headers and hostname to http.request.
|
2018-06-11 11:36:03 +02:00
|
|
|
func (b *BackendConfig) addHeadersAndHost(req *http.Request) *http.Request {
|
|
|
|
if b.Options.Hostname != "" {
|
|
|
|
req.Host = b.Options.Hostname
|
|
|
|
}
|
|
|
|
|
|
|
|
for k, v := range b.Options.Headers {
|
|
|
|
req.Header.Set(k, v)
|
2017-03-09 16:27:31 +01:00
|
|
|
}
|
2018-06-11 11:36:03 +02:00
|
|
|
return req
|
|
|
|
}
|
|
|
|
|
2020-05-11 12:06:07 +02:00
|
|
|
// HealthCheck struct.
|
2018-06-11 11:36:03 +02:00
|
|
|
type HealthCheck struct {
|
|
|
|
Backends map[string]*BackendConfig
|
|
|
|
metrics metricsRegistry
|
|
|
|
cancel context.CancelFunc
|
2016-11-26 19:48:49 +01:00
|
|
|
}
|
|
|
|
|
2020-05-11 12:06:07 +02:00
|
|
|
// SetBackendsConfiguration set backends configuration.
|
2018-06-11 11:36:03 +02:00
|
|
|
func (hc *HealthCheck) SetBackendsConfiguration(parentCtx context.Context, backends map[string]*BackendConfig) {
|
2016-11-26 19:48:49 +01:00
|
|
|
hc.Backends = backends
|
2016-11-30 22:49:57 +01:00
|
|
|
if hc.cancel != nil {
|
|
|
|
hc.cancel()
|
|
|
|
}
|
2017-01-31 22:55:02 +01:00
|
|
|
ctx, cancel := context.WithCancel(parentCtx)
|
2016-11-30 22:49:57 +01:00
|
|
|
hc.cancel = cancel
|
2016-11-26 19:48:49 +01:00
|
|
|
|
2018-01-15 17:27:37 +01:00
|
|
|
for _, backend := range backends {
|
2017-03-09 16:27:31 +01:00
|
|
|
currentBackend := backend
|
2017-01-31 22:55:02 +01:00
|
|
|
safe.Go(func() {
|
2018-01-03 12:32:03 +01:00
|
|
|
hc.execute(ctx, currentBackend)
|
2017-01-31 22:55:02 +01:00
|
|
|
})
|
2016-11-30 22:49:57 +01:00
|
|
|
}
|
2016-11-26 19:48:49 +01:00
|
|
|
}
|
|
|
|
|
2018-06-11 11:36:03 +02:00
|
|
|
func (hc *HealthCheck) execute(ctx context.Context, backend *BackendConfig) {
|
2019-09-13 19:28:04 +02:00
|
|
|
logger := log.FromContext(ctx)
|
|
|
|
logger.Debugf("Initial health check for backend: %q", backend.name)
|
|
|
|
|
|
|
|
hc.checkBackend(ctx, backend)
|
2017-03-09 16:27:31 +01:00
|
|
|
ticker := time.NewTicker(backend.Interval)
|
|
|
|
defer ticker.Stop()
|
2017-04-11 17:10:46 +02:00
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
2019-09-13 19:28:04 +02:00
|
|
|
logger.Debugf("Stopping current health check goroutines of backend: %s", backend.name)
|
2017-04-11 17:10:46 +02:00
|
|
|
return
|
|
|
|
case <-ticker.C:
|
2019-09-13 19:28:04 +02:00
|
|
|
logger.Debugf("Refreshing health check for backend: %s", backend.name)
|
|
|
|
hc.checkBackend(ctx, backend)
|
2017-03-09 16:27:31 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-09-13 19:28:04 +02:00
|
|
|
func (hc *HealthCheck) checkBackend(ctx context.Context, backend *BackendConfig) {
|
|
|
|
logger := log.FromContext(ctx)
|
|
|
|
|
2018-01-03 12:32:03 +01:00
|
|
|
enabledURLs := backend.LB.Servers()
|
2019-08-07 08:14:04 -07:00
|
|
|
var newDisabledURLs []backendURL
|
2019-11-29 12:40:05 +01:00
|
|
|
for _, disabledURL := range backend.disabledURLs {
|
|
|
|
if err := checkHealth(disabledURL.url, backend); err == nil {
|
2019-09-13 19:28:04 +02:00
|
|
|
logger.Warnf("Health check up: Returning to server list. Backend: %q URL: %q Weight: %d",
|
2019-11-29 12:40:05 +01:00
|
|
|
backend.name, disabledURL.url.String(), disabledURL.weight)
|
|
|
|
if err = backend.LB.UpsertServer(disabledURL.url, roundrobin.Weight(disabledURL.weight)); err != nil {
|
2019-09-13 19:28:04 +02:00
|
|
|
logger.Error(err)
|
2018-08-06 20:00:03 +02:00
|
|
|
}
|
2017-04-11 17:10:46 +02:00
|
|
|
} else {
|
2019-11-29 12:40:05 +01:00
|
|
|
logger.Warnf("Health check still failing. Backend: %q URL: %q Reason: %s", backend.name, disabledURL.url.String(), err)
|
|
|
|
newDisabledURLs = append(newDisabledURLs, disabledURL)
|
2017-04-11 17:10:46 +02:00
|
|
|
}
|
|
|
|
}
|
2018-01-03 12:32:03 +01:00
|
|
|
backend.disabledURLs = newDisabledURLs
|
2017-03-09 16:27:31 +01:00
|
|
|
|
2018-08-06 20:00:03 +02:00
|
|
|
for _, enableURL := range enabledURLs {
|
|
|
|
if err := checkHealth(enableURL, backend); err != nil {
|
2019-08-07 08:14:04 -07:00
|
|
|
weight := 1
|
|
|
|
rr, ok := backend.LB.(*roundrobin.RoundRobin)
|
|
|
|
if ok {
|
|
|
|
var gotWeight bool
|
|
|
|
weight, gotWeight = rr.ServerWeight(enableURL)
|
|
|
|
if !gotWeight {
|
|
|
|
weight = 1
|
|
|
|
}
|
|
|
|
}
|
2019-11-29 12:40:05 +01:00
|
|
|
logger.Warnf("Health check failed, removing from server list. Backend: %q URL: %q Weight: %d Reason: %s", backend.name, enableURL.String(), weight, err)
|
2018-08-06 20:00:03 +02:00
|
|
|
if err := backend.LB.RemoveServer(enableURL); err != nil {
|
2019-09-13 19:28:04 +02:00
|
|
|
logger.Error(err)
|
2018-08-06 20:00:03 +02:00
|
|
|
}
|
2019-08-07 08:14:04 -07:00
|
|
|
backend.disabledURLs = append(backend.disabledURLs, backendURL{enableURL, weight})
|
2017-04-11 17:10:46 +02:00
|
|
|
}
|
|
|
|
}
|
2017-03-09 16:27:31 +01:00
|
|
|
}
|
|
|
|
|
2018-06-11 11:36:03 +02:00
|
|
|
// GetHealthCheck returns the health check which is guaranteed to be a singleton.
|
2018-11-14 10:18:03 +01:00
|
|
|
func GetHealthCheck() *HealthCheck {
|
2018-06-11 11:36:03 +02:00
|
|
|
once.Do(func() {
|
2018-11-14 10:18:03 +01:00
|
|
|
singleton = newHealthCheck()
|
2018-06-11 11:36:03 +02:00
|
|
|
})
|
|
|
|
return singleton
|
2017-05-10 14:28:57 -04:00
|
|
|
}
|
|
|
|
|
2018-11-14 10:18:03 +01:00
|
|
|
func newHealthCheck() *HealthCheck {
|
2018-06-11 11:36:03 +02:00
|
|
|
return &HealthCheck{
|
|
|
|
Backends: make(map[string]*BackendConfig),
|
2018-04-16 11:40:03 +02:00
|
|
|
}
|
2018-06-11 11:36:03 +02:00
|
|
|
}
|
2018-05-22 09:22:03 +02:00
|
|
|
|
2020-05-11 12:06:07 +02:00
|
|
|
// NewBackendConfig Instantiate a new BackendConfig.
|
2018-06-11 11:36:03 +02:00
|
|
|
func NewBackendConfig(options Options, backendName string) *BackendConfig {
|
|
|
|
return &BackendConfig{
|
2018-09-27 13:16:03 -05:00
|
|
|
Options: options,
|
|
|
|
name: backendName,
|
2018-04-16 11:40:03 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-01-03 12:32:03 +01:00
|
|
|
// checkHealth returns a nil error in case it was successful and otherwise
|
|
|
|
// a non-nil error with a meaningful description why the health check failed.
|
2018-06-11 11:36:03 +02:00
|
|
|
func checkHealth(serverURL *url.URL, backend *BackendConfig) error {
|
2017-05-10 14:28:57 -04:00
|
|
|
req, err := backend.newRequest(serverURL)
|
|
|
|
if err != nil {
|
2020-05-11 12:06:07 +02:00
|
|
|
return fmt.Errorf("failed to create HTTP request: %w", err)
|
2017-05-10 14:28:57 -04:00
|
|
|
}
|
2018-05-22 09:22:03 +02:00
|
|
|
|
2018-04-16 11:40:03 +02:00
|
|
|
req = backend.addHeadersAndHost(req)
|
2017-05-10 14:28:57 -04:00
|
|
|
|
2018-05-22 09:22:03 +02:00
|
|
|
client := http.Client{
|
2018-09-27 13:16:03 -05:00
|
|
|
Timeout: backend.Options.Timeout,
|
2018-05-22 09:22:03 +02:00
|
|
|
Transport: backend.Options.Transport,
|
2016-11-26 19:48:49 +01:00
|
|
|
}
|
2018-01-03 12:32:03 +01:00
|
|
|
|
2020-02-26 17:28:04 +01:00
|
|
|
if !backend.FollowRedirects {
|
|
|
|
client.CheckRedirect = func(req *http.Request, via []*http.Request) error {
|
|
|
|
return http.ErrUseLastResponse
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-05-22 09:22:03 +02:00
|
|
|
resp, err := client.Do(req)
|
|
|
|
if err != nil {
|
2020-05-11 12:06:07 +02:00
|
|
|
return fmt.Errorf("HTTP request failed: %w", err)
|
2018-01-03 12:32:03 +01:00
|
|
|
}
|
2018-05-22 09:22:03 +02:00
|
|
|
|
|
|
|
defer resp.Body.Close()
|
|
|
|
|
2018-05-23 17:06:04 +02:00
|
|
|
if resp.StatusCode < http.StatusOK || resp.StatusCode >= http.StatusBadRequest {
|
|
|
|
return fmt.Errorf("received error status code: %v", resp.StatusCode)
|
2018-05-22 09:22:03 +02:00
|
|
|
}
|
|
|
|
|
2018-01-03 12:32:03 +01:00
|
|
|
return nil
|
2016-11-26 19:48:49 +01:00
|
|
|
}
|
2019-05-16 10:58:06 +02:00
|
|
|
|
2020-05-11 12:06:07 +02:00
|
|
|
// NewLBStatusUpdater returns a new LbStatusUpdater.
|
2019-09-13 19:28:04 +02:00
|
|
|
func NewLBStatusUpdater(bh BalancerHandler, info *runtime.ServiceInfo) *LbStatusUpdater {
|
2019-05-16 10:58:06 +02:00
|
|
|
return &LbStatusUpdater{
|
|
|
|
BalancerHandler: bh,
|
2019-09-13 19:28:04 +02:00
|
|
|
serviceInfo: info,
|
2019-05-16 10:58:06 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// LbStatusUpdater wraps a BalancerHandler and a ServiceInfo,
|
|
|
|
// so it can keep track of the status of a server in the ServiceInfo.
|
|
|
|
type LbStatusUpdater struct {
|
|
|
|
BalancerHandler
|
2019-07-15 17:04:04 +02:00
|
|
|
serviceInfo *runtime.ServiceInfo // can be nil
|
2019-05-16 10:58:06 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
// RemoveServer removes the given server from the BalancerHandler,
|
|
|
|
// and updates the status of the server to "DOWN".
|
|
|
|
func (lb *LbStatusUpdater) RemoveServer(u *url.URL) error {
|
|
|
|
err := lb.BalancerHandler.RemoveServer(u)
|
|
|
|
if err == nil && lb.serviceInfo != nil {
|
2019-07-15 17:04:04 +02:00
|
|
|
lb.serviceInfo.UpdateServerStatus(u.String(), serverDown)
|
2019-05-16 10:58:06 +02:00
|
|
|
}
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
// UpsertServer adds the given server to the BalancerHandler,
|
|
|
|
// and updates the status of the server to "UP".
|
|
|
|
func (lb *LbStatusUpdater) UpsertServer(u *url.URL, options ...roundrobin.ServerOption) error {
|
|
|
|
err := lb.BalancerHandler.UpsertServer(u, options...)
|
|
|
|
if err == nil && lb.serviceInfo != nil {
|
2019-07-15 17:04:04 +02:00
|
|
|
lb.serviceInfo.UpdateServerStatus(u.String(), serverUp)
|
2019-05-16 10:58:06 +02:00
|
|
|
}
|
|
|
|
return err
|
|
|
|
}
|
2019-11-29 12:40:05 +01:00
|
|
|
|
|
|
|
// Balancers is a list of Balancers(s) that implements the Balancer interface.
|
|
|
|
type Balancers []Balancer
|
|
|
|
|
2020-05-11 12:06:07 +02:00
|
|
|
// Servers returns the servers url from all the BalancerHandler.
|
2019-11-29 12:40:05 +01:00
|
|
|
func (b Balancers) Servers() []*url.URL {
|
|
|
|
var servers []*url.URL
|
|
|
|
for _, lb := range b {
|
|
|
|
servers = append(servers, lb.Servers()...)
|
|
|
|
}
|
|
|
|
|
|
|
|
return servers
|
|
|
|
}
|
|
|
|
|
|
|
|
// RemoveServer removes the given server from all the BalancerHandler,
|
|
|
|
// and updates the status of the server to "DOWN".
|
|
|
|
func (b Balancers) RemoveServer(u *url.URL) error {
|
|
|
|
for _, lb := range b {
|
|
|
|
if err := lb.RemoveServer(u); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// UpsertServer adds the given server to all the BalancerHandler,
|
|
|
|
// and updates the status of the server to "UP".
|
|
|
|
func (b Balancers) UpsertServer(u *url.URL, options ...roundrobin.ServerOption) error {
|
|
|
|
for _, lb := range b {
|
|
|
|
if err := lb.UpsertServer(u, options...); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|