2019-08-26 19:00:04 +02:00
|
|
|
package mirror
|
|
|
|
|
|
|
|
import (
|
2019-08-29 10:28:05 +02:00
|
|
|
"bufio"
|
2020-03-05 18:03:08 +01:00
|
|
|
"bytes"
|
2019-08-26 19:00:04 +02:00
|
|
|
"context"
|
|
|
|
"errors"
|
2020-03-05 18:03:08 +01:00
|
|
|
"fmt"
|
|
|
|
"io"
|
2019-08-29 10:28:05 +02:00
|
|
|
"net"
|
2019-08-26 19:00:04 +02:00
|
|
|
"net/http"
|
|
|
|
"sync"
|
|
|
|
|
2022-11-21 18:36:05 +01:00
|
|
|
"github.com/rs/zerolog/log"
|
2021-06-25 21:08:11 +02:00
|
|
|
"github.com/traefik/traefik/v2/pkg/config/dynamic"
|
|
|
|
"github.com/traefik/traefik/v2/pkg/healthcheck"
|
2020-09-16 15:46:04 +02:00
|
|
|
"github.com/traefik/traefik/v2/pkg/middlewares/accesslog"
|
|
|
|
"github.com/traefik/traefik/v2/pkg/safe"
|
2019-08-26 19:00:04 +02:00
|
|
|
)
|
|
|
|
|
|
|
|
// Mirroring is an http.Handler that can mirror requests.
|
|
|
|
type Mirroring struct {
|
|
|
|
handler http.Handler
|
|
|
|
mirrorHandlers []*mirrorHandler
|
|
|
|
rw http.ResponseWriter
|
|
|
|
routinePool *safe.Pool
|
|
|
|
|
2021-06-25 21:08:11 +02:00
|
|
|
maxBodySize int64
|
|
|
|
wantsHealthCheck bool
|
2020-03-05 18:03:08 +01:00
|
|
|
|
2019-08-26 19:00:04 +02:00
|
|
|
lock sync.RWMutex
|
|
|
|
total uint64
|
|
|
|
}
|
|
|
|
|
|
|
|
// New returns a new instance of *Mirroring.
|
2021-06-25 21:08:11 +02:00
|
|
|
func New(handler http.Handler, pool *safe.Pool, maxBodySize int64, hc *dynamic.HealthCheck) *Mirroring {
|
2019-08-26 19:00:04 +02:00
|
|
|
return &Mirroring{
|
2021-06-25 21:08:11 +02:00
|
|
|
routinePool: pool,
|
|
|
|
handler: handler,
|
|
|
|
rw: blackHoleResponseWriter{},
|
|
|
|
maxBodySize: maxBodySize,
|
|
|
|
wantsHealthCheck: hc != nil,
|
2019-08-26 19:00:04 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (m *Mirroring) inc() uint64 {
|
|
|
|
m.lock.Lock()
|
|
|
|
defer m.lock.Unlock()
|
|
|
|
m.total++
|
|
|
|
return m.total
|
|
|
|
}
|
|
|
|
|
|
|
|
// mirrorHandler is a mirror target together with the bookkeeping used to
// decide how often it receives a copy of the traffic.
type mirrorHandler struct {
	http.Handler
	// percent is the share of requests to mirror; AddMirror only accepts values in [0, 100].
	percent int

	// lock guards count.
	lock sync.RWMutex
	// count is the number of requests this mirror has been selected for so far.
	count uint64
}
|
|
|
|
|
2020-03-05 18:03:08 +01:00
|
|
|
func (m *Mirroring) getActiveMirrors() []http.Handler {
|
|
|
|
total := m.inc()
|
|
|
|
|
|
|
|
var mirrors []http.Handler
|
|
|
|
for _, handler := range m.mirrorHandlers {
|
|
|
|
handler.lock.Lock()
|
|
|
|
if handler.count*100 < total*uint64(handler.percent) {
|
|
|
|
handler.count++
|
|
|
|
handler.lock.Unlock()
|
|
|
|
mirrors = append(mirrors, handler)
|
|
|
|
} else {
|
|
|
|
handler.lock.Unlock()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return mirrors
|
|
|
|
}
|
|
|
|
|
2019-08-26 19:00:04 +02:00
|
|
|
func (m *Mirroring) ServeHTTP(rw http.ResponseWriter, req *http.Request) {
|
2020-03-05 18:03:08 +01:00
|
|
|
mirrors := m.getActiveMirrors()
|
|
|
|
if len(mirrors) == 0 {
|
|
|
|
m.handler.ServeHTTP(rw, req)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2022-11-21 18:36:05 +01:00
|
|
|
logger := log.Ctx(req.Context())
|
2020-03-05 18:03:08 +01:00
|
|
|
rr, bytesRead, err := newReusableRequest(req, m.maxBodySize)
|
2020-11-06 09:26:03 +01:00
|
|
|
if err != nil && !errors.Is(err, errBodyTooLarge) {
|
2022-11-21 18:36:05 +01:00
|
|
|
http.Error(rw, fmt.Sprintf("%s: creating reusable request: %v",
|
|
|
|
http.StatusText(http.StatusInternalServerError), err), http.StatusInternalServerError)
|
2020-03-05 18:03:08 +01:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2020-11-06 09:26:03 +01:00
|
|
|
if errors.Is(err, errBodyTooLarge) {
|
2021-03-04 20:08:03 +01:00
|
|
|
req.Body = io.NopCloser(io.MultiReader(bytes.NewReader(bytesRead), req.Body))
|
2020-03-05 18:03:08 +01:00
|
|
|
m.handler.ServeHTTP(rw, req)
|
2022-11-21 18:36:05 +01:00
|
|
|
logger.Debug().Msg("No mirroring, request body larger than allowed size")
|
2020-03-05 18:03:08 +01:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
m.handler.ServeHTTP(rw, rr.clone(req.Context()))
|
2019-08-26 19:00:04 +02:00
|
|
|
|
|
|
|
select {
|
|
|
|
case <-req.Context().Done():
|
|
|
|
// No mirroring if request has been canceled during main handler ServeHTTP
|
2022-11-21 18:36:05 +01:00
|
|
|
logger.Warn().Msg("No mirroring, request has been canceled during main handler ServeHTTP")
|
2019-08-26 19:00:04 +02:00
|
|
|
return
|
|
|
|
default:
|
|
|
|
}
|
|
|
|
|
|
|
|
m.routinePool.GoCtx(func(_ context.Context) {
|
2020-03-05 18:03:08 +01:00
|
|
|
for _, handler := range mirrors {
|
|
|
|
// prepare request, update body from buffer
|
|
|
|
r := rr.clone(req.Context())
|
|
|
|
|
|
|
|
// In ServeHTTP, we rely on the presence of the accessLog datatable found in the request's context
|
|
|
|
// to know whether we should mutate said datatable (and contribute some fields to the log).
|
|
|
|
// In this instance, we do not want the mirrors mutating (i.e. changing the service name in)
|
|
|
|
// the logs related to the mirrored server.
|
|
|
|
// Especially since it would result in unguarded concurrent reads/writes on the datatable.
|
|
|
|
// Therefore, we reset any potential datatable key in the new context that we pass around.
|
|
|
|
ctx := context.WithValue(r.Context(), accesslog.DataTableKey, nil)
|
|
|
|
|
|
|
|
// When a request served by m.handler is successful, req.Context will be canceled,
|
|
|
|
// which would trigger a cancellation of the ongoing mirrored requests.
|
|
|
|
// Therefore, we give a new, non-cancellable context to each of the mirrored calls,
|
|
|
|
// so they can terminate by themselves.
|
|
|
|
handler.ServeHTTP(m.rw, r.WithContext(contextStopPropagation{ctx}))
|
2019-08-26 19:00:04 +02:00
|
|
|
}
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
// AddMirror adds an httpHandler to mirror to.
|
|
|
|
func (m *Mirroring) AddMirror(handler http.Handler, percent int) error {
|
2019-08-29 10:28:05 +02:00
|
|
|
if percent < 0 || percent > 100 {
|
2019-08-26 19:00:04 +02:00
|
|
|
return errors.New("percent must be between 0 and 100")
|
|
|
|
}
|
|
|
|
m.mirrorHandlers = append(m.mirrorHandlers, &mirrorHandler{Handler: handler, percent: percent})
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-06-25 21:08:11 +02:00
|
|
|
// RegisterStatusUpdater adds fn to the list of hooks that are run when the
|
|
|
|
// status of handler of the Mirroring changes.
|
|
|
|
// Not thread safe.
|
|
|
|
func (m *Mirroring) RegisterStatusUpdater(fn func(up bool)) error {
|
|
|
|
// Since the status propagation is completely transparent through the
|
|
|
|
// mirroring (because of the recursion on the underlying service), we could maybe
|
|
|
|
// skip that below, and even not add HealthCheck as a field of
|
|
|
|
// dynamic.Mirroring. But I think it's easier to understand for the user
|
|
|
|
// if the HealthCheck is required absolutely everywhere in the config.
|
|
|
|
if !m.wantsHealthCheck {
|
|
|
|
return errors.New("healthCheck not enabled in config for this mirroring service")
|
|
|
|
}
|
|
|
|
|
|
|
|
updater, ok := m.handler.(healthcheck.StatusUpdater)
|
|
|
|
if !ok {
|
|
|
|
return fmt.Errorf("service of mirroring %T not a healthcheck.StatusUpdater", m.handler)
|
|
|
|
}
|
|
|
|
|
|
|
|
if err := updater.RegisterStatusUpdater(fn); err != nil {
|
|
|
|
return fmt.Errorf("cannot register service of mirroring as updater: %w", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2020-03-05 18:03:08 +01:00
|
|
|
// blackHoleResponseWriter is a response writer that throws away everything
// it is given.
type blackHoleResponseWriter struct{}

// Flush does nothing.
func (blackHoleResponseWriter) Flush() {}

// Hijack always fails: there is no underlying connection to take over.
func (blackHoleResponseWriter) Hijack() (net.Conn, *bufio.ReadWriter, error) {
	err := errors.New("connection on blackHoleResponseWriter cannot be hijacked")
	return nil, nil, err
}

// Header returns a fresh, empty header map on every call, so anything set on
// it is dropped.
func (blackHoleResponseWriter) Header() http.Header {
	return make(http.Header)
}

// Write reports data as entirely written without keeping any of it.
func (blackHoleResponseWriter) Write(data []byte) (int, error) {
	return len(data), nil
}

// WriteHeader ignores the status code.
func (blackHoleResponseWriter) WriteHeader(int) {}
|
2019-08-26 19:00:04 +02:00
|
|
|
|
|
|
|
// contextStopPropagation wraps a context so that its values stay reachable
// while its cancellation is hidden: the wrapper is never reported as done.
// Deadline is still the one of the wrapped context.
type contextStopPropagation struct {
	context.Context
}

// Done returns nil, which is how a context signals that it can never be
// canceled. Receiving from a nil channel blocks forever, so callers selecting
// on Done never see it fire, and contexts derived from this one do not need a
// goroutine to watch for a cancellation that cannot happen.
func (c contextStopPropagation) Done() <-chan struct{} {
	return nil
}

// Err always returns nil: since Done is never closed, reporting the error of
// the wrapped context would break the Context contract (Err is nil as long as
// Done is not closed) and leak the cancellation that this type hides.
func (c contextStopPropagation) Err() error {
	return nil
}
|
2020-03-05 18:03:08 +01:00
|
|
|
|
|
|
|
// reusableRequest keeps the body of the given request in memory,
// so that the request can be fully cloned, body included, by each mirror.
type reusableRequest struct {
	req  *http.Request
	body []byte
}

// errBodyTooLarge is returned by newReusableRequest when the request body is
// larger than the allowed size.
var errBodyTooLarge = errors.New("request body too large")

// newReusableRequest reads the body of req into memory and returns a
// reusableRequest from which the request can be cloned repeatedly.
//
// A negative maxBodySize means that the body size is unbounded. Otherwise, a
// body larger than maxBodySize yields errBodyTooLarge, in which case
// newReusableRequest also returns the bytes that were already consumed from
// the request's body, so that the caller can put them back in front of the
// remaining body. Any other error comes from reading the body, or from req
// being nil.
func newReusableRequest(req *http.Request, maxBodySize int64) (*reusableRequest, []byte, error) {
	if req == nil {
		return nil, nil, errors.New("nil input request")
	}
	if req.Body == nil || req.ContentLength == 0 {
		return &reusableRequest{req: req}, nil, nil
	}

	// Unbounded body size. The largest int64 is handled here as well: no body
	// can exceed it, and maxBodySize+1 below would overflow.
	const maxInt64 = 1<<63 - 1
	if maxBodySize < 0 || maxBodySize == maxInt64 {
		body, err := io.ReadAll(req.Body)
		if err != nil {
			return nil, nil, err
		}
		return &reusableRequest{req: req, body: body}, nil, nil
	}

	// We purposefully allow reading one byte _more_ than maxBodySize to detect
	// whether the request body is larger than what we allow for the mirrors.
	// Reading through a LimitReader lets the buffer grow with the actual body
	// instead of allocating maxBodySize+1 bytes for every request, and an empty
	// body of unknown length simply yields an empty buffer rather than an error.
	body, err := io.ReadAll(io.LimitReader(req.Body, maxBodySize+1))
	if err != nil {
		return nil, nil, err
	}

	// More than maxBodySize bytes were available: hand back what was consumed.
	if int64(len(body)) > maxBodySize {
		return nil, body, errBodyTooLarge
	}

	// The whole body fits, which permits sending it to all the mirrors later.
	return &reusableRequest{req: req, body: body}, nil, nil
}

// clone returns a copy of the original request bound to ctx. When a body was
// buffered, the copy gets its own reader over the buffered bytes.
func (rr reusableRequest) clone(ctx context.Context) *http.Request {
	req := rr.req.Clone(ctx)

	if rr.body != nil {
		req.Body = io.NopCloser(bytes.NewReader(rr.body))
	}

	return req
}
|