Skip to content

Commit

Permalink
Implement SRV and A/AAA upstream sources
Browse files Browse the repository at this point in the history
Also get upstreams at every retry loop iteration instead of just once
before the loop. See #4442.
  • Loading branch information
mholt committed Dec 8, 2021
1 parent 9adeea5 commit 5e872e7
Show file tree
Hide file tree
Showing 3 changed files with 272 additions and 18 deletions.
9 changes: 9 additions & 0 deletions modules/caddyhttp/reverseproxy/hosts.go
Original file line number Diff line number Diff line change
Expand Up @@ -143,6 +143,15 @@ func (u *Upstream) fillDialInfo(r *http.Request) (DialInfo, error) {
}, nil
}

func (u *Upstream) setHost() {
host := new(Host)
existingHost, loaded := hosts.LoadOrStore(u.String(), host)
if loaded {
host = existingHost.(*Host)
}
u.Host = host
}

// Host is the basic, in-memory representation
// of the state of a remote host.
type Host struct {
Expand Down
38 changes: 20 additions & 18 deletions modules/caddyhttp/reverseproxy/reverseproxy.go
Original file line number Diff line number Diff line change
Expand Up @@ -256,12 +256,7 @@ func (h *Handler) Provision(ctx caddy.Context) error {
// set up upstreams
for _, upstream := range h.Upstreams {
// create or get the host representation for this upstream
host := new(Host)
existingHost, loaded := hosts.LoadOrStore(upstream.String(), host)
if loaded {
host = existingHost.(*Host)
}
upstream.Host = host
upstream.setHost()

// give it the circuit breaker, if any
upstream.cb = h.CB
Expand Down Expand Up @@ -417,19 +412,19 @@ func (h *Handler) ServeHTTP(w http.ResponseWriter, r *http.Request, next caddyht
repl.Set("http.reverse_proxy.duration", time.Since(start))
}()

// get the list of upstreams
upstreams := h.Upstreams
if h.DynamicUpstreams != nil {
dUpstreams, err := h.DynamicUpstreams.GetUpstreams(r)
if err != nil {
h.logger.Error("failed getting dynamic upstreams; falling back to static upstreams", zap.Error(err))
} else {
upstreams = dUpstreams
}
}

var proxyErr error
for {
// get the updated list of upstreams
upstreams := h.Upstreams
if h.DynamicUpstreams != nil {
dUpstreams, err := h.DynamicUpstreams.GetUpstreams(r)
if err != nil {
h.logger.Error("failed getting dynamic upstreams; falling back to static upstreams", zap.Error(err))
} else {
upstreams = dUpstreams
}
}

// choose an available upstream
upstream := h.LoadBalancing.SelectionPolicy.Select(upstreams, r, w)
if upstream == nil {
Expand Down Expand Up @@ -932,7 +927,14 @@ type Selector interface {

// UpstreamSource gets the list of upstreams that can be used when
// proxying a request. Returned upstreams will be load balanced and
// health-checked.
// health-checked. This should be a very fast function -- instant
// if possible -- and the return value must be as stable as possible.
// In other words, the list of upstreams should ideally not change much
// across successive calls. If the list of upstreams changes or the
// ordering is not stable, load balancing will suffer. This function
// may be called during each retry, multiple times per request, and as
// such, needs to be instantaneous. The returned slice will not be
// modified.
type UpstreamSource interface {
GetUpstreams(*http.Request) ([]*Upstream, error)
}
Expand Down
243 changes: 243 additions & 0 deletions modules/caddyhttp/reverseproxy/upstreams.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,243 @@
package reverseproxy

import (
"fmt"
"net"
"net/http"
"strconv"
"sync"
"time"

"github.com/caddyserver/caddy/v2"
)

func init() {
caddy.RegisterModule(SRVUpstreams{})
caddy.RegisterModule(AUpstreams{})
}

// SRVUpstreams provides upstreams from SRV lookups.
// The lookup DNS name can be configured either by
// its individual parts (that is, specifying the
// service, protocol, and name separately) to form
// the standard "_service._proto.name" domain, or
// the domain can be specified directly in name by
// leaving service and proto empty. See RFC 2782.
//
// Lookups are cached and refreshed at the configured
// refresh interval.
//
// Returned upstreams are sorted by priority and weight.
type SRVUpstreams struct {
// The interval at which to refresh the SRV lookup.
// Results are cached between lookups. Default: 1m
Refresh time.Duration `json:"refresh,omitempty"`

// The service label.
Service string `json:"service,omitempty"`

// The protocol label; either tcp or udp.
Proto string `json:"proto,omitempty"`

// The name label; or, if service and proto are
// empty, the entire domain name to look up.
Name string `json:"name,omitempty"`
}

// CaddyModule returns the Caddy module information.
func (SRVUpstreams) CaddyModule() caddy.ModuleInfo {
return caddy.ModuleInfo{
ID: "http.reverse_proxy.upstreams.srv",
New: func() caddy.Module { return new(SRVUpstreams) },
}
}

// String returns the RFC 2782 representation of the SRV domain.
func (su SRVUpstreams) String() string {
return fmt.Sprintf("_%s._%s.%s", su.Service, su.Proto, su.Name)
}

func (su *SRVUpstreams) Provision(_ caddy.Context) error {
if su.Proto != "tcp" && su.Proto != "udp" {
return fmt.Errorf("invalid proto '%s'", su.Proto)
}
if su.Refresh == 0 {
su.Refresh = time.Minute
}
return nil
}

func (su SRVUpstreams) GetUpstreams(r *http.Request) ([]*Upstream, error) {
suStr := su.String()

// first, use a cheap read-lock to return a cached result quickly
srvsMu.RLock()
cached := srvs[suStr]
srvsMu.RUnlock()
if cached.fresh() {
return cached.upstreams, nil
}

// otherwise, obtain a write-lock to update the cached value
srvsMu.Lock()
defer srvsMu.Unlock()

// check to see if it's still stale, since we're now in a different
// lock from when we first checked freshness; another goroutine might
// have refreshed it in the meantime before we re-obtained our lock
cached = srvs[suStr]
if cached.fresh() {
return cached.upstreams, nil
}

// prepare parameters and perform the SRV lookup
repl := r.Context().Value(caddy.ReplacerCtxKey).(*caddy.Replacer)
service := repl.ReplaceAll(su.Service, "")
proto := repl.ReplaceAll(su.Proto, "")
name := repl.ReplaceAll(su.Name, "")

_, records, err := net.DefaultResolver.LookupSRV(r.Context(), service, proto, name)
if err != nil {
return nil, err
}

upstreams := make([]*Upstream, len(records))
for i, rec := range records {
upstreams[i] = &Upstream{
Dial: net.JoinHostPort(rec.Target, strconv.Itoa(int(rec.Port))),
}
upstreams[i].setHost()
}

// TODO: expire these somehow
srvs[suStr] = srvLookup{
srvUpstreams: su,
freshness: time.Now(),
upstreams: upstreams,
}

return upstreams, nil
}

type srvLookup struct {
srvUpstreams SRVUpstreams
freshness time.Time
upstreams []*Upstream
}

func (sl srvLookup) fresh() bool {
return time.Since(sl.freshness) < sl.srvUpstreams.Refresh
}

var (
srvs = make(map[string]srvLookup)
srvsMu sync.RWMutex
)

// AUpstreams provides upstreams from A/AAAA lookups.
// Results are cached and refreshed at the configured
// refresh interval.
type AUpstreams struct {
// The domain name to look up.
Name string `json:"name,omitempty"`

// The port to use with the upstreams. Default: 80
Port string `json:"port,omitempty"`

// The interval at which to refresh the SRV lookup.
// Results are cached between lookups. Default: 1m
Refresh time.Duration `json:"refresh,omitempty"`
}

// CaddyModule returns the Caddy module information.
func (AUpstreams) CaddyModule() caddy.ModuleInfo {
return caddy.ModuleInfo{
ID: "http.reverse_proxy.upstreams.a",
New: func() caddy.Module { return new(AUpstreams) },
}
}

func (au AUpstreams) String() string { return au.Name }

func (au *AUpstreams) Provision(_ caddy.Context) error {
if au.Refresh == 0 {
au.Refresh = time.Minute
}
if au.Port == "" {
au.Port = "80"
}
return nil
}

func (au AUpstreams) GetUpstreams(r *http.Request) ([]*Upstream, error) {
auStr := au.String()

// first, use a cheap read-lock to return a cached result quickly
aAaaaMu.RLock()
cached := aAaaa[auStr]
aAaaaMu.RUnlock()
if cached.fresh() {
return cached.upstreams, nil
}

// otherwise, obtain a write-lock to update the cached value
aAaaaMu.Lock()
defer aAaaaMu.Unlock()

// check to see if it's still stale, since we're now in a different
// lock from when we first checked freshness; another goroutine might
// have refreshed it in the meantime before we re-obtained our lock
cached = aAaaa[auStr]
if cached.fresh() {
return cached.upstreams, nil
}

repl := r.Context().Value(caddy.ReplacerCtxKey).(*caddy.Replacer)
name := repl.ReplaceAll(au.Name, "")
port := repl.ReplaceAll(au.Port, "")

ips, err := net.DefaultResolver.LookupIPAddr(r.Context(), name)
if err != nil {
return nil, err
}

upstreams := make([]*Upstream, len(ips))
for i, ip := range ips {
upstreams[i] = &Upstream{
Dial: net.JoinHostPort(ip.String(), port),
}
upstreams[i].setHost()
}

// TODO: expire these somehow
aAaaa[auStr] = aLookup{
aUpstreams: au,
freshness: time.Now(),
upstreams: upstreams,
}

return upstreams, nil
}

type aLookup struct {
aUpstreams AUpstreams
freshness time.Time
upstreams []*Upstream
}

func (al aLookup) fresh() bool {
return time.Since(al.freshness) < al.aUpstreams.Refresh
}

var (
aAaaa = make(map[string]aLookup)
aAaaaMu sync.RWMutex
)

// Interface guards
var (
_ caddy.Provisioner = (*SRVUpstreams)(nil)
_ UpstreamSource = (*SRVUpstreams)(nil)
_ caddy.Provisioner = (*AUpstreams)(nil)
_ UpstreamSource = (*AUpstreams)(nil)
)

0 comments on commit 5e872e7

Please sign in to comment.