-
Notifications
You must be signed in to change notification settings - Fork 65
/
failrotate.go
99 lines (87 loc) · 2.95 KB
/
failrotate.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
package rdns
import (
"sync"
"github.com/miekg/dns"
"github.com/sirupsen/logrus"
)
// FailRotate is a resolver group that queries the same resolver unless that
// returns a failure in which case the request is retried on the next one for
// up to N times (with N the number of resolvers in the group). If the last
// resolver fails, the first one in the list becomes the active one. This
// group does not fail back automatically.
type FailRotate struct {
id string
resolvers []Resolver
mu sync.RWMutex
active int
metrics *FailRouterMetrics
opt FailRotateOptions
}
// FailRotateOptions contain group-specific options.
type FailRotateOptions struct {
// Determines if a SERVFAIL returned by a resolver should be considered an
// error response and trigger a failover.
ServfailError bool
}
var _ Resolver = &FailRotate{}
// NewFailRotate returns a new instance of a failover resolver group.
func NewFailRotate(id string, opt FailRotateOptions, resolvers ...Resolver) *FailRotate {
return &FailRotate{
id: id,
resolvers: resolvers,
opt: opt,
metrics: NewFailRouterMetrics(id, len(resolvers)),
}
}
// Resolve a DNS query using a failover resolver group that switches to the next
// resolver on error.
func (r *FailRotate) Resolve(q *dns.Msg, ci ClientInfo) (*dns.Msg, error) {
log := logger(r.id, q, ci)
var (
err error
a *dns.Msg
)
for i := 0; i < len(r.resolvers); i++ {
resolver, active := r.current()
log.WithField("resolver", resolver.String()).Trace("forwarding query to resolver")
r.metrics.route.Add(resolver.String(), 1)
a, err = resolver.Resolve(q, ci)
if err == nil && r.isSuccessResponse(a) { // Return immediately if successful
return a, err
}
log.WithField("resolver", resolver.String()).WithError(err).Debug("resolver returned failure")
r.metrics.failure.Add(resolver.String(), 1)
r.errorFrom(active)
}
return a, err
}
func (r *FailRotate) String() string {
return r.id
}
// Thread-safe method to return the currently active resolver.
func (r *FailRotate) current() (Resolver, int) {
r.mu.RLock()
defer r.mu.RUnlock()
return r.resolvers[r.active], r.active
}
// Fail over to the next available resolver after receiving an error from i (the active). We
// need i to know which store returned the error as there could be failures from concurrent
// requests. Another request could have initiated the failover already. So ignore if i is not
// (no longer) the active store.
func (r *FailRotate) errorFrom(i int) {
r.mu.Lock()
defer r.mu.Unlock()
if i != r.active {
return
}
r.metrics.failover.Add(1)
r.active = (r.active + 1) % len(r.resolvers)
Log.WithFields(logrus.Fields{
"id": r.id,
"resolver": r.resolvers[r.active].String(),
}).Debug("failing over to resolver")
}
// Returns true is the response is considered successful given the options.
func (r *FailRotate) isSuccessResponse(a *dns.Msg) bool {
return a == nil || !(r.opt.ServfailError && a.Rcode == dns.RcodeServerFailure)
}