mirror of
https://github.com/etcd-io/etcd.git
synced 2024-09-27 06:25:44 +00:00
clientv3/balancer: mark partitioned member as unhealthy
Previously, when the server returned an error, the retry wrapper did nothing and passively waited for the balancer to gray-list the isolated endpoint. This is problematic when multiple endpoints are passed and a network partition happens. This patch adds an 'endpointError' method to the 'balancer' interface to actively (possibly even before the health-check API gets called) handle RPC errors and gray-list endpoints for the time being, thus speeding up the endpoint switch. This is safe in the single-endpoint case, because the balancer will retry no matter what in that case. Signed-off-by: Gyu-Ho Lee <gyuhox@gmail.com>
This commit is contained in:
parent
1704443c6d
commit
fbed568b6a
@ -44,6 +44,8 @@ type balancer interface {
|
||||
endpoints() []string
|
||||
// pinned returns the current pinned endpoint.
|
||||
pinned() string
|
||||
// endpointError handles error from server-side.
|
||||
endpointError(addr string, err error)
|
||||
|
||||
// up is Up but includes whether the balancer will use the connection.
|
||||
up(addr grpc.Address) (func(error), bool)
|
||||
@ -150,6 +152,8 @@ func (b *simpleBalancer) pinned() string {
|
||||
return b.pinAddr
|
||||
}
|
||||
|
||||
// endpointError is a no-op on simpleBalancer: both addr and err are ignored
// and no balancer state is touched.
func (b *simpleBalancer) endpointError(addr string, err error) {
	// Intentionally empty: nothing is recorded for addr or err here.
}
|
||||
|
||||
func getHost2ep(eps []string) map[string]string {
|
||||
hm := make(map[string]string, len(eps))
|
||||
for i := range eps {
|
||||
|
@ -177,6 +177,15 @@ func (hb *healthBalancer) liveAddrs() []grpc.Address {
|
||||
return addrs
|
||||
}
|
||||
|
||||
// endpointError marks addr as unhealthy by storing the current time under
// hb.unhealthy[addr] while holding hb.mu. When the logger is enabled at
// verbosity 4, it also logs addr together with err.
func (hb *healthBalancer) endpointError(addr string, err error) {
|
||||
hb.mu.Lock()
|
||||
// The map write and its timestamp are both taken inside the critical section.
hb.unhealthy[addr] = time.Now()
|
||||
hb.mu.Unlock()
|
||||
// Logging happens only after hb.mu has been released.
if logger.V(4) {
|
||||
logger.Infof("clientv3/health-balancer: marking %s as unhealthy (%v)", addr, err)
|
||||
}
|
||||
}
|
||||
|
||||
func (hb *healthBalancer) mayPin(addr grpc.Address) bool {
|
||||
hb.mu.RLock()
|
||||
skip := len(hb.addrs) == 1 || len(hb.unhealthy) == 0
|
||||
|
@ -66,6 +66,8 @@ func (c *Client) newRetryWrapper(isStop retryStopErrFunc) retryRpcFunc {
|
||||
if logger.V(4) {
|
||||
logger.Infof("clientv3/retry: error %v on pinned endpoint %s", err, pinned)
|
||||
}
|
||||
// mark this before endpoint switch is triggered
|
||||
c.balancer.endpointError(pinned, err)
|
||||
notify := c.balancer.ConnectNotify()
|
||||
if s, ok := status.FromError(err); ok && s.Code() == codes.Unavailable {
|
||||
c.balancer.next()
|
||||
|
Loading…
x
Reference in New Issue
Block a user