mirror of
https://github.com/etcd-io/etcd.git
synced 2024-09-27 06:25:44 +00:00

It identifies request timeout errors that are possibly caused by a lost connection, and prints a better log message so that users can understand the cause. It handles two cases: 1. the leader cannot connect to the majority of the cluster. 2. the connection between follower and leader is down for a while, and it loses proposals. log format: ``` 20:04:19 etcd3 | 2015-08-25 20:04:19.368126 E | etcdhttp: etcdserver: request timed out, possibly due to connection lost 20:04:19 etcd3 | 2015-08-25 20:04:19.368227 E | etcdhttp: etcdserver: request timed out, possibly due to connection lost ```
78 lines
1.8 KiB
Go
78 lines
1.8 KiB
Go
// Copyright 2015 CoreOS, Inc.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package rafthttp
|
|
|
|
import (
|
|
"fmt"
|
|
"sync"
|
|
"time"
|
|
|
|
"github.com/coreos/etcd/pkg/types"
|
|
)
|
|
|
|
// failureType identifies a category of peer failure. It is comparable and is
// used as the key of peerStatus.failureMap. Both fields are interpolated into
// the failure log line: "failed to <action> <peer id> on <source> (<reason>)".
type failureType struct {
	// source is where the failure was observed; action is what was being
	// attempted when it happened.
	source, action string
}
|
|
|
|
type peerStatus struct {
|
|
id types.ID
|
|
mu sync.Mutex // protect variables below
|
|
active bool
|
|
failureMap map[failureType]string
|
|
activeSince time.Time
|
|
}
|
|
|
|
func newPeerStatus(id types.ID) *peerStatus {
|
|
return &peerStatus{
|
|
id: id,
|
|
failureMap: make(map[failureType]string),
|
|
}
|
|
}
|
|
|
|
func (s *peerStatus) activate() {
|
|
s.mu.Lock()
|
|
defer s.mu.Unlock()
|
|
if !s.active {
|
|
plog.Infof("the connection with %s became active", s.id)
|
|
s.active = true
|
|
s.activeSince = time.Now()
|
|
s.failureMap = make(map[failureType]string)
|
|
}
|
|
}
|
|
|
|
func (s *peerStatus) deactivate(failure failureType, reason string) {
|
|
s.mu.Lock()
|
|
defer s.mu.Unlock()
|
|
if s.active {
|
|
plog.Infof("the connection with %s became inactive", s.id)
|
|
s.active = false
|
|
s.activeSince = time.Time{}
|
|
}
|
|
logline := fmt.Sprintf("failed to %s %s on %s (%s)", failure.action, s.id, failure.source, reason)
|
|
if r, ok := s.failureMap[failure]; ok && r == reason {
|
|
plog.Debugf(logline)
|
|
return
|
|
}
|
|
s.failureMap[failure] = reason
|
|
plog.Errorf(logline)
|
|
}
|
|
|
|
func (s *peerStatus) isActive() bool {
|
|
s.mu.Lock()
|
|
defer s.mu.Unlock()
|
|
return s.active
|
|
}
|