mirror of
https://github.com/etcd-io/etcd.git
synced 2024-09-27 06:25:44 +00:00
Merge pull request #16691 from serathius/inject-sleep
Inject sleep during etcd bootstrap to reproduce etcd-io#16666
This commit is contained in:
commit
f198b417c6
@ -17,6 +17,7 @@ package e2e
|
|||||||
import (
|
import (
|
||||||
"bytes"
|
"bytes"
|
||||||
"context"
|
"context"
|
||||||
|
"errors"
|
||||||
"fmt"
|
"fmt"
|
||||||
"io"
|
"io"
|
||||||
"net/http"
|
"net/http"
|
||||||
@ -338,7 +339,15 @@ type BinaryFailpoints struct {
|
|||||||
availableCache map[string]struct{}
|
availableCache map[string]struct{}
|
||||||
}
|
}
|
||||||
|
|
||||||
func (f *BinaryFailpoints) Setup(ctx context.Context, failpoint, payload string) error {
|
func (f *BinaryFailpoints) SetupEnv(failpoint, payload string) error {
|
||||||
|
if f.member.IsRunning() {
|
||||||
|
return errors.New("cannot setup environment variable while process is running")
|
||||||
|
}
|
||||||
|
f.member.Config().EnvVars["GOFAIL_FAILPOINTS"] = fmt.Sprintf("%s=%s", failpoint, payload)
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
|
||||||
|
func (f *BinaryFailpoints) SetupHTTP(ctx context.Context, failpoint, payload string) error {
|
||||||
host := fmt.Sprintf("127.0.0.1:%d", f.member.Config().GoFailPort)
|
host := fmt.Sprintf("127.0.0.1:%d", f.member.Config().GoFailPort)
|
||||||
failpointUrl := url.URL{
|
failpointUrl := url.URL{
|
||||||
Scheme: "http",
|
Scheme: "http",
|
||||||
|
@ -66,6 +66,7 @@ var (
|
|||||||
RaftAfterWALReleasePanic Failpoint = goPanicFailpoint{"raftAfterWALRelease", triggerBlackhole{waitTillSnapshot: true}, Follower}
|
RaftAfterWALReleasePanic Failpoint = goPanicFailpoint{"raftAfterWALRelease", triggerBlackhole{waitTillSnapshot: true}, Follower}
|
||||||
RaftBeforeSaveSnapPanic Failpoint = goPanicFailpoint{"raftBeforeSaveSnap", triggerBlackhole{waitTillSnapshot: true}, Follower}
|
RaftBeforeSaveSnapPanic Failpoint = goPanicFailpoint{"raftBeforeSaveSnap", triggerBlackhole{waitTillSnapshot: true}, Follower}
|
||||||
RaftAfterSaveSnapPanic Failpoint = goPanicFailpoint{"raftAfterSaveSnap", triggerBlackhole{waitTillSnapshot: true}, Follower}
|
RaftAfterSaveSnapPanic Failpoint = goPanicFailpoint{"raftAfterSaveSnap", triggerBlackhole{waitTillSnapshot: true}, Follower}
|
||||||
|
beforeApplyOneConfChangeSleep Failpoint = killAndGofailSleep{"beforeApplyOneConfChange", time.Second}
|
||||||
allFailpoints = []Failpoint{
|
allFailpoints = []Failpoint{
|
||||||
KillFailpoint, BeforeCommitPanic, AfterCommitPanic, RaftBeforeSavePanic, RaftAfterSavePanic,
|
KillFailpoint, BeforeCommitPanic, AfterCommitPanic, RaftBeforeSavePanic, RaftAfterSavePanic,
|
||||||
DefragBeforeCopyPanic, DefragBeforeRenamePanic, BackendBeforePreCommitHookPanic, BackendAfterPreCommitHookPanic,
|
DefragBeforeCopyPanic, DefragBeforeRenamePanic, BackendBeforePreCommitHookPanic, BackendAfterPreCommitHookPanic,
|
||||||
@ -75,6 +76,7 @@ var (
|
|||||||
CompactAfterCommitBatchPanic, RaftBeforeLeaderSendPanic, BlackholePeerNetwork, DelayPeerNetwork,
|
CompactAfterCommitBatchPanic, RaftBeforeLeaderSendPanic, BlackholePeerNetwork, DelayPeerNetwork,
|
||||||
RaftBeforeFollowerSendPanic, RaftBeforeApplySnapPanic, RaftAfterApplySnapPanic, RaftAfterWALReleasePanic,
|
RaftBeforeFollowerSendPanic, RaftBeforeApplySnapPanic, RaftAfterApplySnapPanic, RaftAfterWALReleasePanic,
|
||||||
RaftBeforeSaveSnapPanic, RaftAfterSaveSnapPanic, BlackholeUntilSnapshot,
|
RaftBeforeSaveSnapPanic, RaftAfterSaveSnapPanic, BlackholeUntilSnapshot,
|
||||||
|
beforeApplyOneConfChangeSleep,
|
||||||
}
|
}
|
||||||
)
|
)
|
||||||
|
|
||||||
@ -252,7 +254,7 @@ func (f goPanicFailpoint) Inject(ctx context.Context, t *testing.T, lg *zap.Logg
|
|||||||
default:
|
default:
|
||||||
}
|
}
|
||||||
lg.Info("Setting up gofailpoint", zap.String("failpoint", f.Name()))
|
lg.Info("Setting up gofailpoint", zap.String("failpoint", f.Name()))
|
||||||
err := member.Failpoints().Setup(ctx, f.failpoint, "panic")
|
err := member.Failpoints().SetupHTTP(ctx, f.failpoint, "panic")
|
||||||
if err != nil {
|
if err != nil {
|
||||||
lg.Info("goFailpoint setup failed", zap.String("failpoint", f.Name()), zap.Error(err))
|
lg.Info("goFailpoint setup failed", zap.String("failpoint", f.Name()), zap.Error(err))
|
||||||
continue
|
continue
|
||||||
@ -318,7 +320,7 @@ func (f goPanicFailpoint) Available(config e2e.EtcdProcessClusterConfig, member
|
|||||||
}
|
}
|
||||||
|
|
||||||
func (f goPanicFailpoint) Name() string {
|
func (f goPanicFailpoint) Name() string {
|
||||||
return f.failpoint
|
return fmt.Sprintf("%s=panic()", f.failpoint)
|
||||||
}
|
}
|
||||||
|
|
||||||
type triggerDefrag struct{}
|
type triggerDefrag struct{}
|
||||||
@ -527,3 +529,48 @@ func (f delayPeerNetworkFailpoint) Name() string {
|
|||||||
func (f delayPeerNetworkFailpoint) Available(config e2e.EtcdProcessClusterConfig, clus e2e.EtcdProcess) bool {
|
func (f delayPeerNetworkFailpoint) Available(config e2e.EtcdProcessClusterConfig, clus e2e.EtcdProcess) bool {
|
||||||
return config.ClusterSize > 1 && clus.PeerProxy() != nil
|
return config.ClusterSize > 1 && clus.PeerProxy() != nil
|
||||||
}
|
}
|
||||||
|
|
||||||
|
type killAndGofailSleep struct {
|
||||||
|
failpoint string
|
||||||
|
time time.Duration
|
||||||
|
}
|
||||||
|
|
||||||
|
func (f killAndGofailSleep) Inject(ctx context.Context, t *testing.T, lg *zap.Logger, clus *e2e.EtcdProcessCluster) error {
|
||||||
|
member := clus.Procs[rand.Int()%len(clus.Procs)]
|
||||||
|
for member.IsRunning() {
|
||||||
|
err := member.Kill()
|
||||||
|
if err != nil {
|
||||||
|
lg.Info("Sending kill signal failed", zap.Error(err))
|
||||||
|
}
|
||||||
|
err = member.Wait(ctx)
|
||||||
|
if err != nil && !strings.Contains(err.Error(), "unexpected exit code") {
|
||||||
|
lg.Info("Failed to kill the process", zap.Error(err))
|
||||||
|
return fmt.Errorf("failed to kill the process within %s, err: %w", triggerTimeout, err)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
lg.Info("Setting up goFailpoint", zap.String("failpoint", f.Name()))
|
||||||
|
err := member.Failpoints().SetupEnv(f.failpoint, fmt.Sprintf(`sleep(%q)`, f.time))
|
||||||
|
if err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
err = member.Start(ctx)
|
||||||
|
if err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
// TODO: Check gofail status (https://github.com/etcd-io/gofail/pull/47) and wait for sleep to be executed at least once.
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
|
||||||
|
func (f killAndGofailSleep) Name() string {
|
||||||
|
return fmt.Sprintf("%s=sleep(%s)", f.failpoint, f.time)
|
||||||
|
}
|
||||||
|
|
||||||
|
func (f killAndGofailSleep) Available(config e2e.EtcdProcessClusterConfig, member e2e.EtcdProcess) bool {
|
||||||
|
memberFailpoints := member.Failpoints()
|
||||||
|
if memberFailpoints == nil {
|
||||||
|
return false
|
||||||
|
}
|
||||||
|
available := memberFailpoints.Available()
|
||||||
|
_, found := available[f.failpoint]
|
||||||
|
return found
|
||||||
|
}
|
||||||
|
Loading…
x
Reference in New Issue
Block a user