Merge pull request #17277 from ivanvc/fixes-etcdutl-memory-allocation-issue

etcdutl: Fix snapshot restore memory alloc issue
This commit is contained in:
Benjamin Wang 2024-02-14 11:41:14 +00:00 committed by GitHub
commit ccc4318478
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
3 changed files with 33 additions and 9 deletions

View File

@ -22,6 +22,7 @@ import (
"go.etcd.io/etcd/etcdutl/v3/snapshot" "go.etcd.io/etcd/etcdutl/v3/snapshot"
"go.etcd.io/etcd/pkg/v3/cobrautl" "go.etcd.io/etcd/pkg/v3/cobrautl"
"go.etcd.io/etcd/server/v3/storage/backend"
"go.etcd.io/etcd/server/v3/storage/datadir" "go.etcd.io/etcd/server/v3/storage/datadir"
) )
@ -38,6 +39,7 @@ var (
restorePeerURLs string restorePeerURLs string
restoreName string restoreName string
skipHashCheck bool skipHashCheck bool
initialMmapSize = backend.InitialMmapSize
markCompacted bool markCompacted bool
revisionBump uint64 revisionBump uint64
) )
@ -77,6 +79,7 @@ func NewSnapshotRestoreCommand() *cobra.Command {
cmd.Flags().StringVar(&restorePeerURLs, "initial-advertise-peer-urls", defaultInitialAdvertisePeerURLs, "List of this member's peer URLs to advertise to the rest of the cluster") cmd.Flags().StringVar(&restorePeerURLs, "initial-advertise-peer-urls", defaultInitialAdvertisePeerURLs, "List of this member's peer URLs to advertise to the rest of the cluster")
cmd.Flags().StringVar(&restoreName, "name", defaultName, "Human-readable name for this member") cmd.Flags().StringVar(&restoreName, "name", defaultName, "Human-readable name for this member")
cmd.Flags().BoolVar(&skipHashCheck, "skip-hash-check", false, "Ignore snapshot integrity hash value (required if copied from data directory)") cmd.Flags().BoolVar(&skipHashCheck, "skip-hash-check", false, "Ignore snapshot integrity hash value (required if copied from data directory)")
cmd.Flags().Uint64Var(&initialMmapSize, "initial-memory-map-size", initialMmapSize, "Initial memory map size of the database in bytes. It uses the default value if not defined or defined to 0")
cmd.Flags().Uint64Var(&revisionBump, "bump-revision", 0, "How much to increase the latest revision after restore") cmd.Flags().Uint64Var(&revisionBump, "bump-revision", 0, "How much to increase the latest revision after restore")
cmd.Flags().BoolVar(&markCompacted, "mark-compacted", false, "Mark the latest revision after restore as the point of scheduled compaction (required if --bump-revision > 0, disallowed otherwise)") cmd.Flags().BoolVar(&markCompacted, "mark-compacted", false, "Mark the latest revision after restore as the point of scheduled compaction (required if --bump-revision > 0, disallowed otherwise)")
@ -104,7 +107,7 @@ func SnapshotStatusCommandFunc(cmd *cobra.Command, args []string) {
func snapshotRestoreCommandFunc(_ *cobra.Command, args []string) { func snapshotRestoreCommandFunc(_ *cobra.Command, args []string) {
SnapshotRestoreCommandFunc(restoreCluster, restoreClusterToken, restoreDataDir, restoreWalDir, SnapshotRestoreCommandFunc(restoreCluster, restoreClusterToken, restoreDataDir, restoreWalDir,
restorePeerURLs, restoreName, skipHashCheck, revisionBump, markCompacted, args) restorePeerURLs, restoreName, skipHashCheck, initialMmapSize, revisionBump, markCompacted, args)
} }
func SnapshotRestoreCommandFunc(restoreCluster string, func SnapshotRestoreCommandFunc(restoreCluster string,
@ -114,6 +117,7 @@ func SnapshotRestoreCommandFunc(restoreCluster string,
restorePeerURLs string, restorePeerURLs string,
restoreName string, restoreName string,
skipHashCheck bool, skipHashCheck bool,
initialMmapSize uint64,
revisionBump uint64, revisionBump uint64,
markCompacted bool, markCompacted bool,
args []string) { args []string) {
@ -149,6 +153,7 @@ func SnapshotRestoreCommandFunc(restoreCluster string,
InitialCluster: restoreCluster, InitialCluster: restoreCluster,
InitialClusterToken: restoreClusterToken, InitialClusterToken: restoreClusterToken,
SkipHashCheck: skipHashCheck, SkipHashCheck: skipHashCheck,
InitialMmapSize: initialMmapSize,
RevisionBump: revisionBump, RevisionBump: revisionBump,
MarkCompacted: markCompacted, MarkCompacted: markCompacted,
}); err != nil { }); err != nil {

View File

@ -84,6 +84,7 @@ type v3Manager struct {
cl *membership.RaftCluster cl *membership.RaftCluster
skipHashCheck bool skipHashCheck bool
initialMmapSize uint64
} }
// hasChecksum returns "true" if the file size "n" // hasChecksum returns "true" if the file size "n"
@ -204,6 +205,9 @@ type RestoreConfig struct {
// (required if copied from data directory). // (required if copied from data directory).
SkipHashCheck bool SkipHashCheck bool
// InitialMmapSize is the database initial memory map size.
InitialMmapSize uint64
// RevisionBump is the amount to increase the latest revision after restore, // RevisionBump is the amount to increase the latest revision after restore,
// to allow administrators to trick clients into thinking that revision never decreased. // to allow administrators to trick clients into thinking that revision never decreased.
// If 0, revision bumping is skipped. // If 0, revision bumping is skipped.
@ -263,6 +267,7 @@ func (s *v3Manager) Restore(cfg RestoreConfig) error {
s.walDir = walDir s.walDir = walDir
s.snapDir = filepath.Join(dataDir, "member", "snap") s.snapDir = filepath.Join(dataDir, "member", "snap")
s.skipHashCheck = cfg.SkipHashCheck s.skipHashCheck = cfg.SkipHashCheck
s.initialMmapSize = cfg.InitialMmapSize
s.lg.Info( s.lg.Info(
"restoring snapshot", "restoring snapshot",
@ -270,6 +275,7 @@ func (s *v3Manager) Restore(cfg RestoreConfig) error {
zap.String("wal-dir", s.walDir), zap.String("wal-dir", s.walDir),
zap.String("data-dir", dataDir), zap.String("data-dir", dataDir),
zap.String("snap-dir", s.snapDir), zap.String("snap-dir", s.snapDir),
zap.Uint64("initial-memory-map-size", s.initialMmapSize),
) )
if err = s.saveDB(); err != nil { if err = s.saveDB(); err != nil {
@ -297,6 +303,7 @@ func (s *v3Manager) Restore(cfg RestoreConfig) error {
zap.String("wal-dir", s.walDir), zap.String("wal-dir", s.walDir),
zap.String("data-dir", dataDir), zap.String("data-dir", dataDir),
zap.String("snap-dir", s.snapDir), zap.String("snap-dir", s.snapDir),
zap.Uint64("initial-memory-map-size", s.initialMmapSize),
) )
return verify.VerifyIfEnabled(verify.Config{ return verify.VerifyIfEnabled(verify.Config{
@ -317,7 +324,7 @@ func (s *v3Manager) saveDB() error {
return err return err
} }
be := backend.NewDefaultBackend(s.lg, s.outDbPath()) be := backend.NewDefaultBackend(s.lg, s.outDbPath(), backend.WithMmapSize(s.initialMmapSize))
defer be.Close() defer be.Close()
err = schema.NewMembershipBackend(s.lg, be).TrimMembershipFromBackend() err = schema.NewMembershipBackend(s.lg, be).TrimMembershipFromBackend()
@ -472,7 +479,7 @@ func (s *v3Manager) saveWALAndSnap() (*raftpb.HardState, error) {
} }
// add members again to persist them to the backend we create. // add members again to persist them to the backend we create.
be := backend.NewDefaultBackend(s.lg, s.outDbPath()) be := backend.NewDefaultBackend(s.lg, s.outDbPath(), backend.WithMmapSize(s.initialMmapSize))
defer be.Close() defer be.Close()
s.cl.SetBackend(schema.NewMembershipBackend(s.lg, be)) s.cl.SetBackend(schema.NewMembershipBackend(s.lg, be))
for _, m := range s.cl.Members() { for _, m := range s.cl.Members() {
@ -551,7 +558,7 @@ func (s *v3Manager) saveWALAndSnap() (*raftpb.HardState, error) {
} }
func (s *v3Manager) updateCIndex(commit uint64, term uint64) error { func (s *v3Manager) updateCIndex(commit uint64, term uint64) error {
be := backend.NewDefaultBackend(s.lg, s.outDbPath()) be := backend.NewDefaultBackend(s.lg, s.outDbPath(), backend.WithMmapSize(s.initialMmapSize))
defer be.Close() defer be.Close()
cindex.UpdateConsistentIndexForce(be.BatchTx(), commit, term) cindex.UpdateConsistentIndexForce(be.BatchTx(), commit, term)

View File

@ -36,10 +36,10 @@ var (
defragLimit = 10000 defragLimit = 10000
// initialMmapSize is the initial size of the mmapped region. Setting this larger than // InitialMmapSize is the initial size of the mmapped region. Setting this larger than
// the potential max db size can prevent writer from blocking reader. // the potential max db size can prevent writer from blocking reader.
// This only works for linux. // This only works for linux.
initialMmapSize = uint64(10 * 1024 * 1024 * 1024) InitialMmapSize = uint64(10 * 1024 * 1024 * 1024)
// minSnapshotWarningTimeout is the minimum threshold to trigger a long running snapshot warning. // minSnapshotWarningTimeout is the minimum threshold to trigger a long running snapshot warning.
minSnapshotWarningTimeout = 30 * time.Second minSnapshotWarningTimeout = 30 * time.Second
@ -151,11 +151,13 @@ type BackendConfig struct {
Hooks Hooks Hooks Hooks
} }
type BackendConfigOption func(*BackendConfig)
func DefaultBackendConfig(lg *zap.Logger) BackendConfig { func DefaultBackendConfig(lg *zap.Logger) BackendConfig {
return BackendConfig{ return BackendConfig{
BatchInterval: defaultBatchInterval, BatchInterval: defaultBatchInterval,
BatchLimit: defaultBatchLimit, BatchLimit: defaultBatchLimit,
MmapSize: initialMmapSize, MmapSize: InitialMmapSize,
Logger: lg, Logger: lg,
} }
} }
@ -164,9 +166,19 @@ func New(bcfg BackendConfig) Backend {
return newBackend(bcfg) return newBackend(bcfg)
} }
func NewDefaultBackend(lg *zap.Logger, path string) Backend { func WithMmapSize(size uint64) BackendConfigOption {
return func(bcfg *BackendConfig) {
bcfg.MmapSize = size
}
}
func NewDefaultBackend(lg *zap.Logger, path string, opts ...BackendConfigOption) Backend {
bcfg := DefaultBackendConfig(lg) bcfg := DefaultBackendConfig(lg)
bcfg.Path = path bcfg.Path = path
for _, opt := range opts {
opt(&bcfg)
}
return newBackend(bcfg) return newBackend(bcfg)
} }