123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475 |
- // Copyright 2016 The etcd Authors
- //
- // Licensed under the Apache License, Version 2.0 (the "License");
- // you may not use this file except in compliance with the License.
- // You may obtain a copy of the License at
- //
- // http://www.apache.org/licenses/LICENSE-2.0
- //
- // Unless required by applicable law or agreed to in writing, software
- // distributed under the License is distributed on an "AS IS" BASIS,
- // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- // See the License for the specific language governing permissions and
- // limitations under the License.
- package command
- import (
- "context"
- "crypto/sha256"
- "encoding/binary"
- "encoding/json"
- "fmt"
- "hash/crc32"
- "io"
- "math"
- "os"
- "path/filepath"
- "reflect"
- "strings"
- "github.com/coreos/etcd/etcdserver"
- "github.com/coreos/etcd/etcdserver/etcdserverpb"
- "github.com/coreos/etcd/etcdserver/membership"
- "github.com/coreos/etcd/lease"
- "github.com/coreos/etcd/mvcc"
- "github.com/coreos/etcd/mvcc/backend"
- "github.com/coreos/etcd/pkg/fileutil"
- "github.com/coreos/etcd/pkg/types"
- "github.com/coreos/etcd/raft"
- "github.com/coreos/etcd/raft/raftpb"
- "github.com/coreos/etcd/snap"
- "github.com/coreos/etcd/store"
- "github.com/coreos/etcd/wal"
- "github.com/coreos/etcd/wal/walpb"
- bolt "github.com/coreos/bbolt"
- "github.com/spf13/cobra"
- )
- const (
- defaultName = "default"
- defaultInitialAdvertisePeerURLs = "http://localhost:2380"
- )
- var (
- restoreCluster string
- restoreClusterToken string
- restoreDataDir string
- restoreWalDir string
- restorePeerURLs string
- restoreName string
- skipHashCheck bool
- )
- // NewSnapshotCommand returns the cobra command for "snapshot".
- func NewSnapshotCommand() *cobra.Command {
- cmd := &cobra.Command{
- Use: "snapshot <subcommand>",
- Short: "Manages etcd node snapshots",
- }
- cmd.AddCommand(NewSnapshotSaveCommand())
- cmd.AddCommand(NewSnapshotRestoreCommand())
- cmd.AddCommand(newSnapshotStatusCommand())
- return cmd
- }
- func NewSnapshotSaveCommand() *cobra.Command {
- return &cobra.Command{
- Use: "save <filename>",
- Short: "Stores an etcd node backend snapshot to a given file",
- Run: snapshotSaveCommandFunc,
- }
- }
- func newSnapshotStatusCommand() *cobra.Command {
- return &cobra.Command{
- Use: "status <filename>",
- Short: "Gets backend snapshot status of a given file",
- Long: `When --write-out is set to simple, this command prints out comma-separated status lists for each endpoint.
- The items in the lists are hash, revision, total keys, total size.
- `,
- Run: snapshotStatusCommandFunc,
- }
- }
- func NewSnapshotRestoreCommand() *cobra.Command {
- cmd := &cobra.Command{
- Use: "restore <filename> [options]",
- Short: "Restores an etcd member snapshot to an etcd directory",
- Run: snapshotRestoreCommandFunc,
- }
- cmd.Flags().StringVar(&restoreDataDir, "data-dir", "", "Path to the data directory")
- cmd.Flags().StringVar(&restoreWalDir, "wal-dir", "", "Path to the WAL directory (use --data-dir if none given)")
- cmd.Flags().StringVar(&restoreCluster, "initial-cluster", initialClusterFromName(defaultName), "Initial cluster configuration for restore bootstrap")
- cmd.Flags().StringVar(&restoreClusterToken, "initial-cluster-token", "etcd-cluster", "Initial cluster token for the etcd cluster during restore bootstrap")
- cmd.Flags().StringVar(&restorePeerURLs, "initial-advertise-peer-urls", defaultInitialAdvertisePeerURLs, "List of this member's peer URLs to advertise to the rest of the cluster")
- cmd.Flags().StringVar(&restoreName, "name", defaultName, "Human-readable name for this member")
- cmd.Flags().BoolVar(&skipHashCheck, "skip-hash-check", false, "Ignore snapshot integrity hash value (required if copied from data directory)")
- return cmd
- }
- func snapshotSaveCommandFunc(cmd *cobra.Command, args []string) {
- if len(args) != 1 {
- err := fmt.Errorf("snapshot save expects one argument")
- ExitWithError(ExitBadArgs, err)
- }
- path := args[0]
- partpath := path + ".part"
- f, err := os.Create(partpath)
- if err != nil {
- exiterr := fmt.Errorf("could not open %s (%v)", partpath, err)
- ExitWithError(ExitBadArgs, exiterr)
- }
- c := mustClientFromCmd(cmd)
- r, serr := c.Snapshot(context.TODO())
- if serr != nil {
- os.RemoveAll(partpath)
- ExitWithError(ExitInterrupted, serr)
- }
- if _, rerr := io.Copy(f, r); rerr != nil {
- os.RemoveAll(partpath)
- ExitWithError(ExitInterrupted, rerr)
- }
- fileutil.Fsync(f)
- f.Close()
- if rerr := os.Rename(partpath, path); rerr != nil {
- exiterr := fmt.Errorf("could not rename %s to %s (%v)", partpath, path, rerr)
- ExitWithError(ExitIO, exiterr)
- }
- fmt.Printf("Snapshot saved at %s\n", path)
- }
- func snapshotStatusCommandFunc(cmd *cobra.Command, args []string) {
- if len(args) != 1 {
- err := fmt.Errorf("snapshot status requires exactly one argument")
- ExitWithError(ExitBadArgs, err)
- }
- initDisplayFromCmd(cmd)
- ds := dbStatus(args[0])
- display.DBStatus(ds)
- }
- func snapshotRestoreCommandFunc(cmd *cobra.Command, args []string) {
- if len(args) != 1 {
- err := fmt.Errorf("snapshot restore requires exactly one argument")
- ExitWithError(ExitBadArgs, err)
- }
- urlmap, uerr := types.NewURLsMap(restoreCluster)
- if uerr != nil {
- ExitWithError(ExitBadArgs, uerr)
- }
- cfg := etcdserver.ServerConfig{
- InitialClusterToken: restoreClusterToken,
- InitialPeerURLsMap: urlmap,
- PeerURLs: types.MustNewURLs(strings.Split(restorePeerURLs, ",")),
- Name: restoreName,
- }
- if err := cfg.VerifyBootstrap(); err != nil {
- ExitWithError(ExitBadArgs, err)
- }
- cl, cerr := membership.NewClusterFromURLsMap(restoreClusterToken, urlmap)
- if cerr != nil {
- ExitWithError(ExitBadArgs, cerr)
- }
- basedir := restoreDataDir
- if basedir == "" {
- basedir = restoreName + ".etcd"
- }
- waldir := restoreWalDir
- if waldir == "" {
- waldir = filepath.Join(basedir, "member", "wal")
- }
- snapdir := filepath.Join(basedir, "member", "snap")
- if _, err := os.Stat(basedir); err == nil {
- ExitWithError(ExitInvalidInput, fmt.Errorf("data-dir %q exists", basedir))
- }
- makeDB(snapdir, args[0], len(cl.Members()))
- makeWALAndSnap(waldir, snapdir, cl)
- }
- func initialClusterFromName(name string) string {
- n := name
- if name == "" {
- n = defaultName
- }
- return fmt.Sprintf("%s=http://localhost:2380", n)
- }
- // makeWAL creates a WAL for the initial cluster
- func makeWALAndSnap(waldir, snapdir string, cl *membership.RaftCluster) {
- if err := fileutil.CreateDirAll(waldir); err != nil {
- ExitWithError(ExitIO, err)
- }
- // add members again to persist them to the store we create.
- st := store.New(etcdserver.StoreClusterPrefix, etcdserver.StoreKeysPrefix)
- cl.SetStore(st)
- for _, m := range cl.Members() {
- cl.AddMember(m)
- }
- m := cl.MemberByName(restoreName)
- md := &etcdserverpb.Metadata{NodeID: uint64(m.ID), ClusterID: uint64(cl.ID())}
- metadata, merr := md.Marshal()
- if merr != nil {
- ExitWithError(ExitInvalidInput, merr)
- }
- w, walerr := wal.Create(waldir, metadata)
- if walerr != nil {
- ExitWithError(ExitIO, walerr)
- }
- defer w.Close()
- peers := make([]raft.Peer, len(cl.MemberIDs()))
- for i, id := range cl.MemberIDs() {
- ctx, err := json.Marshal((*cl).Member(id))
- if err != nil {
- ExitWithError(ExitInvalidInput, err)
- }
- peers[i] = raft.Peer{ID: uint64(id), Context: ctx}
- }
- ents := make([]raftpb.Entry, len(peers))
- nodeIDs := make([]uint64, len(peers))
- for i, p := range peers {
- nodeIDs[i] = p.ID
- cc := raftpb.ConfChange{
- Type: raftpb.ConfChangeAddNode,
- NodeID: p.ID,
- Context: p.Context}
- d, err := cc.Marshal()
- if err != nil {
- ExitWithError(ExitInvalidInput, err)
- }
- e := raftpb.Entry{
- Type: raftpb.EntryConfChange,
- Term: 1,
- Index: uint64(i + 1),
- Data: d,
- }
- ents[i] = e
- }
- commit, term := uint64(len(ents)), uint64(1)
- if err := w.Save(raftpb.HardState{
- Term: term,
- Vote: peers[0].ID,
- Commit: commit}, ents); err != nil {
- ExitWithError(ExitIO, err)
- }
- b, berr := st.Save()
- if berr != nil {
- ExitWithError(ExitError, berr)
- }
- raftSnap := raftpb.Snapshot{
- Data: b,
- Metadata: raftpb.SnapshotMetadata{
- Index: commit,
- Term: term,
- ConfState: raftpb.ConfState{
- Nodes: nodeIDs,
- },
- },
- }
- snapshotter := snap.New(snapdir)
- if err := snapshotter.SaveSnap(raftSnap); err != nil {
- panic(err)
- }
- if err := w.SaveSnapshot(walpb.Snapshot{Index: commit, Term: term}); err != nil {
- ExitWithError(ExitIO, err)
- }
- }
- // initIndex implements ConsistentIndexGetter so the snapshot won't block
- // the new raft instance by waiting for a future raft index.
- type initIndex int
- func (i *initIndex) ConsistentIndex() uint64 { return uint64(*i) }
- // makeDB copies the database snapshot to the snapshot directory
- func makeDB(snapdir, dbfile string, commit int) {
- f, ferr := os.OpenFile(dbfile, os.O_RDONLY, 0600)
- if ferr != nil {
- ExitWithError(ExitInvalidInput, ferr)
- }
- defer f.Close()
- // get snapshot integrity hash
- if _, err := f.Seek(-sha256.Size, io.SeekEnd); err != nil {
- ExitWithError(ExitIO, err)
- }
- sha := make([]byte, sha256.Size)
- if _, err := f.Read(sha); err != nil {
- ExitWithError(ExitIO, err)
- }
- if _, err := f.Seek(0, io.SeekStart); err != nil {
- ExitWithError(ExitIO, err)
- }
- if err := fileutil.CreateDirAll(snapdir); err != nil {
- ExitWithError(ExitIO, err)
- }
- dbpath := filepath.Join(snapdir, "db")
- db, dberr := os.OpenFile(dbpath, os.O_RDWR|os.O_CREATE, 0600)
- if dberr != nil {
- ExitWithError(ExitIO, dberr)
- }
- if _, err := io.Copy(db, f); err != nil {
- ExitWithError(ExitIO, err)
- }
- // truncate away integrity hash, if any.
- off, serr := db.Seek(0, io.SeekEnd)
- if serr != nil {
- ExitWithError(ExitIO, serr)
- }
- hasHash := (off % 512) == sha256.Size
- if hasHash {
- if err := db.Truncate(off - sha256.Size); err != nil {
- ExitWithError(ExitIO, err)
- }
- }
- if !hasHash && !skipHashCheck {
- err := fmt.Errorf("snapshot missing hash but --skip-hash-check=false")
- ExitWithError(ExitBadArgs, err)
- }
- if hasHash && !skipHashCheck {
- // check for match
- if _, err := db.Seek(0, io.SeekStart); err != nil {
- ExitWithError(ExitIO, err)
- }
- h := sha256.New()
- if _, err := io.Copy(h, db); err != nil {
- ExitWithError(ExitIO, err)
- }
- dbsha := h.Sum(nil)
- if !reflect.DeepEqual(sha, dbsha) {
- err := fmt.Errorf("expected sha256 %v, got %v", sha, dbsha)
- ExitWithError(ExitInvalidInput, err)
- }
- }
- // db hash is OK, can now modify DB so it can be part of a new cluster
- db.Close()
- // update consistentIndex so applies go through on etcdserver despite
- // having a new raft instance
- be := backend.NewDefaultBackend(dbpath)
- // a lessor never timeouts leases
- lessor := lease.NewLessor(be, math.MaxInt64)
- s := mvcc.NewStore(be, lessor, (*initIndex)(&commit))
- txn := s.Write()
- btx := be.BatchTx()
- del := func(k, v []byte) error {
- txn.DeleteRange(k, nil)
- return nil
- }
- // delete stored members from old cluster since using new members
- btx.UnsafeForEach([]byte("members"), del)
- // todo: add back new members when we start to deprecate old snap file.
- btx.UnsafeForEach([]byte("members_removed"), del)
- // trigger write-out of new consistent index
- txn.End()
- s.Commit()
- s.Close()
- be.Close()
- }
- type dbstatus struct {
- Hash uint32 `json:"hash"`
- Revision int64 `json:"revision"`
- TotalKey int `json:"totalKey"`
- TotalSize int64 `json:"totalSize"`
- }
- func dbStatus(p string) dbstatus {
- if _, err := os.Stat(p); err != nil {
- ExitWithError(ExitError, err)
- }
- ds := dbstatus{}
- db, err := bolt.Open(p, 0400, &bolt.Options{ReadOnly: true})
- if err != nil {
- ExitWithError(ExitError, err)
- }
- defer db.Close()
- h := crc32.New(crc32.MakeTable(crc32.Castagnoli))
- err = db.View(func(tx *bolt.Tx) error {
- // check snapshot file integrity first
- var dbErrStrings []string
- for dbErr := range tx.Check() {
- dbErrStrings = append(dbErrStrings, dbErr.Error())
- }
- if len(dbErrStrings) > 0 {
- return fmt.Errorf("snapshot file integrity check failed. %d errors found.\n"+strings.Join(dbErrStrings, "\n"), len(dbErrStrings))
- }
- ds.TotalSize = tx.Size()
- c := tx.Cursor()
- for next, _ := c.First(); next != nil; next, _ = c.Next() {
- b := tx.Bucket(next)
- if b == nil {
- return fmt.Errorf("cannot get hash of bucket %s", string(next))
- }
- h.Write(next)
- iskeyb := (string(next) == "key")
- b.ForEach(func(k, v []byte) error {
- h.Write(k)
- h.Write(v)
- if iskeyb {
- rev := bytesToRev(k)
- ds.Revision = rev.main
- }
- ds.TotalKey++
- return nil
- })
- }
- return nil
- })
- if err != nil {
- ExitWithError(ExitError, err)
- }
- ds.Hash = h.Sum32()
- return ds
- }
- type revision struct {
- main int64
- sub int64
- }
- func bytesToRev(bytes []byte) revision {
- return revision{
- main: int64(binary.BigEndian.Uint64(bytes[0:8])),
- sub: int64(binary.BigEndian.Uint64(bytes[9:])),
- }
- }
|