2018-05-10 22:56:10 -04:00
|
|
|
package restorer
|
2014-09-23 22:39:12 +02:00
|
|
|
|
|
|
|
import (
|
2017-06-04 11:16:55 +02:00
|
|
|
"context"
|
2018-04-13 10:02:09 -04:00
|
|
|
"os"
|
2014-09-23 22:39:12 +02:00
|
|
|
"path/filepath"
|
|
|
|
|
2018-04-13 10:02:09 -04:00
|
|
|
"github.com/restic/restic/internal/crypto"
|
2017-07-23 14:21:03 +02:00
|
|
|
"github.com/restic/restic/internal/errors"
|
2016-08-21 17:48:36 +02:00
|
|
|
|
2017-07-23 14:21:03 +02:00
|
|
|
"github.com/restic/restic/internal/debug"
|
|
|
|
"github.com/restic/restic/internal/fs"
|
2018-05-10 22:56:10 -04:00
|
|
|
"github.com/restic/restic/internal/restic"
|
2014-09-23 22:39:12 +02:00
|
|
|
)
|
|
|
|
|
2015-05-02 15:23:28 +02:00
|
|
|
// Restorer is used to restore a snapshot to a directory.
|
2014-09-23 22:39:12 +02:00
|
|
|
type Restorer struct {
|
2018-05-10 22:56:10 -04:00
|
|
|
repo restic.Repository
|
|
|
|
sn *restic.Snapshot
|
2014-09-23 22:39:12 +02:00
|
|
|
|
2018-05-10 22:56:10 -04:00
|
|
|
Error func(dir string, node *restic.Node, err error) error
|
|
|
|
SelectFilter func(item string, dstpath string, node *restic.Node) (selectedForRestore bool, childMayBeSelected bool)
|
2014-09-23 22:39:12 +02:00
|
|
|
}
|
|
|
|
|
2018-05-10 22:56:10 -04:00
|
|
|
var restorerAbortOnAllErrors = func(str string, node *restic.Node, err error) error { return err }
|
2015-04-29 20:59:06 -04:00
|
|
|
|
|
|
|
// NewRestorer creates a restorer preloaded with the content from the snapshot id.
|
2018-05-10 22:56:10 -04:00
|
|
|
func NewRestorer(repo restic.Repository, id restic.ID) (*Restorer, error) {
|
2015-07-08 22:35:41 +02:00
|
|
|
r := &Restorer{
|
|
|
|
repo: repo, Error: restorerAbortOnAllErrors,
|
2018-05-10 22:56:10 -04:00
|
|
|
SelectFilter: func(string, string, *restic.Node) (bool, bool) { return true, true },
|
2015-07-08 22:35:41 +02:00
|
|
|
}
|
2014-09-23 22:39:12 +02:00
|
|
|
|
|
|
|
var err error
|
|
|
|
|
2018-05-10 22:56:10 -04:00
|
|
|
r.sn, err = restic.LoadSnapshot(context.TODO(), repo, id)
|
2014-09-23 22:39:12 +02:00
|
|
|
if err != nil {
|
2016-08-21 17:24:13 +02:00
|
|
|
return nil, err
|
2014-09-23 22:39:12 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
return r, nil
|
|
|
|
}
|
|
|
|
|
2018-04-07 22:43:14 -04:00
|
|
|
type treeVisitor struct {
|
|
|
|
enterDir func(node *restic.Node, target, location string) error
|
|
|
|
visitNode func(node *restic.Node, target, location string) error
|
|
|
|
leaveDir func(node *restic.Node, target, location string) error
|
|
|
|
}
|
|
|
|
|
|
|
|
// traverseTree traverses a tree from the repo and calls treeVisitor.
|
|
|
|
// target is the path in the file system, location within the snapshot.
|
|
|
|
func (res *Restorer) traverseTree(ctx context.Context, target, location string, treeID restic.ID, visitor treeVisitor) error {
|
2018-01-25 20:49:41 +01:00
|
|
|
debug.Log("%v %v %v", target, location, treeID)
|
2017-06-04 11:16:55 +02:00
|
|
|
tree, err := res.repo.LoadTree(ctx, treeID)
|
2014-09-23 22:39:12 +02:00
|
|
|
if err != nil {
|
2018-01-25 20:49:41 +01:00
|
|
|
debug.Log("error loading tree %v: %v", treeID, err)
|
2017-11-26 15:17:12 +01:00
|
|
|
return res.Error(location, nil, err)
|
2014-09-23 22:39:12 +02:00
|
|
|
}
|
|
|
|
|
2015-01-10 23:40:10 +01:00
|
|
|
for _, node := range tree.Nodes {
|
2017-11-26 15:17:12 +01:00
|
|
|
|
|
|
|
// ensure that the node name does not contain anything that refers to a
|
|
|
|
// top-level directory.
|
|
|
|
nodeName := filepath.Base(filepath.Join(string(filepath.Separator), node.Name))
|
|
|
|
if nodeName != node.Name {
|
|
|
|
debug.Log("node %q has invalid name %q", node.Name, nodeName)
|
|
|
|
err := res.Error(location, node, errors.New("node has invalid name"))
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
nodeTarget := filepath.Join(target, nodeName)
|
|
|
|
nodeLocation := filepath.Join(location, nodeName)
|
|
|
|
|
|
|
|
if target == nodeTarget || !fs.HasPathPrefix(target, nodeTarget) {
|
2017-11-26 18:36:48 +01:00
|
|
|
debug.Log("target: %v %v", target, nodeTarget)
|
2017-11-26 15:17:12 +01:00
|
|
|
debug.Log("node %q has invalid target path %q", node.Name, nodeTarget)
|
|
|
|
err := res.Error(nodeLocation, node, errors.New("node has invalid path"))
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
2018-04-20 13:53:11 +02:00
|
|
|
// sockets cannot be restored
|
|
|
|
if node.Type == "socket" {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
2017-11-26 15:17:12 +01:00
|
|
|
selectedForRestore, childMayBeSelected := res.SelectFilter(nodeLocation, nodeTarget, node)
|
2017-07-07 11:54:10 +02:00
|
|
|
debug.Log("SelectFilter returned %v %v", selectedForRestore, childMayBeSelected)
|
2015-07-08 20:29:27 +02:00
|
|
|
|
2018-04-07 22:43:14 -04:00
|
|
|
sanitizeError := func(err error) error {
|
|
|
|
if err != nil {
|
|
|
|
err = res.Error(nodeTarget, node, err)
|
|
|
|
}
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
if node.Type == "dir" {
|
2014-09-23 22:39:12 +02:00
|
|
|
if node.Subtree == nil {
|
2016-08-21 17:48:36 +02:00
|
|
|
return errors.Errorf("Dir without subtree in tree %v", treeID.Str())
|
2014-09-23 22:39:12 +02:00
|
|
|
}
|
|
|
|
|
2018-04-07 22:43:14 -04:00
|
|
|
if selectedForRestore {
|
|
|
|
err = sanitizeError(visitor.enterDir(node, nodeTarget, nodeLocation))
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if childMayBeSelected {
|
|
|
|
err = sanitizeError(res.traverseTree(ctx, nodeTarget, nodeLocation, *node.Subtree, visitor))
|
2014-09-23 22:39:12 +02:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
restorer: Fix traverseTree
traverseTree() was meant to call enterDir() whenever a directory is
selected for restore, either explicitly or implicitly (=contains a file
which is to be restored). After restoring a file, leaveDir() is called
in reverse order for all intermediate directories so that the metadata
can be restored.
When a directory is selected implicitly, the metadata for it is
restored. This is different from the previous restorer behavior, which
created implicitly selected intermediate directories with permissions
0700 (only user can read/write it).
This commit changes the behavior back to the old one. Only a directory
is explicitly selected for restore, enterDir()/leaveDir() are called for
it. Otherwise, only visitNode() is called, so visitNode() needs to make
sure the parent directory exists. If the directory is explicitly
included, leaveDir() will then restore the metadata correctly.
When we decide to change the behavior (restore metadata for all
intermediate directories, even if selected implicitly), we should do
that in the selection functions, not here.
This finally resolves #1870
2018-07-21 22:39:12 +02:00
|
|
|
if selectedForRestore {
|
|
|
|
err = sanitizeError(visitor.leaveDir(node, nodeTarget, nodeLocation))
|
2018-04-20 13:53:11 +02:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2018-01-07 15:13:24 +01:00
|
|
|
}
|
restorer: Fix traverseTree
traverseTree() was meant to call enterDir() whenever a directory is
selected for restore, either explicitly or implicitly (=contains a file
which is to be restored). After restoring a file, leaveDir() is called
in reverse order for all intermediate directories so that the metadata
can be restored.
When a directory is selected implicitly, the metadata for it is
restored. This is different from the previous restorer behavior, which
created implicitly selected intermediate directories with permissions
0700 (only user can read/write it).
This commit changes the behavior back to the old one. Only a directory
is explicitly selected for restore, enterDir()/leaveDir() are called for
it. Otherwise, only visitNode() is called, so visitNode() needs to make
sure the parent directory exists. If the directory is explicitly
included, leaveDir() will then restore the metadata correctly.
When we decide to change the behavior (restore metadata for all
intermediate directories, even if selected implicitly), we should do
that in the selection functions, not here.
This finally resolves #1870
2018-07-21 22:39:12 +02:00
|
|
|
|
|
|
|
continue
|
2018-04-07 22:43:14 -04:00
|
|
|
}
|
2018-01-07 15:13:24 +01:00
|
|
|
|
restorer: Fix traverseTree
traverseTree() was meant to call enterDir() whenever a directory is
selected for restore, either explicitly or implicitly (=contains a file
which is to be restored). After restoring a file, leaveDir() is called
in reverse order for all intermediate directories so that the metadata
can be restored.
When a directory is selected implicitly, the metadata for it is
restored. This is different from the previous restorer behavior, which
created implicitly selected intermediate directories with permissions
0700 (only user can read/write it).
This commit changes the behavior back to the old one. Only a directory
is explicitly selected for restore, enterDir()/leaveDir() are called for
it. Otherwise, only visitNode() is called, so visitNode() needs to make
sure the parent directory exists. If the directory is explicitly
included, leaveDir() will then restore the metadata correctly.
When we decide to change the behavior (restore metadata for all
intermediate directories, even if selected implicitly), we should do
that in the selection functions, not here.
This finally resolves #1870
2018-07-21 22:39:12 +02:00
|
|
|
if selectedForRestore {
|
|
|
|
err = sanitizeError(visitor.visitNode(node, nodeTarget, nodeLocation))
|
2018-01-07 15:13:24 +01:00
|
|
|
if err != nil {
|
restorer: Fix traverseTree
traverseTree() was meant to call enterDir() whenever a directory is
selected for restore, either explicitly or implicitly (=contains a file
which is to be restored). After restoring a file, leaveDir() is called
in reverse order for all intermediate directories so that the metadata
can be restored.
When a directory is selected implicitly, the metadata for it is
restored. This is different from the previous restorer behavior, which
created implicitly selected intermediate directories with permissions
0700 (only user can read/write it).
This commit changes the behavior back to the old one. Only a directory
is explicitly selected for restore, enterDir()/leaveDir() are called for
it. Otherwise, only visitNode() is called, so visitNode() needs to make
sure the parent directory exists. If the directory is explicitly
included, leaveDir() will then restore the metadata correctly.
When we decide to change the behavior (restore metadata for all
intermediate directories, even if selected implicitly), we should do
that in the selection functions, not here.
This finally resolves #1870
2018-07-21 22:39:12 +02:00
|
|
|
return err
|
2015-05-14 15:58:26 +02:00
|
|
|
}
|
2015-05-13 23:11:31 -04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-09-23 22:39:12 +02:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2018-05-10 22:56:10 -04:00
|
|
|
func (res *Restorer) restoreNodeTo(ctx context.Context, node *restic.Node, target, location string, idx *restic.HardlinkIndex) error {
|
2018-04-07 22:43:14 -04:00
|
|
|
debug.Log("restoreNode %v %v %v", node.Name, target, location)
|
2015-04-29 20:59:06 -04:00
|
|
|
|
2017-11-26 15:17:12 +01:00
|
|
|
err := node.CreateAt(ctx, target, res.repo, idx)
|
2015-07-06 23:59:28 +02:00
|
|
|
if err != nil {
|
2017-11-26 15:17:12 +01:00
|
|
|
debug.Log("node.CreateAt(%s) error %v", target, err)
|
2015-07-06 23:59:28 +02:00
|
|
|
}
|
2018-04-07 22:43:14 -04:00
|
|
|
if err == nil {
|
|
|
|
err = res.restoreNodeMetadataTo(node, target, location)
|
2015-04-29 20:59:06 -04:00
|
|
|
}
|
|
|
|
|
2018-04-07 22:43:14 -04:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
func (res *Restorer) restoreNodeMetadataTo(node *restic.Node, target, location string) error {
|
|
|
|
debug.Log("restoreNodeMetadata %v %v %v", node.Name, target, location)
|
|
|
|
err := node.RestoreMetadata(target)
|
2015-04-29 20:59:06 -04:00
|
|
|
if err != nil {
|
2018-04-07 22:43:14 -04:00
|
|
|
debug.Log("node.RestoreMetadata(%s) error %v", target, err)
|
2015-04-29 20:59:06 -04:00
|
|
|
}
|
2018-04-07 22:43:14 -04:00
|
|
|
return err
|
2015-04-29 20:59:06 -04:00
|
|
|
}
|
|
|
|
|
2017-03-02 14:52:18 +01:00
|
|
|
// RestoreTo creates the directories and files in the snapshot below dst.
|
2014-09-23 22:39:12 +02:00
|
|
|
// Before an item is created, res.Filter is called.
|
2017-06-04 11:16:55 +02:00
|
|
|
func (res *Restorer) RestoreTo(ctx context.Context, dst string) error {
|
2017-11-26 18:36:48 +01:00
|
|
|
var err error
|
|
|
|
if !filepath.IsAbs(dst) {
|
|
|
|
dst, err = filepath.Abs(dst)
|
|
|
|
if err != nil {
|
|
|
|
return errors.Wrap(err, "Abs")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-07-15 16:02:04 +02:00
|
|
|
// make sure the target directory exists
|
|
|
|
err = fs.MkdirAll(dst, 0777) // umask takes care of dir permissions
|
|
|
|
if err != nil {
|
|
|
|
return errors.Wrap(err, "MkdirAll")
|
|
|
|
}
|
|
|
|
|
2018-05-10 22:56:10 -04:00
|
|
|
idx := restic.NewHardlinkIndex()
|
2018-04-07 22:43:14 -04:00
|
|
|
return res.traverseTree(ctx, dst, string(filepath.Separator), *res.sn.Tree, treeVisitor{
|
|
|
|
enterDir: func(node *restic.Node, target, location string) error {
|
|
|
|
// create dir with default permissions
|
|
|
|
// #leaveDir restores dir metadata after visiting all children
|
|
|
|
return fs.MkdirAll(target, 0700)
|
|
|
|
},
|
|
|
|
visitNode: func(node *restic.Node, target, location string) error {
|
restorer: Fix traverseTree
traverseTree() was meant to call enterDir() whenever a directory is
selected for restore, either explicitly or implicitly (=contains a file
which is to be restored). After restoring a file, leaveDir() is called
in reverse order for all intermediate directories so that the metadata
can be restored.
When a directory is selected implicitly, the metadata for it is
restored. This is different from the previous restorer behavior, which
created implicitly selected intermediate directories with permissions
0700 (only user can read/write it).
This commit changes the behavior back to the old one. Only a directory
is explicitly selected for restore, enterDir()/leaveDir() are called for
it. Otherwise, only visitNode() is called, so visitNode() needs to make
sure the parent directory exists. If the directory is explicitly
included, leaveDir() will then restore the metadata correctly.
When we decide to change the behavior (restore metadata for all
intermediate directories, even if selected implicitly), we should do
that in the selection functions, not here.
This finally resolves #1870
2018-07-21 22:39:12 +02:00
|
|
|
// create parent dir with default permissions
|
|
|
|
// #leaveDir restores dir metadata after visiting all children
|
|
|
|
err := fs.MkdirAll(filepath.Dir(target), 0700)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2018-04-07 22:43:14 -04:00
|
|
|
return res.restoreNodeTo(ctx, node, target, location, idx)
|
|
|
|
},
|
|
|
|
leaveDir: func(node *restic.Node, target, location string) error {
|
|
|
|
// Restore directory permissions and timestamp at the end. If we did it earlier
|
|
|
|
// - children restore could fail because of restictive directory permission
|
|
|
|
// - children restore could overwrite the timestamp of the directory they are in
|
|
|
|
return res.restoreNodeMetadataTo(node, target, location)
|
|
|
|
},
|
|
|
|
})
|
2014-09-23 22:39:12 +02:00
|
|
|
}
|
|
|
|
|
2015-05-02 15:23:28 +02:00
|
|
|
// Snapshot returns the snapshot this restorer is configured to use.
|
2018-05-10 22:56:10 -04:00
|
|
|
func (res *Restorer) Snapshot() *restic.Snapshot {
|
2014-09-23 22:39:12 +02:00
|
|
|
return res.sn
|
|
|
|
}
|
2018-04-13 10:02:09 -04:00
|
|
|
|
|
|
|
// VerifyFiles reads all snapshot files and verifies their contents
|
|
|
|
func (res *Restorer) VerifyFiles(ctx context.Context, dst string) (int, error) {
|
|
|
|
// TODO multithreaded?
|
|
|
|
|
|
|
|
count := 0
|
|
|
|
err := res.traverseTree(ctx, dst, string(filepath.Separator), *res.sn.Tree, treeVisitor{
|
|
|
|
enterDir: func(node *restic.Node, target, location string) error { return nil },
|
|
|
|
visitNode: func(node *restic.Node, target, location string) error {
|
|
|
|
if node.Type != "file" {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
count++
|
|
|
|
stat, err := os.Stat(target)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if int64(node.Size) != stat.Size() {
|
|
|
|
return errors.Errorf("Invalid file size: expected %d got %d", node.Size, stat.Size())
|
|
|
|
}
|
|
|
|
|
|
|
|
offset := int64(0)
|
|
|
|
for _, blobID := range node.Content {
|
|
|
|
rd, err := os.Open(target)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
blobs, _ := res.repo.Index().Lookup(blobID, restic.DataBlob)
|
|
|
|
length := blobs[0].Length - uint(crypto.Extension)
|
|
|
|
buf := make([]byte, length) // TODO do I want to reuse the buffer somehow?
|
|
|
|
_, err = rd.ReadAt(buf, offset)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if !blobID.Equal(restic.Hash(buf)) {
|
|
|
|
return errors.Errorf("Unexpected contents starting at offset %d", offset)
|
|
|
|
}
|
|
|
|
offset += int64(length)
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
},
|
|
|
|
leaveDir: func(node *restic.Node, target, location string) error { return nil },
|
|
|
|
})
|
|
|
|
|
|
|
|
return count, err
|
|
|
|
}
|