2014-07-12 22:45:33 +00:00
|
|
|
// Copyright (C) 2014 Jakob Borg and Contributors (see the CONTRIBUTORS file).
|
|
|
|
// All rights reserved. Use of this source code is governed by an MIT-style
|
|
|
|
// license that can be found in the LICENSE file.
|
2014-06-01 20:50:14 +00:00
|
|
|
|
2014-03-08 22:02:01 +00:00
|
|
|
package scanner
|
|
|
|
|
|
|
|
import (
|
|
|
|
"bytes"
|
2014-05-04 16:20:25 +00:00
|
|
|
"errors"
|
2014-06-16 14:18:19 +00:00
|
|
|
"fmt"
|
2014-03-08 22:02:01 +00:00
|
|
|
"io/ioutil"
|
|
|
|
"os"
|
|
|
|
"path/filepath"
|
2014-05-19 21:42:08 +00:00
|
|
|
"runtime"
|
2014-03-08 22:02:01 +00:00
|
|
|
"strings"
|
2014-07-15 12:27:46 +00:00
|
|
|
"code.google.com/p/go.text/unicode/norm"
|
2014-03-21 08:09:01 +00:00
|
|
|
|
2014-08-01 14:35:37 +00:00
|
|
|
"github.com/syncthing/syncthing/lamport"
|
|
|
|
"github.com/syncthing/syncthing/protocol"
|
2014-03-08 22:02:01 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
type Walker struct {
|
|
|
|
// Dir is the base directory for the walk
|
|
|
|
Dir string
|
2014-08-11 18:20:01 +00:00
|
|
|
// Limit walking to this path within Dir, or no limit if Sub is blank
|
|
|
|
Sub string
|
2014-03-08 22:02:01 +00:00
|
|
|
// BlockSize controls the size of the block used when hashing.
|
|
|
|
BlockSize int
|
|
|
|
// If IgnoreFile is not empty, it is the name used for the file that holds ignore patterns.
|
|
|
|
IgnoreFile string
|
|
|
|
// If TempNamer is not nil, it is used to ignore tempory files when walking.
|
|
|
|
TempNamer TempNamer
|
2014-03-16 07:14:55 +00:00
|
|
|
// If CurrentFiler is not nil, it is queried for the current file before rescanning.
|
|
|
|
CurrentFiler CurrentFiler
|
2014-05-23 12:31:16 +00:00
|
|
|
// If IgnorePerms is true, changes to permission bits will not be
|
2014-05-23 11:10:26 +00:00
|
|
|
// detected. Scanned files will get zero permission bits and the
|
|
|
|
// NoPermissionBits flag set.
|
2014-05-23 12:31:16 +00:00
|
|
|
IgnorePerms bool
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// TempNamer translates between regular file names and the names of their
// temporary counterparts.
type TempNamer interface {
	// TempName returns the temporary name for the file referred to by path.
	TempName(path string) string
	// IsTemporary reports whether path is the name of a temporary file.
	IsTemporary(path string) bool
}
|
|
|
|
|
2014-03-16 07:14:55 +00:00
|
|
|
type CurrentFiler interface {
|
|
|
|
// CurrentFile returns the file as seen at last scan.
|
2014-07-12 21:06:48 +00:00
|
|
|
CurrentFile(name string) protocol.FileInfo
|
2014-03-16 07:14:55 +00:00
|
|
|
}
|
|
|
|
|
2014-03-08 22:02:01 +00:00
|
|
|
// Walk returns the list of files found in the local repository by scanning the
|
|
|
|
// file system. Files are blockwise hashed.
|
2014-07-30 18:10:46 +00:00
|
|
|
func (w *Walker) Walk() (chan protocol.FileInfo, map[string][]string, error) {
|
2014-03-08 22:02:01 +00:00
|
|
|
if debug {
|
2014-08-11 18:20:01 +00:00
|
|
|
l.Debugln("Walk", w.Dir, w.Sub, w.BlockSize, w.IgnoreFile)
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
2014-05-04 16:20:25 +00:00
|
|
|
|
2014-07-30 18:10:46 +00:00
|
|
|
err := checkDir(w.Dir)
|
2014-05-04 16:20:25 +00:00
|
|
|
if err != nil {
|
2014-07-30 18:10:46 +00:00
|
|
|
return nil, nil, err
|
2014-05-04 16:20:25 +00:00
|
|
|
}
|
|
|
|
|
2014-07-30 18:10:46 +00:00
|
|
|
ignore := make(map[string][]string)
|
|
|
|
files := make(chan protocol.FileInfo)
|
|
|
|
hashedFiles := make(chan protocol.FileInfo)
|
|
|
|
newParallelHasher(w.Dir, w.BlockSize, runtime.NumCPU(), hashedFiles, files)
|
2014-07-15 12:27:46 +00:00
|
|
|
hashFiles := w.walkAndHashFiles(files, ignore)
|
2014-03-08 22:02:01 +00:00
|
|
|
|
2014-07-15 12:27:46 +00:00
|
|
|
go func() {
|
|
|
|
filepath.Walk(w.Dir, w.loadIgnoreFiles(w.Dir, ignore))
|
2014-08-11 18:20:01 +00:00
|
|
|
filepath.Walk(filepath.Join(w.Dir, w.Sub), hashFiles)
|
2014-07-15 12:27:46 +00:00
|
|
|
close(files)
|
|
|
|
}()
|
2014-03-08 22:02:01 +00:00
|
|
|
|
2014-07-30 18:10:46 +00:00
|
|
|
return hashedFiles, ignore, nil
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// CleanTempFiles removes all files that match the temporary filename pattern.
|
|
|
|
func (w *Walker) CleanTempFiles() {
|
|
|
|
filepath.Walk(w.Dir, w.cleanTempFile)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (w *Walker) loadIgnoreFiles(dir string, ign map[string][]string) filepath.WalkFunc {
|
|
|
|
return func(p string, info os.FileInfo, err error) error {
|
|
|
|
if err != nil {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-03-08 22:18:50 +00:00
|
|
|
rn, err := filepath.Rel(dir, p)
|
2014-03-08 22:02:01 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-03-28 13:36:57 +00:00
|
|
|
if pn, sn := filepath.Split(rn); sn == w.IgnoreFile {
|
2014-06-16 14:18:19 +00:00
|
|
|
pn := filepath.Clean(pn)
|
2014-03-08 22:02:01 +00:00
|
|
|
bs, _ := ioutil.ReadFile(p)
|
|
|
|
lines := bytes.Split(bs, []byte("\n"))
|
|
|
|
var patterns []string
|
|
|
|
for _, line := range lines {
|
2014-06-16 14:18:19 +00:00
|
|
|
lineStr := strings.TrimSpace(string(line))
|
|
|
|
if len(lineStr) > 0 {
|
|
|
|
patterns = append(patterns, lineStr)
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
ign[pn] = patterns
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-07-15 12:27:46 +00:00
|
|
|
func (w *Walker) walkAndHashFiles(fchan chan protocol.FileInfo, ign map[string][]string) filepath.WalkFunc {
|
2014-03-08 22:02:01 +00:00
|
|
|
return func(p string, info os.FileInfo, err error) error {
|
|
|
|
if err != nil {
|
|
|
|
if debug {
|
2014-05-15 00:08:56 +00:00
|
|
|
l.Debugln("error:", p, info, err)
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-03-08 22:18:50 +00:00
|
|
|
rn, err := filepath.Rel(w.Dir, p)
|
2014-03-08 22:02:01 +00:00
|
|
|
if err != nil {
|
2014-03-08 22:18:50 +00:00
|
|
|
if debug {
|
2014-05-15 00:08:56 +00:00
|
|
|
l.Debugln("rel error:", p, err)
|
2014-03-08 22:18:50 +00:00
|
|
|
}
|
2014-03-08 22:02:01 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-04-01 21:18:32 +00:00
|
|
|
if rn == "." {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-03-08 22:18:50 +00:00
|
|
|
if w.TempNamer != nil && w.TempNamer.IsTemporary(rn) {
|
2014-04-01 21:18:32 +00:00
|
|
|
// A temporary file
|
2014-03-08 22:02:01 +00:00
|
|
|
if debug {
|
2014-05-15 00:08:56 +00:00
|
|
|
l.Debugln("temporary:", rn)
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-05-25 18:49:08 +00:00
|
|
|
if sn := filepath.Base(rn); sn == w.IgnoreFile || sn == ".stversions" || w.ignoreFile(ign, rn) {
|
2014-04-01 21:18:32 +00:00
|
|
|
// An ignored file
|
2014-03-08 22:02:01 +00:00
|
|
|
if debug {
|
2014-05-15 00:08:56 +00:00
|
|
|
l.Debugln("ignored:", rn)
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
2014-03-09 11:21:07 +00:00
|
|
|
if info.IsDir() {
|
|
|
|
return filepath.SkipDir
|
|
|
|
}
|
2014-03-08 22:02:01 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-06-11 15:51:31 +00:00
|
|
|
if (runtime.GOOS == "linux" || runtime.GOOS == "windows") && !norm.NFC.IsNormalString(rn) {
|
|
|
|
l.Warnf("File %q contains non-NFC UTF-8 sequences and cannot be synced. Consider renaming.", rn)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-04-01 21:18:32 +00:00
|
|
|
if info.Mode().IsDir() {
|
|
|
|
if w.CurrentFiler != nil {
|
|
|
|
cf := w.CurrentFiler.CurrentFile(rn)
|
2014-05-23 12:31:16 +00:00
|
|
|
permUnchanged := w.IgnorePerms || !protocol.HasPermissionBits(cf.Flags) || PermsEqual(cf.Flags, uint32(info.Mode()))
|
2014-07-21 08:48:49 +00:00
|
|
|
if !protocol.IsDeleted(cf.Flags) && protocol.IsDirectory(cf.Flags) && permUnchanged {
|
2014-07-14 21:58:37 +00:00
|
|
|
return nil
|
2014-04-01 21:18:32 +00:00
|
|
|
}
|
|
|
|
}
|
2014-07-14 21:58:37 +00:00
|
|
|
|
|
|
|
var flags uint32 = protocol.FlagDirectory
|
|
|
|
if w.IgnorePerms {
|
|
|
|
flags |= protocol.FlagNoPermBits | 0777
|
|
|
|
} else {
|
|
|
|
flags |= uint32(info.Mode() & os.ModePerm)
|
|
|
|
}
|
|
|
|
f := protocol.FileInfo{
|
|
|
|
Name: rn,
|
|
|
|
Version: lamport.Default.Tick(0),
|
|
|
|
Flags: flags,
|
|
|
|
Modified: info.ModTime().Unix(),
|
|
|
|
}
|
|
|
|
if debug {
|
|
|
|
l.Debugln("dir:", f)
|
|
|
|
}
|
2014-07-15 12:27:46 +00:00
|
|
|
fchan <- f
|
2014-07-14 21:58:37 +00:00
|
|
|
return nil
|
2014-04-01 21:18:32 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if info.Mode().IsRegular() {
|
2014-03-16 07:14:55 +00:00
|
|
|
if w.CurrentFiler != nil {
|
|
|
|
cf := w.CurrentFiler.CurrentFile(rn)
|
2014-05-23 12:31:16 +00:00
|
|
|
permUnchanged := w.IgnorePerms || !protocol.HasPermissionBits(cf.Flags) || PermsEqual(cf.Flags, uint32(info.Mode()))
|
2014-05-23 11:10:26 +00:00
|
|
|
if !protocol.IsDeleted(cf.Flags) && cf.Modified == info.ModTime().Unix() && permUnchanged {
|
2014-03-16 07:14:55 +00:00
|
|
|
return nil
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
|
2014-05-19 21:42:08 +00:00
|
|
|
if debug {
|
|
|
|
l.Debugln("rescan:", cf, info.ModTime().Unix(), info.Mode()&os.ModePerm)
|
|
|
|
}
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
|
2014-05-23 11:10:26 +00:00
|
|
|
var flags = uint32(info.Mode() & os.ModePerm)
|
2014-05-23 12:31:16 +00:00
|
|
|
if w.IgnorePerms {
|
2014-05-24 06:53:54 +00:00
|
|
|
flags = protocol.FlagNoPermBits | 0666
|
2014-05-23 11:10:26 +00:00
|
|
|
}
|
2014-07-30 18:10:46 +00:00
|
|
|
|
|
|
|
fchan <- protocol.FileInfo{
|
2014-03-08 22:18:50 +00:00
|
|
|
Name: rn,
|
2014-03-28 13:36:57 +00:00
|
|
|
Version: lamport.Default.Tick(0),
|
2014-05-23 11:10:26 +00:00
|
|
|
Flags: flags,
|
2014-03-16 07:14:55 +00:00
|
|
|
Modified: info.ModTime().Unix(),
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (w *Walker) cleanTempFile(path string, info os.FileInfo, err error) error {
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if info.Mode()&os.ModeType == 0 && w.TempNamer.IsTemporary(path) {
|
|
|
|
os.Remove(path)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (w *Walker) ignoreFile(patterns map[string][]string, file string) bool {
|
2014-03-28 13:36:57 +00:00
|
|
|
first, last := filepath.Split(file)
|
2014-03-08 22:02:01 +00:00
|
|
|
for prefix, pats := range patterns {
|
2014-06-16 14:18:19 +00:00
|
|
|
if prefix == "." || prefix == first || strings.HasPrefix(first, fmt.Sprintf("%s%c", prefix, os.PathSeparator)) {
|
2014-03-08 22:02:01 +00:00
|
|
|
for _, pattern := range pats {
|
2014-03-28 13:36:57 +00:00
|
|
|
if match, _ := filepath.Match(pattern, last); match {
|
2014-03-08 22:02:01 +00:00
|
|
|
return true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return false
|
|
|
|
}
|
2014-05-04 16:20:25 +00:00
|
|
|
|
|
|
|
func checkDir(dir string) error {
|
2014-05-28 04:55:30 +00:00
|
|
|
if info, err := os.Lstat(dir); err != nil {
|
2014-05-04 16:20:25 +00:00
|
|
|
return err
|
|
|
|
} else if !info.IsDir() {
|
|
|
|
return errors.New(dir + ": not a directory")
|
2014-05-28 04:55:30 +00:00
|
|
|
} else if debug {
|
|
|
|
l.Debugln("checkDir", dir, info)
|
2014-05-04 16:20:25 +00:00
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
2014-05-19 21:42:08 +00:00
|
|
|
|
2014-05-23 10:55:24 +00:00
|
|
|
// PermsEqual reports whether the permission bits in a and b are equal as far
// as the current operating system is concerned. Bits outside the compared
// mask are ignored.
func PermsEqual(a, b uint32) bool {
	// By default all nine permission bits count.
	var mask uint32 = 0777
	if runtime.GOOS == "windows" {
		// There is only writeable and read only, represented for user,
		// group and other equally, so only the user bits are compared.
		mask = 0600
	}
	return a&mask == b&mask
}
|