2014-07-12 22:45:33 +00:00
|
|
|
// Copyright (C) 2014 Jakob Borg and Contributors (see the CONTRIBUTORS file).
|
|
|
|
// All rights reserved. Use of this source code is governed by an MIT-style
|
|
|
|
// license that can be found in the LICENSE file.
|
2014-06-01 20:50:14 +00:00
|
|
|
|
2014-03-08 22:02:01 +00:00
|
|
|
package scanner
|
|
|
|
|
|
|
|
import (
|
2014-08-26 08:11:25 +00:00
|
|
|
"bufio"
|
2014-05-04 16:20:25 +00:00
|
|
|
"errors"
|
2014-08-26 08:11:25 +00:00
|
|
|
"io"
|
2014-03-08 22:02:01 +00:00
|
|
|
"os"
|
2014-08-26 08:11:25 +00:00
|
|
|
"path"
|
2014-03-08 22:02:01 +00:00
|
|
|
"path/filepath"
|
2014-08-26 08:11:25 +00:00
|
|
|
"regexp"
|
2014-05-19 21:42:08 +00:00
|
|
|
"runtime"
|
2014-03-08 22:02:01 +00:00
|
|
|
"strings"
|
2014-08-16 16:33:01 +00:00
|
|
|
|
2014-07-15 12:27:46 +00:00
|
|
|
"code.google.com/p/go.text/unicode/norm"
|
2014-03-21 08:09:01 +00:00
|
|
|
|
2014-08-26 08:11:25 +00:00
|
|
|
"github.com/syncthing/syncthing/fnmatch"
|
2014-08-01 14:35:37 +00:00
|
|
|
"github.com/syncthing/syncthing/lamport"
|
|
|
|
"github.com/syncthing/syncthing/protocol"
|
2014-03-08 22:02:01 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
type Walker struct {
|
|
|
|
// Dir is the base directory for the walk
|
|
|
|
Dir string
|
2014-08-11 18:20:01 +00:00
|
|
|
// Limit walking to this path within Dir, or no limit if Sub is blank
|
|
|
|
Sub string
|
2014-03-08 22:02:01 +00:00
|
|
|
// BlockSize controls the size of the block used when hashing.
|
|
|
|
BlockSize int
|
|
|
|
// If IgnoreFile is not empty, it is the name used for the file that holds ignore patterns.
|
|
|
|
IgnoreFile string
|
|
|
|
// If TempNamer is not nil, it is used to ignore tempory files when walking.
|
|
|
|
TempNamer TempNamer
|
2014-03-16 07:14:55 +00:00
|
|
|
// If CurrentFiler is not nil, it is queried for the current file before rescanning.
|
|
|
|
CurrentFiler CurrentFiler
|
2014-05-23 12:31:16 +00:00
|
|
|
// If IgnorePerms is true, changes to permission bits will not be
|
2014-05-23 11:10:26 +00:00
|
|
|
// detected. Scanned files will get zero permission bits and the
|
|
|
|
// NoPermissionBits flag set.
|
2014-05-23 12:31:16 +00:00
|
|
|
IgnorePerms bool
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// TempNamer converts file names to temporary file names and recognizes names
// that denote temporary files.
type TempNamer interface {
	// TempName returns a temporary name for the file referred to by path.
	TempName(path string) string
	// IsTemporary returns true if path refers to the name of a temporary file.
	IsTemporary(path string) bool
}
|
|
|
|
|
2014-03-16 07:14:55 +00:00
|
|
|
type CurrentFiler interface {
|
|
|
|
// CurrentFile returns the file as seen at last scan.
|
2014-07-12 21:06:48 +00:00
|
|
|
CurrentFile(name string) protocol.FileInfo
|
2014-03-16 07:14:55 +00:00
|
|
|
}
|
|
|
|
|
2014-03-08 22:02:01 +00:00
|
|
|
// Walk returns the list of files found in the local repository by scanning the
|
|
|
|
// file system. Files are blockwise hashed.
|
2014-08-26 08:11:25 +00:00
|
|
|
func (w *Walker) Walk() (chan protocol.FileInfo, error) {
|
2014-03-08 22:02:01 +00:00
|
|
|
if debug {
|
2014-08-11 18:20:01 +00:00
|
|
|
l.Debugln("Walk", w.Dir, w.Sub, w.BlockSize, w.IgnoreFile)
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
2014-05-04 16:20:25 +00:00
|
|
|
|
2014-07-30 18:10:46 +00:00
|
|
|
err := checkDir(w.Dir)
|
2014-05-04 16:20:25 +00:00
|
|
|
if err != nil {
|
2014-08-26 08:11:25 +00:00
|
|
|
return nil, err
|
2014-05-04 16:20:25 +00:00
|
|
|
}
|
|
|
|
|
2014-07-30 18:10:46 +00:00
|
|
|
files := make(chan protocol.FileInfo)
|
|
|
|
hashedFiles := make(chan protocol.FileInfo)
|
|
|
|
newParallelHasher(w.Dir, w.BlockSize, runtime.NumCPU(), hashedFiles, files)
|
2014-03-08 22:02:01 +00:00
|
|
|
|
2014-08-26 08:11:25 +00:00
|
|
|
var ignores []*regexp.Regexp
|
2014-07-15 12:27:46 +00:00
|
|
|
go func() {
|
2014-08-26 08:11:25 +00:00
|
|
|
filepath.Walk(w.Dir, w.loadIgnoreFiles(w.Dir, &ignores))
|
|
|
|
|
|
|
|
hashFiles := w.walkAndHashFiles(files, ignores)
|
2014-08-11 18:20:01 +00:00
|
|
|
filepath.Walk(filepath.Join(w.Dir, w.Sub), hashFiles)
|
2014-07-15 12:27:46 +00:00
|
|
|
close(files)
|
|
|
|
}()
|
2014-03-08 22:02:01 +00:00
|
|
|
|
2014-08-26 08:11:25 +00:00
|
|
|
return hashedFiles, nil
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// CleanTempFiles removes all files that match the temporary filename pattern.
|
|
|
|
func (w *Walker) CleanTempFiles() {
|
|
|
|
filepath.Walk(w.Dir, w.cleanTempFile)
|
|
|
|
}
|
|
|
|
|
2014-08-26 08:11:25 +00:00
|
|
|
func (w *Walker) loadIgnoreFiles(dir string, ignores *[]*regexp.Regexp) filepath.WalkFunc {
|
2014-03-08 22:02:01 +00:00
|
|
|
return func(p string, info os.FileInfo, err error) error {
|
|
|
|
if err != nil {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-03-08 22:18:50 +00:00
|
|
|
rn, err := filepath.Rel(dir, p)
|
2014-03-08 22:02:01 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-03-28 13:36:57 +00:00
|
|
|
if pn, sn := filepath.Split(rn); sn == w.IgnoreFile {
|
2014-06-16 14:18:19 +00:00
|
|
|
pn := filepath.Clean(pn)
|
2014-08-30 21:32:17 +00:00
|
|
|
filesSeen := make(map[string]map[string]bool)
|
|
|
|
dirIgnores := loadIgnoreFile(p, pn, filesSeen)
|
2014-08-26 08:11:25 +00:00
|
|
|
*ignores = append(*ignores, dirIgnores...)
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-08-30 21:32:17 +00:00
|
|
|
func loadIgnoreFile(ignFile, base string, filesSeen map[string]map[string]bool) []*regexp.Regexp {
|
2014-08-26 08:11:25 +00:00
|
|
|
fd, err := os.Open(ignFile)
|
|
|
|
if err != nil {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
defer fd.Close()
|
2014-08-30 21:32:17 +00:00
|
|
|
return parseIgnoreFile(fd, base, ignFile, filesSeen)
|
2014-08-26 08:11:25 +00:00
|
|
|
}
|
|
|
|
|
2014-08-30 21:32:17 +00:00
|
|
|
func parseIgnoreFile(fd io.Reader, base, currentFile string, filesSeen map[string]map[string]bool) []*regexp.Regexp {
|
2014-08-26 08:11:25 +00:00
|
|
|
var exps []*regexp.Regexp
|
|
|
|
scanner := bufio.NewScanner(fd)
|
|
|
|
for scanner.Scan() {
|
|
|
|
line := strings.TrimSpace(scanner.Text())
|
|
|
|
if line == "" {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
if strings.HasPrefix(line, "/") {
|
|
|
|
// Pattern is rooted in the current dir only
|
|
|
|
exp, err := fnmatch.Convert(path.Join(base, line[1:]), fnmatch.FNM_PATHNAME)
|
|
|
|
if err != nil {
|
|
|
|
l.Warnf("Invalid pattern %q in ignore file", line)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
exps = append(exps, exp)
|
|
|
|
} else if strings.HasPrefix(line, "**/") {
|
|
|
|
// Add the pattern as is, and without **/ so it matches in current dir
|
|
|
|
exp, err := fnmatch.Convert(line, fnmatch.FNM_PATHNAME)
|
|
|
|
if err != nil {
|
|
|
|
l.Warnf("Invalid pattern %q in ignore file", line)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
exps = append(exps, exp)
|
|
|
|
|
|
|
|
exp, err = fnmatch.Convert(path.Join(base, line[3:]), fnmatch.FNM_PATHNAME)
|
|
|
|
if err != nil {
|
|
|
|
l.Warnf("Invalid pattern %q in ignore file", line)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
exps = append(exps, exp)
|
2014-08-28 22:45:26 +00:00
|
|
|
} else if strings.HasPrefix(line, "#include ") {
|
2014-08-30 21:32:17 +00:00
|
|
|
includeFile := filepath.Join(filepath.Dir(currentFile), strings.Replace(line, "#include ", "", 1))
|
2014-08-28 22:45:26 +00:00
|
|
|
if _, err := os.Stat(includeFile); os.IsNotExist(err) {
|
|
|
|
l.Infoln("Could not open ignore include file", includeFile)
|
|
|
|
} else {
|
2014-08-30 21:32:17 +00:00
|
|
|
seen := false
|
|
|
|
if seenByCurrent, ok := filesSeen[currentFile]; ok {
|
|
|
|
_, seen = seenByCurrent[includeFile]
|
|
|
|
}
|
|
|
|
|
|
|
|
if seen {
|
|
|
|
l.Warnf("Recursion detected while including %s from %s", includeFile, currentFile)
|
|
|
|
} else {
|
|
|
|
if filesSeen[currentFile] == nil {
|
|
|
|
filesSeen[currentFile] = make(map[string]bool)
|
|
|
|
}
|
|
|
|
filesSeen[currentFile][includeFile] = true
|
|
|
|
includes := loadIgnoreFile(includeFile, base, filesSeen)
|
|
|
|
exps = append(exps, includes...)
|
|
|
|
}
|
2014-08-28 22:45:26 +00:00
|
|
|
}
|
2014-08-26 08:11:25 +00:00
|
|
|
} else {
|
|
|
|
// Path name or pattern, add it so it matches files both in
|
|
|
|
// current directory and subdirs.
|
|
|
|
exp, err := fnmatch.Convert(path.Join(base, line), fnmatch.FNM_PATHNAME)
|
|
|
|
if err != nil {
|
|
|
|
l.Warnf("Invalid pattern %q in ignore file", line)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
exps = append(exps, exp)
|
|
|
|
|
|
|
|
exp, err = fnmatch.Convert(path.Join(base, "**", line), fnmatch.FNM_PATHNAME)
|
|
|
|
if err != nil {
|
|
|
|
l.Warnf("Invalid pattern %q in ignore file", line)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
exps = append(exps, exp)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return exps
|
|
|
|
}
|
|
|
|
|
|
|
|
func (w *Walker) walkAndHashFiles(fchan chan protocol.FileInfo, ignores []*regexp.Regexp) filepath.WalkFunc {
|
2014-03-08 22:02:01 +00:00
|
|
|
return func(p string, info os.FileInfo, err error) error {
|
|
|
|
if err != nil {
|
|
|
|
if debug {
|
2014-05-15 00:08:56 +00:00
|
|
|
l.Debugln("error:", p, info, err)
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-03-08 22:18:50 +00:00
|
|
|
rn, err := filepath.Rel(w.Dir, p)
|
2014-03-08 22:02:01 +00:00
|
|
|
if err != nil {
|
2014-03-08 22:18:50 +00:00
|
|
|
if debug {
|
2014-05-15 00:08:56 +00:00
|
|
|
l.Debugln("rel error:", p, err)
|
2014-03-08 22:18:50 +00:00
|
|
|
}
|
2014-03-08 22:02:01 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-04-01 21:18:32 +00:00
|
|
|
if rn == "." {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-03-08 22:18:50 +00:00
|
|
|
if w.TempNamer != nil && w.TempNamer.IsTemporary(rn) {
|
2014-04-01 21:18:32 +00:00
|
|
|
// A temporary file
|
2014-03-08 22:02:01 +00:00
|
|
|
if debug {
|
2014-05-15 00:08:56 +00:00
|
|
|
l.Debugln("temporary:", rn)
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-08-26 08:11:25 +00:00
|
|
|
if sn := filepath.Base(rn); sn == w.IgnoreFile || sn == ".stversions" || w.ignoreFile(ignores, rn) {
|
2014-04-01 21:18:32 +00:00
|
|
|
// An ignored file
|
2014-03-08 22:02:01 +00:00
|
|
|
if debug {
|
2014-05-15 00:08:56 +00:00
|
|
|
l.Debugln("ignored:", rn)
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
2014-03-09 11:21:07 +00:00
|
|
|
if info.IsDir() {
|
|
|
|
return filepath.SkipDir
|
|
|
|
}
|
2014-03-08 22:02:01 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-06-11 15:51:31 +00:00
|
|
|
if (runtime.GOOS == "linux" || runtime.GOOS == "windows") && !norm.NFC.IsNormalString(rn) {
|
|
|
|
l.Warnf("File %q contains non-NFC UTF-8 sequences and cannot be synced. Consider renaming.", rn)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-04-01 21:18:32 +00:00
|
|
|
if info.Mode().IsDir() {
|
|
|
|
if w.CurrentFiler != nil {
|
|
|
|
cf := w.CurrentFiler.CurrentFile(rn)
|
2014-05-23 12:31:16 +00:00
|
|
|
permUnchanged := w.IgnorePerms || !protocol.HasPermissionBits(cf.Flags) || PermsEqual(cf.Flags, uint32(info.Mode()))
|
2014-07-21 08:48:49 +00:00
|
|
|
if !protocol.IsDeleted(cf.Flags) && protocol.IsDirectory(cf.Flags) && permUnchanged {
|
2014-07-14 21:58:37 +00:00
|
|
|
return nil
|
2014-04-01 21:18:32 +00:00
|
|
|
}
|
|
|
|
}
|
2014-07-14 21:58:37 +00:00
|
|
|
|
|
|
|
var flags uint32 = protocol.FlagDirectory
|
|
|
|
if w.IgnorePerms {
|
|
|
|
flags |= protocol.FlagNoPermBits | 0777
|
|
|
|
} else {
|
|
|
|
flags |= uint32(info.Mode() & os.ModePerm)
|
|
|
|
}
|
|
|
|
f := protocol.FileInfo{
|
|
|
|
Name: rn,
|
|
|
|
Version: lamport.Default.Tick(0),
|
|
|
|
Flags: flags,
|
|
|
|
Modified: info.ModTime().Unix(),
|
|
|
|
}
|
|
|
|
if debug {
|
|
|
|
l.Debugln("dir:", f)
|
|
|
|
}
|
2014-07-15 12:27:46 +00:00
|
|
|
fchan <- f
|
2014-07-14 21:58:37 +00:00
|
|
|
return nil
|
2014-04-01 21:18:32 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if info.Mode().IsRegular() {
|
2014-03-16 07:14:55 +00:00
|
|
|
if w.CurrentFiler != nil {
|
|
|
|
cf := w.CurrentFiler.CurrentFile(rn)
|
2014-05-23 12:31:16 +00:00
|
|
|
permUnchanged := w.IgnorePerms || !protocol.HasPermissionBits(cf.Flags) || PermsEqual(cf.Flags, uint32(info.Mode()))
|
2014-05-23 11:10:26 +00:00
|
|
|
if !protocol.IsDeleted(cf.Flags) && cf.Modified == info.ModTime().Unix() && permUnchanged {
|
2014-03-16 07:14:55 +00:00
|
|
|
return nil
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
|
2014-05-19 21:42:08 +00:00
|
|
|
if debug {
|
|
|
|
l.Debugln("rescan:", cf, info.ModTime().Unix(), info.Mode()&os.ModePerm)
|
|
|
|
}
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
|
2014-05-23 11:10:26 +00:00
|
|
|
var flags = uint32(info.Mode() & os.ModePerm)
|
2014-05-23 12:31:16 +00:00
|
|
|
if w.IgnorePerms {
|
2014-05-24 06:53:54 +00:00
|
|
|
flags = protocol.FlagNoPermBits | 0666
|
2014-05-23 11:10:26 +00:00
|
|
|
}
|
2014-07-30 18:10:46 +00:00
|
|
|
|
|
|
|
fchan <- protocol.FileInfo{
|
2014-03-08 22:18:50 +00:00
|
|
|
Name: rn,
|
2014-03-28 13:36:57 +00:00
|
|
|
Version: lamport.Default.Tick(0),
|
2014-05-23 11:10:26 +00:00
|
|
|
Flags: flags,
|
2014-03-16 07:14:55 +00:00
|
|
|
Modified: info.ModTime().Unix(),
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (w *Walker) cleanTempFile(path string, info os.FileInfo, err error) error {
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if info.Mode()&os.ModeType == 0 && w.TempNamer.IsTemporary(path) {
|
|
|
|
os.Remove(path)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-08-26 08:11:25 +00:00
|
|
|
func (w *Walker) ignoreFile(patterns []*regexp.Regexp, file string) bool {
|
|
|
|
for _, pattern := range patterns {
|
|
|
|
if pattern.MatchString(file) {
|
|
|
|
if debug {
|
|
|
|
l.Debugf("%q matches %v", file, pattern)
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
2014-08-26 08:11:25 +00:00
|
|
|
return true
|
2014-03-08 22:02:01 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return false
|
|
|
|
}
|
2014-05-04 16:20:25 +00:00
|
|
|
|
|
|
|
func checkDir(dir string) error {
|
2014-05-28 04:55:30 +00:00
|
|
|
if info, err := os.Lstat(dir); err != nil {
|
2014-05-04 16:20:25 +00:00
|
|
|
return err
|
|
|
|
} else if !info.IsDir() {
|
|
|
|
return errors.New(dir + ": not a directory")
|
2014-05-28 04:55:30 +00:00
|
|
|
} else if debug {
|
|
|
|
l.Debugln("checkDir", dir, info)
|
2014-05-04 16:20:25 +00:00
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
2014-05-19 21:42:08 +00:00
|
|
|
|
2014-05-23 10:55:24 +00:00
|
|
|
// PermsEqual reports whether a and b describe the same permissions on the
// current operating system. Bits outside the compared permission mask are
// ignored.
func PermsEqual(a, b uint32) bool {
	// All permission bits count by default.
	var mask uint32 = 0777
	if runtime.GOOS == "windows" {
		// There is only writeable and read only, represented for user, group
		// and other equally. We only compare against user.
		mask = 0600
	}
	return (a^b)&mask == 0
}
|