2014-03-08 23:02:01 +01:00
|
|
|
package scanner
|
|
|
|
|
|
|
|
import (
|
|
|
|
"bytes"
|
|
|
|
"io/ioutil"
|
|
|
|
"log"
|
|
|
|
"os"
|
|
|
|
"path/filepath"
|
|
|
|
"strings"
|
|
|
|
"time"
|
2014-03-21 09:09:01 +01:00
|
|
|
|
2014-03-28 14:36:57 +01:00
|
|
|
"github.com/calmh/syncthing/lamport"
|
2014-04-01 23:18:32 +02:00
|
|
|
"github.com/calmh/syncthing/protocol"
|
2014-03-08 23:02:01 +01:00
|
|
|
)
|
|
|
|
|
|
|
|
type Walker struct {
|
|
|
|
// Dir is the base directory for the walk
|
|
|
|
Dir string
|
|
|
|
// BlockSize controls the size of the block used when hashing.
|
|
|
|
BlockSize int
|
|
|
|
// If IgnoreFile is not empty, it is the name used for the file that holds ignore patterns.
|
|
|
|
IgnoreFile string
|
|
|
|
// If TempNamer is not nil, it is used to ignore tempory files when walking.
|
|
|
|
TempNamer TempNamer
|
2014-03-16 08:14:55 +01:00
|
|
|
// If CurrentFiler is not nil, it is queried for the current file before rescanning.
|
|
|
|
CurrentFiler CurrentFiler
|
2014-03-08 23:02:01 +01:00
|
|
|
// If Suppressor is not nil, it is queried for supression of modified files.
|
2014-03-16 08:14:55 +01:00
|
|
|
// Suppressed files will be returned with empty metadata and the Suppressed flag set.
|
|
|
|
// Requires CurrentFiler to be set.
|
2014-03-08 23:02:01 +01:00
|
|
|
Suppressor Suppressor
|
|
|
|
|
|
|
|
suppressed map[string]bool // file name -> suppression status
|
|
|
|
}
|
|
|
|
|
|
|
|
// TempNamer produces temporary file names and recognizes them again.
type TempNamer interface {
	// TempName returns a temporary name for the file referred to by path.
	TempName(path string) string
	// IsTemporary reports whether path is the name of a temporary file.
	IsTemporary(path string) bool
}
|
|
|
|
|
|
|
|
// Suppressor decides whether an update to a file should be ignored.
type Suppressor interface {
	// Suppress reports whether the update to the named file, described by fi,
	// should be ignored.
	Suppress(name string, fi os.FileInfo) bool
}
|
|
|
|
|
2014-03-16 08:14:55 +01:00
|
|
|
type CurrentFiler interface {
|
|
|
|
// CurrentFile returns the file as seen at last scan.
|
|
|
|
CurrentFile(name string) File
|
|
|
|
}
|
|
|
|
|
2014-03-08 23:02:01 +01:00
|
|
|
// Walk returns the list of files found in the local repository by scanning the
|
|
|
|
// file system. Files are blockwise hashed.
|
|
|
|
func (w *Walker) Walk() (files []File, ignore map[string][]string) {
|
|
|
|
w.lazyInit()
|
|
|
|
|
|
|
|
if debug {
|
2014-04-06 21:44:17 +02:00
|
|
|
dlog.Println("Walk", w.Dir, w.BlockSize, w.IgnoreFile)
|
2014-03-08 23:02:01 +01:00
|
|
|
}
|
|
|
|
t0 := time.Now()
|
|
|
|
|
|
|
|
ignore = make(map[string][]string)
|
|
|
|
hashFiles := w.walkAndHashFiles(&files, ignore)
|
|
|
|
|
|
|
|
filepath.Walk(w.Dir, w.loadIgnoreFiles(w.Dir, ignore))
|
|
|
|
filepath.Walk(w.Dir, hashFiles)
|
|
|
|
|
|
|
|
if debug {
|
|
|
|
t1 := time.Now()
|
|
|
|
d := t1.Sub(t0).Seconds()
|
|
|
|
dlog.Printf("Walk in %.02f ms, %.0f files/s", d*1000, float64(len(files))/d)
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// CleanTempFiles removes all files that match the temporary filename pattern.
|
|
|
|
func (w *Walker) CleanTempFiles() {
|
|
|
|
filepath.Walk(w.Dir, w.cleanTempFile)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (w *Walker) lazyInit() {
|
2014-03-16 08:14:55 +01:00
|
|
|
if w.suppressed == nil {
|
2014-03-08 23:02:01 +01:00
|
|
|
w.suppressed = make(map[string]bool)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (w *Walker) loadIgnoreFiles(dir string, ign map[string][]string) filepath.WalkFunc {
|
|
|
|
return func(p string, info os.FileInfo, err error) error {
|
|
|
|
if err != nil {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-03-08 23:18:50 +01:00
|
|
|
rn, err := filepath.Rel(dir, p)
|
2014-03-08 23:02:01 +01:00
|
|
|
if err != nil {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-03-28 14:36:57 +01:00
|
|
|
if pn, sn := filepath.Split(rn); sn == w.IgnoreFile {
|
2014-03-08 23:02:01 +01:00
|
|
|
pn := strings.Trim(pn, "/")
|
|
|
|
bs, _ := ioutil.ReadFile(p)
|
|
|
|
lines := bytes.Split(bs, []byte("\n"))
|
|
|
|
var patterns []string
|
|
|
|
for _, line := range lines {
|
|
|
|
if len(line) > 0 {
|
|
|
|
patterns = append(patterns, string(line))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
ign[pn] = patterns
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (w *Walker) walkAndHashFiles(res *[]File, ign map[string][]string) filepath.WalkFunc {
|
|
|
|
return func(p string, info os.FileInfo, err error) error {
|
|
|
|
if err != nil {
|
|
|
|
if debug {
|
|
|
|
dlog.Println("error:", p, info, err)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-03-08 23:18:50 +01:00
|
|
|
rn, err := filepath.Rel(w.Dir, p)
|
2014-03-08 23:02:01 +01:00
|
|
|
if err != nil {
|
2014-03-08 23:18:50 +01:00
|
|
|
if debug {
|
|
|
|
dlog.Println("rel error:", p, err)
|
|
|
|
}
|
2014-03-08 23:02:01 +01:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-04-01 23:18:32 +02:00
|
|
|
if rn == "." {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-03-08 23:18:50 +01:00
|
|
|
if w.TempNamer != nil && w.TempNamer.IsTemporary(rn) {
|
2014-04-01 23:18:32 +02:00
|
|
|
// A temporary file
|
2014-03-08 23:02:01 +01:00
|
|
|
if debug {
|
2014-03-08 23:18:50 +01:00
|
|
|
dlog.Println("temporary:", rn)
|
2014-03-08 23:02:01 +01:00
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-03-28 14:36:57 +01:00
|
|
|
if _, sn := filepath.Split(rn); sn == w.IgnoreFile {
|
2014-04-01 23:18:32 +02:00
|
|
|
// An ignore-file; these are ignored themselves
|
2014-03-08 23:02:01 +01:00
|
|
|
if debug {
|
2014-03-08 23:18:50 +01:00
|
|
|
dlog.Println("ignorefile:", rn)
|
2014-03-08 23:02:01 +01:00
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-04-01 23:18:32 +02:00
|
|
|
if w.ignoreFile(ign, rn) {
|
|
|
|
// An ignored file
|
2014-03-08 23:02:01 +01:00
|
|
|
if debug {
|
2014-03-08 23:18:50 +01:00
|
|
|
dlog.Println("ignored:", rn)
|
2014-03-08 23:02:01 +01:00
|
|
|
}
|
2014-03-09 12:21:07 +01:00
|
|
|
if info.IsDir() {
|
|
|
|
return filepath.SkipDir
|
|
|
|
}
|
2014-03-08 23:02:01 +01:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-04-01 23:18:32 +02:00
|
|
|
if info.Mode().IsDir() {
|
|
|
|
if w.CurrentFiler != nil {
|
|
|
|
cf := w.CurrentFiler.CurrentFile(rn)
|
|
|
|
if cf.Modified == info.ModTime().Unix() && cf.Flags == uint32(info.Mode()&os.ModePerm|protocol.FlagDirectory) {
|
|
|
|
if debug {
|
|
|
|
dlog.Println("unchanged:", cf)
|
|
|
|
}
|
|
|
|
*res = append(*res, cf)
|
|
|
|
} else {
|
|
|
|
f := File{
|
|
|
|
Name: rn,
|
|
|
|
Version: lamport.Default.Tick(0),
|
|
|
|
Flags: uint32(info.Mode()&os.ModePerm) | protocol.FlagDirectory,
|
|
|
|
Modified: info.ModTime().Unix(),
|
|
|
|
}
|
|
|
|
if debug {
|
|
|
|
dlog.Println("dir:", cf, f)
|
|
|
|
}
|
|
|
|
*res = append(*res, f)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if info.Mode().IsRegular() {
|
2014-03-16 08:14:55 +01:00
|
|
|
if w.CurrentFiler != nil {
|
|
|
|
cf := w.CurrentFiler.CurrentFile(rn)
|
2014-04-01 23:18:32 +02:00
|
|
|
if cf.Flags&protocol.FlagDeleted == 0 && cf.Modified == info.ModTime().Unix() {
|
2014-03-08 23:02:01 +01:00
|
|
|
if debug {
|
2014-03-28 14:36:57 +01:00
|
|
|
dlog.Println("unchanged:", cf)
|
2014-03-08 23:02:01 +01:00
|
|
|
}
|
2014-03-16 08:14:55 +01:00
|
|
|
*res = append(*res, cf)
|
|
|
|
return nil
|
2014-03-08 23:02:01 +01:00
|
|
|
}
|
|
|
|
|
2014-03-16 08:14:55 +01:00
|
|
|
if w.Suppressor != nil && w.Suppressor.Suppress(rn, info) {
|
|
|
|
if !w.suppressed[rn] {
|
|
|
|
w.suppressed[rn] = true
|
|
|
|
log.Printf("INFO: Changes to %q are being temporarily suppressed because it changes too frequently.", p)
|
2014-03-28 14:36:57 +01:00
|
|
|
cf.Suppressed = true
|
|
|
|
cf.Version++
|
|
|
|
}
|
|
|
|
if debug {
|
|
|
|
dlog.Println("suppressed:", cf)
|
2014-03-16 08:14:55 +01:00
|
|
|
}
|
|
|
|
*res = append(*res, cf)
|
2014-03-28 14:36:57 +01:00
|
|
|
return nil
|
2014-03-16 08:14:55 +01:00
|
|
|
} else if w.suppressed[rn] {
|
|
|
|
log.Printf("INFO: Changes to %q are no longer suppressed.", p)
|
|
|
|
delete(w.suppressed, rn)
|
2014-03-08 23:02:01 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fd, err := os.Open(p)
|
|
|
|
if err != nil {
|
2014-03-08 23:18:50 +01:00
|
|
|
if debug {
|
|
|
|
dlog.Println("open:", p, err)
|
|
|
|
}
|
2014-03-08 23:02:01 +01:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
defer fd.Close()
|
|
|
|
|
|
|
|
t0 := time.Now()
|
|
|
|
blocks, err := Blocks(fd, w.BlockSize)
|
|
|
|
if err != nil {
|
|
|
|
if debug {
|
2014-03-08 23:18:50 +01:00
|
|
|
dlog.Println("hash error:", rn, err)
|
2014-03-08 23:02:01 +01:00
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
if debug {
|
|
|
|
t1 := time.Now()
|
2014-03-08 23:18:50 +01:00
|
|
|
dlog.Println("hashed:", rn, ";", len(blocks), "blocks;", info.Size(), "bytes;", int(float64(info.Size())/1024/t1.Sub(t0).Seconds()), "KB/s")
|
2014-03-08 23:02:01 +01:00
|
|
|
}
|
|
|
|
f := File{
|
2014-03-08 23:18:50 +01:00
|
|
|
Name: rn,
|
2014-03-28 14:36:57 +01:00
|
|
|
Version: lamport.Default.Tick(0),
|
2014-03-08 23:02:01 +01:00
|
|
|
Size: info.Size(),
|
|
|
|
Flags: uint32(info.Mode()),
|
2014-03-16 08:14:55 +01:00
|
|
|
Modified: info.ModTime().Unix(),
|
2014-03-08 23:02:01 +01:00
|
|
|
Blocks: blocks,
|
|
|
|
}
|
|
|
|
*res = append(*res, f)
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (w *Walker) cleanTempFile(path string, info os.FileInfo, err error) error {
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if info.Mode()&os.ModeType == 0 && w.TempNamer.IsTemporary(path) {
|
|
|
|
os.Remove(path)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (w *Walker) ignoreFile(patterns map[string][]string, file string) bool {
|
2014-03-28 14:36:57 +01:00
|
|
|
first, last := filepath.Split(file)
|
2014-03-08 23:02:01 +01:00
|
|
|
for prefix, pats := range patterns {
|
|
|
|
if len(prefix) == 0 || prefix == first || strings.HasPrefix(first, prefix+"/") {
|
|
|
|
for _, pattern := range pats {
|
2014-03-28 14:36:57 +01:00
|
|
|
if match, _ := filepath.Match(pattern, last); match {
|
2014-03-08 23:02:01 +01:00
|
|
|
return true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return false
|
|
|
|
}
|