Configurable file pull order (alphabetic, random, by size or age)

This commit is contained in:
Jakob Borg 2015-04-25 14:13:53 +09:00
parent bb31b1785b
commit be7b3a9952
10 changed files with 364 additions and 33 deletions

View File

@ -10,6 +10,7 @@
"Addresses": "Addresses", "Addresses": "Addresses",
"All Data": "All Data", "All Data": "All Data",
"Allow Anonymous Usage Reporting?": "Allow Anonymous Usage Reporting?", "Allow Anonymous Usage Reporting?": "Allow Anonymous Usage Reporting?",
"Alphabetic": "Alphabetic",
"An external command handles the versioning. It has to remove the file from the synced folder.": "An external command handles the versioning. It has to remove the file from the synced folder.", "An external command handles the versioning. It has to remove the file from the synced folder.": "An external command handles the versioning. It has to remove the file from the synced folder.",
"Anonymous Usage Reporting": "Anonymous Usage Reporting", "Anonymous Usage Reporting": "Anonymous Usage Reporting",
"Any devices configured on an introducer device will be added to this device as well.": "Any devices configured on an introducer device will be added to this device as well.", "Any devices configured on an introducer device will be added to this device as well.": "Any devices configured on an introducer device will be added to this device as well.",
@ -45,6 +46,7 @@
"Enter ignore patterns, one per line.": "Enter ignore patterns, one per line.", "Enter ignore patterns, one per line.": "Enter ignore patterns, one per line.",
"Error": "Error", "Error": "Error",
"External File Versioning": "External File Versioning", "External File Versioning": "External File Versioning",
"File Pull Order": "File Pull Order",
"File Versioning": "File Versioning", "File Versioning": "File Versioning",
"File permission bits are ignored when looking for changes. Use on FAT file systems.": "File permission bits are ignored when looking for changes. Use on FAT file systems.", "File permission bits are ignored when looking for changes. Use on FAT file systems.": "File permission bits are ignored when looking for changes. Use on FAT file systems.",
"Files are moved to date stamped versions in a .stversions folder when replaced or deleted by Syncthing.": "Files are moved to date stamped versions in a .stversions folder when replaced or deleted by Syncthing.", "Files are moved to date stamped versions in a .stversions folder when replaced or deleted by Syncthing.": "Files are moved to date stamped versions in a .stversions folder when replaced or deleted by Syncthing.",
@ -67,6 +69,7 @@
"Introducer": "Introducer", "Introducer": "Introducer",
"Inversion of the given condition (i.e. do not exclude)": "Inversion of the given condition (i.e. do not exclude)", "Inversion of the given condition (i.e. do not exclude)": "Inversion of the given condition (i.e. do not exclude)",
"Keep Versions": "Keep Versions", "Keep Versions": "Keep Versions",
"Largest First": "Largest First",
"Last File Received": "Last File Received", "Last File Received": "Last File Received",
"Last seen": "Last seen", "Last seen": "Last seen",
"Later": "Later", "Later": "Later",
@ -80,11 +83,13 @@
"Never": "Never", "Never": "Never",
"New Device": "New Device", "New Device": "New Device",
"New Folder": "New Folder", "New Folder": "New Folder",
"Newest First": "Newest First",
"No": "No", "No": "No",
"No File Versioning": "No File Versioning", "No File Versioning": "No File Versioning",
"Notice": "Notice", "Notice": "Notice",
"OK": "OK", "OK": "OK",
"Off": "Off", "Off": "Off",
"Oldest First": "Oldest First",
"Out Of Sync": "Out Of Sync", "Out Of Sync": "Out Of Sync",
"Out of Sync Items": "Out of Sync Items", "Out of Sync Items": "Out of Sync Items",
"Outgoing Rate Limit (KiB/s)": "Outgoing Rate Limit (KiB/s)", "Outgoing Rate Limit (KiB/s)": "Outgoing Rate Limit (KiB/s)",
@ -97,6 +102,7 @@
"Preview Usage Report": "Preview Usage Report", "Preview Usage Report": "Preview Usage Report",
"Quick guide to supported patterns": "Quick guide to supported patterns", "Quick guide to supported patterns": "Quick guide to supported patterns",
"RAM Utilization": "RAM Utilization", "RAM Utilization": "RAM Utilization",
"Random": "Random",
"Release Notes": "Release Notes", "Release Notes": "Release Notes",
"Rescan": "Rescan", "Rescan": "Rescan",
"Rescan All": "Rescan All", "Rescan All": "Rescan All",
@ -124,6 +130,7 @@
"Shutdown Complete": "Shutdown Complete", "Shutdown Complete": "Shutdown Complete",
"Simple File Versioning": "Simple File Versioning", "Simple File Versioning": "Simple File Versioning",
"Single level wildcard (matches within a directory only)": "Single level wildcard (matches within a directory only)", "Single level wildcard (matches within a directory only)": "Single level wildcard (matches within a directory only)",
"Smallest First": "Smallest First",
"Source Code": "Source Code", "Source Code": "Source Code",
"Staggered File Versioning": "Staggered File Versioning", "Staggered File Versioning": "Staggered File Versioning",
"Start Browser": "Start Browser", "Start Browser": "Start Browser",

View File

@ -239,6 +239,17 @@
<th><span class="glyphicon glyphicon-refresh"></span>&emsp;<span translate>Rescan Interval</span></th> <th><span class="glyphicon glyphicon-refresh"></span>&emsp;<span translate>Rescan Interval</span></th>
<td class="text-right">{{folder.rescanIntervalS}} s</td> <td class="text-right">{{folder.rescanIntervalS}} s</td>
</tr> </tr>
<tr ng-if="folder.order != 'random'">
<th><span class="glyphicon glyphicon-sort"></span>&emsp;<span translate>File Pull Order</span></th>
<td class="text-right" ng-switch="folder.order">
<span ng-switch-when="random" translate>Random</span>
<span ng-switch-when="alphabetic" translate>Alphabetic</span>
<span ng-switch-when="smallestFirst" translate>Smallest First</span>
<span ng-switch-when="largestFirst" translate>Largest First</span>
<span ng-switch-when="oldestFirst" translate>Oldest First</span>
<span ng-switch-when="newestFirst" translate>Newest First</span>
</td>
</tr>
<tr ng-if="folder.versioning.type"> <tr ng-if="folder.versioning.type">
<th><span class="glyphicon glyphicon-tags"></span>&emsp;<span translate>File Versioning</span></th> <th><span class="glyphicon glyphicon-tags"></span>&emsp;<span translate>File Versioning</span></th>
<td class="text-right" ng-switch="folder.versioning.type"> <td class="text-right" ng-switch="folder.versioning.type">
@ -625,6 +636,7 @@
</div> </div>
</div> </div>
<div class="row"> <div class="row">
<!-- Left column -->
<div class="col-md-6"> <div class="col-md-6">
<div class="form-group"> <div class="form-group">
<div class="checkbox"> <div class="checkbox">
@ -643,7 +655,20 @@
<p translate class="help-block">File permission bits are ignored when looking for changes. Use on FAT file systems.</p> <p translate class="help-block">File permission bits are ignored when looking for changes. Use on FAT file systems.</p>
</div> </div>
</div> </div>
<!-- Right column-->
<div class="col-md-6"> <div class="col-md-6">
<div class="form-group">
<label translate>File Pull Order</label>
<select class="form-control" ng-model="currentFolder.order">
<option value="random" translate>Random</option>
<option value="alphabetic" translate>Alphabetic</option>
<option value="smallestFirst" translate>Smallest First</option>
<option value="largestFirst" translate>Largest First</option>
<option value="oldestFirst" translate>Oldest First</option>
<option value="newestFirst" translate>Newest First</option>
</select>
</div>
<div class="form-group"> <div class="form-group">
<label translate>File Versioning</label> <label translate>File Versioning</label>
<div class="radio"> <div class="radio">

File diff suppressed because one or more lines are too long

View File

@ -82,6 +82,7 @@ type FolderConfiguration struct {
Copiers int `xml:"copiers" json:"copiers"` // This defines how many files are handled concurrently. Copiers int `xml:"copiers" json:"copiers"` // This defines how many files are handled concurrently.
Pullers int `xml:"pullers" json:"pullers"` // Defines how many blocks are fetched at the same time, possibly between separate copier routines. Pullers int `xml:"pullers" json:"pullers"` // Defines how many blocks are fetched at the same time, possibly between separate copier routines.
Hashers int `xml:"hashers" json:"hashers"` // Less than one sets the value to the number of cores. These are CPU bound due to hashing. Hashers int `xml:"hashers" json:"hashers"` // Less than one sets the value to the number of cores. These are CPU bound due to hashing.
Order PullOrder `xml:"order" json:"order"`
Invalid string `xml:"-" json:"invalid"` // Set at runtime when there is an error, not saved Invalid string `xml:"-" json:"invalid"` // Set at runtime when there is an error, not saved
@ -678,3 +679,57 @@ func randomString(l int) string {
} }
return string(bs) return string(bs)
} }
type PullOrder int
const (
OrderRandom PullOrder = iota // default is random
OrderAlphabetic
OrderSmallestFirst
OrderLargestFirst
OrderOldestFirst
OrderNewestFirst
)
func (o PullOrder) String() string {
switch o {
case OrderRandom:
return "random"
case OrderAlphabetic:
return "alphabetic"
case OrderSmallestFirst:
return "smallestFirst"
case OrderLargestFirst:
return "largestFirst"
case OrderOldestFirst:
return "oldestFirst"
case OrderNewestFirst:
return "newestFirst"
default:
return "unknown"
}
}
func (o PullOrder) MarshalText() ([]byte, error) {
return []byte(o.String()), nil
}
func (o *PullOrder) UnmarshalText(bs []byte) error {
switch string(bs) {
case "random":
*o = OrderRandom
case "alphabetic":
*o = OrderAlphabetic
case "smallestFirst":
*o = OrderSmallestFirst
case "largestFirst":
*o = OrderLargestFirst
case "oldestFirst":
*o = OrderOldestFirst
case "newestFirst":
*o = OrderNewestFirst
default:
*o = OrderRandom
}
return nil
}

View File

@ -528,3 +528,51 @@ func TestCopy(t *testing.T) {
t.Error("Copy should be unchanged") t.Error("Copy should be unchanged")
} }
} }
func TestPullOrder(t *testing.T) {
wrapper, err := Load("testdata/pullorder.xml", device1)
if err != nil {
t.Fatal(err)
}
folders := wrapper.Folders()
expected := []struct {
name string
order PullOrder
}{
{"f1", OrderRandom}, // empty value, default
{"f2", OrderRandom}, // explicit
{"f3", OrderAlphabetic}, // explicit
{"f4", OrderRandom}, // unknown value, default
{"f5", OrderSmallestFirst}, // explicit
{"f6", OrderLargestFirst}, // explicit
{"f7", OrderOldestFirst}, // explicit
{"f8", OrderNewestFirst}, // explicit
}
// Verify values are deserialized correctly
for _, tc := range expected {
if actual := folders[tc.name].Order; actual != tc.order {
t.Errorf("Incorrect pull order for %q: %v != %v", tc.name, actual, tc.order)
}
}
// Serialize and deserialize again to verify it survives the transformation
buf := new(bytes.Buffer)
cfg := wrapper.Raw()
cfg.WriteXML(buf)
t.Logf("%s", buf.Bytes())
cfg, err = ReadXML(buf, device1)
wrapper = Wrap("testdata/pullorder.xml", cfg)
folders = wrapper.Folders()
for _, tc := range expected {
if actual := folders[tc.name].Order; actual != tc.order {
t.Errorf("Incorrect pull order for %q: %v != %v", tc.name, actual, tc.order)
}
}
}

25
internal/config/testdata/pullorder.xml vendored Normal file
View File

@ -0,0 +1,25 @@
<configuration version="10">
<folder id="f1" directory="testdata/">
</folder>
<folder id="f2" directory="testdata/">
<order>random</order>
</folder>
<folder id="f3" directory="testdata/">
<order>alphabetic</order>
</folder>
<folder id="f4" directory="testdata/">
<order>whatever</order>
</folder>
<folder id="f5" directory="testdata/">
<order>smallestFirst</order>
</folder>
<folder id="f6" directory="testdata/">
<order>largestFirst</order>
</folder>
<folder id="f7" directory="testdata/">
<order>oldestFirst</order>
</folder>
<folder id="f8" directory="testdata/">
<order>newestFirst</order>
</folder>
</configuration>

View File

@ -6,23 +6,34 @@
package model package model
import "github.com/syncthing/syncthing/internal/sync" import (
"math/rand"
"sort"
"github.com/syncthing/syncthing/internal/sync"
)
type jobQueue struct { type jobQueue struct {
progress []string progress []string
queued []string queued []jobQueueEntry
mut sync.Mutex mut sync.Mutex
} }
type jobQueueEntry struct {
name string
size int64
modified int64
}
func newJobQueue() *jobQueue { func newJobQueue() *jobQueue {
return &jobQueue{ return &jobQueue{
mut: sync.NewMutex(), mut: sync.NewMutex(),
} }
} }
func (q *jobQueue) Push(file string) { func (q *jobQueue) Push(file string, size, modified int64) {
q.mut.Lock() q.mut.Lock()
q.queued = append(q.queued, file) q.queued = append(q.queued, jobQueueEntry{file, size, modified})
q.mut.Unlock() q.mut.Unlock()
} }
@ -34,8 +45,7 @@ func (q *jobQueue) Pop() (string, bool) {
return "", false return "", false
} }
var f string f := q.queued[0].name
f = q.queued[0]
q.queued = q.queued[1:] q.queued = q.queued[1:]
q.progress = append(q.progress, f) q.progress = append(q.progress, f)
@ -47,7 +57,7 @@ func (q *jobQueue) BringToFront(filename string) {
defer q.mut.Unlock() defer q.mut.Unlock()
for i, cur := range q.queued { for i, cur := range q.queued {
if cur == filename { if cur.name == filename {
if i > 0 { if i > 0 {
// Shift the elements before the selected element one step to // Shift the elements before the selected element one step to
// the right, overwriting the selected element // the right, overwriting the selected element
@ -81,7 +91,62 @@ func (q *jobQueue) Jobs() ([]string, []string) {
copy(progress, q.progress) copy(progress, q.progress)
queued := make([]string, len(q.queued)) queued := make([]string, len(q.queued))
copy(queued, q.queued) for i := range q.queued {
queued[i] = q.queued[i].name
}
return progress, queued return progress, queued
} }
func (q *jobQueue) Shuffle() {
q.mut.Lock()
defer q.mut.Unlock()
l := len(q.queued)
for i := range q.queued {
r := rand.Intn(l)
q.queued[i], q.queued[r] = q.queued[r], q.queued[i]
}
}
func (q *jobQueue) SortSmallestFirst() {
q.mut.Lock()
defer q.mut.Unlock()
sort.Sort(smallestFirst(q.queued))
}
func (q *jobQueue) SortLargestFirst() {
q.mut.Lock()
defer q.mut.Unlock()
sort.Sort(sort.Reverse(smallestFirst(q.queued)))
}
func (q *jobQueue) SortOldestFirst() {
q.mut.Lock()
defer q.mut.Unlock()
sort.Sort(oldestFirst(q.queued))
}
func (q *jobQueue) SortNewestFirst() {
q.mut.Lock()
defer q.mut.Unlock()
sort.Sort(sort.Reverse(oldestFirst(q.queued)))
}
// The usual sort.Interface boilerplate
type smallestFirst []jobQueueEntry
func (q smallestFirst) Len() int { return len(q) }
func (q smallestFirst) Less(a, b int) bool { return q[a].size < q[b].size }
func (q smallestFirst) Swap(a, b int) { q[a], q[b] = q[b], q[a] }
type oldestFirst []jobQueueEntry
func (q oldestFirst) Len() int { return len(q) }
func (q oldestFirst) Less(a, b int) bool { return q[a].modified < q[b].modified }
func (q oldestFirst) Swap(a, b int) { q[a], q[b] = q[b], q[a] }

View File

@ -15,10 +15,10 @@ import (
func TestJobQueue(t *testing.T) { func TestJobQueue(t *testing.T) {
// Some random actions // Some random actions
q := newJobQueue() q := newJobQueue()
q.Push("f1") q.Push("f1", 0, 0)
q.Push("f2") q.Push("f2", 0, 0)
q.Push("f3") q.Push("f3", 0, 0)
q.Push("f4") q.Push("f4", 0, 0)
progress, queued := q.Jobs() progress, queued := q.Jobs()
if len(progress) != 0 || len(queued) != 4 { if len(progress) != 0 || len(queued) != 4 {
@ -43,7 +43,7 @@ func TestJobQueue(t *testing.T) {
t.Fatal("Wrong length", len(progress), len(queued)) t.Fatal("Wrong length", len(progress), len(queued))
} }
q.Push(n) q.Push(n, 0, 0)
progress, queued = q.Jobs() progress, queued = q.Jobs()
if len(progress) != 0 || len(queued) != 4 { if len(progress) != 0 || len(queued) != 4 {
t.Fatal("Wrong length") t.Fatal("Wrong length")
@ -120,10 +120,10 @@ func TestJobQueue(t *testing.T) {
func TestBringToFront(t *testing.T) { func TestBringToFront(t *testing.T) {
q := newJobQueue() q := newJobQueue()
q.Push("f1") q.Push("f1", 0, 0)
q.Push("f2") q.Push("f2", 0, 0)
q.Push("f3") q.Push("f3", 0, 0)
q.Push("f4") q.Push("f4", 0, 0)
_, queued := q.Jobs() _, queued := q.Jobs()
if !reflect.DeepEqual(queued, []string{"f1", "f2", "f3", "f4"}) { if !reflect.DeepEqual(queued, []string{"f1", "f2", "f3", "f4"}) {
@ -159,12 +159,101 @@ func TestBringToFront(t *testing.T) {
} }
} }
func TestShuffle(t *testing.T) {
q := newJobQueue()
q.Push("f1", 0, 0)
q.Push("f2", 0, 0)
q.Push("f3", 0, 0)
q.Push("f4", 0, 0)
// This test will fail once in eight million times (1 / (4!)^5) :)
for i := 0; i < 5; i++ {
q.Shuffle()
_, queued := q.Jobs()
if l := len(queued); l != 4 {
t.Fatalf("Weird length %d returned from Jobs()", l)
}
t.Logf("%v", queued)
if !reflect.DeepEqual(queued, []string{"f1", "f2", "f3", "f4"}) {
// The queue was shuffled
return
}
}
t.Error("Queue was not shuffled after five attempts.")
}
func TestSortBySize(t *testing.T) {
q := newJobQueue()
q.Push("f1", 20, 0)
q.Push("f2", 40, 0)
q.Push("f3", 30, 0)
q.Push("f4", 10, 0)
q.SortSmallestFirst()
_, actual := q.Jobs()
if l := len(actual); l != 4 {
t.Fatalf("Weird length %d returned from Jobs()", l)
}
expected := []string{"f4", "f1", "f3", "f2"}
if !reflect.DeepEqual(actual, expected) {
t.Errorf("SortSmallestFirst(): %#v != %#v", actual, expected)
}
q.SortLargestFirst()
_, actual = q.Jobs()
if l := len(actual); l != 4 {
t.Fatalf("Weird length %d returned from Jobs()", l)
}
expected = []string{"f2", "f3", "f1", "f4"}
if !reflect.DeepEqual(actual, expected) {
t.Errorf("SortLargestFirst(): %#v != %#v", actual, expected)
}
}
func TestSortByAge(t *testing.T) {
q := newJobQueue()
q.Push("f1", 0, 20)
q.Push("f2", 0, 40)
q.Push("f3", 0, 30)
q.Push("f4", 0, 10)
q.SortOldestFirst()
_, actual := q.Jobs()
if l := len(actual); l != 4 {
t.Fatalf("Weird length %d returned from Jobs()", l)
}
expected := []string{"f4", "f1", "f3", "f2"}
if !reflect.DeepEqual(actual, expected) {
t.Errorf("SortOldestFirst(): %#v != %#v", actual, expected)
}
q.SortNewestFirst()
_, actual = q.Jobs()
if l := len(actual); l != 4 {
t.Fatalf("Weird length %d returned from Jobs()", l)
}
expected = []string{"f2", "f3", "f1", "f4"}
if !reflect.DeepEqual(actual, expected) {
t.Errorf("SortNewestFirst(): %#v != %#v", actual, expected)
}
}
func BenchmarkJobQueueBump(b *testing.B) { func BenchmarkJobQueueBump(b *testing.B) {
files := genFiles(b.N) files := genFiles(b.N)
q := newJobQueue() q := newJobQueue()
for _, f := range files { for _, f := range files {
q.Push(f.Name) q.Push(f.Name, 0, 0)
} }
b.ResetTimer() b.ResetTimer()
@ -180,7 +269,7 @@ func BenchmarkJobQueuePushPopDone10k(b *testing.B) {
for i := 0; i < b.N; i++ { for i := 0; i < b.N; i++ {
q := newJobQueue() q := newJobQueue()
for _, f := range files { for _, f := range files {
q.Push(f.Name) q.Push(f.Name, 0, 0)
} }
for _ = range files { for _ = range files {
n, _ := q.Pop() n, _ := q.Pop()

View File

@ -69,6 +69,7 @@ type rwFolder struct {
copiers int copiers int
pullers int pullers int
shortID uint64 shortID uint64
order config.PullOrder
stop chan struct{} stop chan struct{}
queue *jobQueue queue *jobQueue
@ -93,6 +94,7 @@ func newRWFolder(m *Model, shortID uint64, cfg config.FolderConfiguration) *rwFo
copiers: cfg.Copiers, copiers: cfg.Copiers,
pullers: cfg.Pullers, pullers: cfg.Pullers,
shortID: shortID, shortID: shortID,
order: cfg.Order,
stop: make(chan struct{}), stop: make(chan struct{}),
queue: newJobQueue(), queue: newJobQueue(),
@ -346,13 +348,9 @@ func (p *rwFolder) pullerIteration(ignores *ignore.Matcher) int {
buckets := map[string][]protocol.FileInfo{} buckets := map[string][]protocol.FileInfo{}
folderFiles.WithNeed(protocol.LocalDeviceID, func(intf db.FileIntf) bool { folderFiles.WithNeed(protocol.LocalDeviceID, func(intf db.FileIntf) bool {
// Needed items are delivered sorted lexicographically. We'll handle
// Needed items are delivered sorted lexicographically. This isn't // directories as they come along, so parents before children. Files
// really optimal from a performance point of view - it would be // are queued and the order may be changed later.
// better if files were handled in random order, to spread the load
// over the cluster. But it means that we can be sure that we fully
// handle directories before the files that go inside them, which is
// nice.
file := intf.(protocol.FileInfo) file := intf.(protocol.FileInfo)
@ -392,13 +390,32 @@ func (p *rwFolder) pullerIteration(ignores *ignore.Matcher) int {
default: default:
// A new or changed file or symlink. This is the only case where we // A new or changed file or symlink. This is the only case where we
// do stuff concurrently in the background // do stuff concurrently in the background
p.queue.Push(file.Name) p.queue.Push(file.Name, file.Size(), file.Modified)
} }
changed++ changed++
return true return true
}) })
// Reorder the file queue according to configuration
switch p.order {
case config.OrderRandom:
p.queue.Shuffle()
case config.OrderAlphabetic:
// The queue is already in alphabetic order.
case config.OrderSmallestFirst:
p.queue.SortSmallestFirst()
case config.OrderLargestFirst:
p.queue.SortLargestFirst()
case config.OrderOldestFirst:
p.queue.SortOldestFirst()
case config.OrderNewestFirst:
p.queue.SortOldestFirst()
}
// Process the file queue
nextFile: nextFile:
for { for {
fileName, ok := p.queue.Pop() fileName, ok := p.queue.Pop()

View File

@ -393,7 +393,7 @@ func TestDeregisterOnFailInCopy(t *testing.T) {
} }
// queue.Done should be called by the finisher routine // queue.Done should be called by the finisher routine
p.queue.Push("filex") p.queue.Push("filex", 0, 0)
p.queue.Pop() p.queue.Pop()
if len(p.queue.progress) != 1 { if len(p.queue.progress) != 1 {
@ -480,7 +480,7 @@ func TestDeregisterOnFailInPull(t *testing.T) {
} }
// queue.Done should be called by the finisher routine // queue.Done should be called by the finisher routine
p.queue.Push("filex") p.queue.Push("filex", 0, 0)
p.queue.Pop() p.queue.Pop()
if len(p.queue.progress) != 1 { if len(p.queue.progress) != 1 {