syncthing/lib/scanner/blocks.go

228 lines
5.2 KiB
Go
Raw Normal View History

2014-11-16 21:13:20 +01:00
// Copyright (C) 2014 The Syncthing Authors.
2014-09-29 21:43:32 +02:00
//
2015-03-07 21:36:35 +01:00
// This Source Code Form is subject to the terms of the Mozilla Public
// License, v. 2.0. If a copy of the MPL was not distributed with this file,
// You can obtain one at http://mozilla.org/MPL/2.0/.
2014-06-01 22:50:14 +02:00
package scanner
2014-03-02 23:58:14 +01:00
import (
"bytes"
"crypto/sha256"
"fmt"
2014-03-02 23:58:14 +01:00
"io"
2014-07-12 23:06:48 +02:00
2015-09-22 19:38:46 +02:00
"github.com/syncthing/syncthing/lib/protocol"
2014-03-02 23:58:14 +01:00
)
2014-10-24 23:20:08 +01:00
// SHA256OfNothing is the SHA-256 hash of zero bytes of input. Blocks uses it
// as the hash of the single zero-sized block it returns for empty input.
var SHA256OfNothing = []uint8{0xe3, 0xb0, 0xc4, 0x42, 0x98, 0xfc, 0x1c, 0x14, 0x9a, 0xfb, 0xf4, 0xc8, 0x99, 0x6f, 0xb9, 0x24, 0x27, 0xae, 0x41, 0xe4, 0x64, 0x9b, 0x93, 0x4c, 0xa4, 0x95, 0x99, 0x1b, 0x78, 0x52, 0xb8, 0x55}
2014-07-26 21:28:32 +02:00
2015-11-17 21:08:36 +01:00
// Counter receives progress updates while data is being hashed. Blocks calls
// Update once per hashed block when it is given a non-nil Counter.
type Counter interface {
// Update is called with the number of bytes that were just hashed.
Update(bytes int64)
}
2014-03-02 23:58:14 +01:00
// Blocks returns the blockwise hash of the reader.
2015-11-17 21:08:36 +01:00
func Blocks(r io.Reader, blocksize int, sizehint int64, counter Counter) ([]protocol.BlockInfo, error) {
hf := sha256.New()
hashLength := hf.Size()
2014-07-12 23:06:48 +02:00
var blocks []protocol.BlockInfo
var hashes, thisHash []byte
if sizehint >= 0 {
// Allocate contiguous blocks for the BlockInfo structures and their
// hashes once and for all, and stick to the specified size.
r = io.LimitReader(r, sizehint)
numBlocks := int(sizehint / int64(blocksize))
blocks = make([]protocol.BlockInfo, 0, numBlocks)
hashes = make([]byte, 0, hashLength*numBlocks)
2014-08-12 13:52:36 +02:00
}
// A 32k buffer is used for copying into the hash function.
buf := make([]byte, 32<<10)
2014-03-02 23:58:14 +01:00
var offset int64
for {
lr := io.LimitReader(r, int64(blocksize))
n, err := copyBuffer(hf, lr, buf)
2014-03-02 23:58:14 +01:00
if err != nil {
return nil, err
}
if n == 0 {
break
}
2015-08-26 23:49:06 +01:00
if counter != nil {
2015-11-17 21:08:36 +01:00
counter.Update(int64(n))
2015-08-26 23:49:06 +01:00
}
// Carve out a hash-sized chunk of "hashes" to store the hash for this
// block.
hashes = hf.Sum(hashes)
thisHash, hashes = hashes[:hashLength], hashes[hashLength:]
2014-07-12 23:06:48 +02:00
b := protocol.BlockInfo{
Size: int32(n),
2014-07-12 23:06:48 +02:00
Offset: offset,
Hash: thisHash,
2014-03-02 23:58:14 +01:00
}
2014-03-02 23:58:14 +01:00
blocks = append(blocks, b)
offset += int64(n)
2014-08-12 13:52:36 +02:00
hf.Reset()
2014-03-02 23:58:14 +01:00
}
if len(blocks) == 0 {
// Empty file
2014-07-12 23:06:48 +02:00
blocks = append(blocks, protocol.BlockInfo{
2014-03-02 23:58:14 +01:00
Offset: 0,
Size: 0,
2014-10-24 23:20:08 +01:00
Hash: SHA256OfNothing,
2014-03-02 23:58:14 +01:00
})
}
return blocks, nil
}
2015-04-28 22:32:10 +02:00
// PopulateOffsets rewrites the Offset field of every block in place so that
// each block starts where the previous one ends, with the first block at
// offset zero. Block sizes are taken from the Size fields as they are.
func PopulateOffsets(blocks []protocol.BlockInfo) {
	next := int64(0)
	for i := range blocks {
		blk := &blocks[i]
		blk.Offset = next
		next += int64(blk.Size)
	}
}
2014-03-02 23:58:14 +01:00
// BlockDiff returns lists of common and missing (to transform src into tgt)
// blocks. Both block lists must have been created with the same block size.
2014-07-12 23:06:48 +02:00
func BlockDiff(src, tgt []protocol.BlockInfo) (have, need []protocol.BlockInfo) {
2014-03-02 23:58:14 +01:00
if len(tgt) == 0 && len(src) != 0 {
return nil, nil
}
if len(tgt) != 0 && len(src) == 0 {
// Copy the entire file
return nil, tgt
}
for i := range tgt {
if i >= len(src) || !bytes.Equal(tgt[i].Hash, src[i].Hash) {
2014-03-02 23:58:14 +01:00
// Copy differing block
need = append(need, tgt[i])
} else {
have = append(have, tgt[i])
}
}
return have, need
}
// Verify returns nil or an error describing the mismatch between the block
// list and actual reader contents.
//
// The reader is consumed blocksize bytes at a time, and the SHA-256 hash of
// the i:th chunk must equal blocks[i].Hash. Once all blocks have been
// checked the reader must be exhausted; any further data is reported as an
// error. Errors from the reader itself are returned unchanged.
func Verify(r io.Reader, blocksize int, blocks []protocol.BlockInfo) error {
	hf := sha256.New()
	for i, block := range blocks {
		lr := &io.LimitedReader{R: r, N: int64(blocksize)}
		if _, err := io.Copy(hf, lr); err != nil {
			return err
		}

		hash := hf.Sum(nil)
		hf.Reset()

		if !bytes.Equal(hash, block.Hash) {
			return fmt.Errorf("hash mismatch %x != %x for block %d", hash, block.Hash, i)
		}
	}

	// We should have reached the end now. io.ReadFull is used rather than a
	// bare Read so that a reader returning (0, nil), which is allowed and
	// does not mean end of file, is not mistaken for trailing data.
	var probe [1]byte
	n, err := io.ReadFull(r, probe[:])
	if n != 0 {
		return fmt.Errorf("file continues past end of blocks")
	}
	if err != io.EOF {
		// A genuine read failure; report it as such instead of claiming
		// that the file is too long.
		return err
	}

	return nil
}
2014-11-09 04:26:52 +00:00
// VerifyBuffer checks buf against the size and SHA-256 hash recorded in
// block. On success it returns the computed hash and a nil error. If the
// length of buf differs from block.Size it returns a nil hash and an error;
// if the hashes differ it returns the computed hash together with an error.
func VerifyBuffer(buf []byte, block protocol.BlockInfo) ([]byte, error) {
	if want := int(block.Size); len(buf) != want {
		return nil, fmt.Errorf("length mismatch %d != %d", len(buf), block.Size)
	}

	// One-shot digest of the whole buffer.
	sum := sha256.Sum256(buf)
	hash := sum[:]

	if bytes.Equal(hash, block.Hash) {
		return hash, nil
	}
	return hash, fmt.Errorf("hash mismatch %x != %x", hash, block.Hash)
}
2015-04-28 22:32:10 +02:00
// BlocksEqual returns whether two slices of blocks are exactly the same hash
2014-11-09 04:26:52 +00:00
// and index pair wise.
func BlocksEqual(src, tgt []protocol.BlockInfo) bool {
if len(tgt) != len(src) {
return false
}
for i, sblk := range src {
if !bytes.Equal(sblk.Hash, tgt[i].Hash) {
return false
}
}
return true
}
// copyBuffer is a local copy of io.copyBuffer from the Go 1.5 standard
// library, kept here because the package should also build with Go 1.3+.
//
// It copies from src to dst until src reports io.EOF or an error occurs, and
// returns the number of bytes written together with the first error
// encountered, if any. Reaching io.EOF is not reported as an error. buf is
// used as scratch space for the copy; if buf is nil, one is allocated.
func copyBuffer(dst io.Writer, src io.Reader, buf []byte) (written int64, err error) {
	// If the reader has a WriteTo method, use it to do the copy.
	// Avoids an allocation and a copy.
	if writerTo, ok := src.(io.WriterTo); ok {
		return writerTo.WriteTo(dst)
	}
	// Similarly, if the writer has a ReadFrom method, use it to do the copy.
	if readerFrom, ok := dst.(io.ReaderFrom); ok {
		return readerFrom.ReadFrom(src)
	}

	if buf == nil {
		buf = make([]byte, 32<<10)
	}

	for {
		nr, readErr := src.Read(buf)

		// Flush whatever was read before looking at the read error, since a
		// reader may return data together with an error.
		if nr > 0 {
			nw, writeErr := dst.Write(buf[:nr])
			if nw > 0 {
				written += int64(nw)
			}
			switch {
			case writeErr != nil:
				return written, writeErr
			case nw != nr:
				return written, io.ErrShortWrite
			}
		}

		if readErr != nil {
			// End of input is the normal way out and is not an error.
			if readErr != io.EOF {
				err = readErr
			}
			return written, err
		}
	}
}