2
2
mirror of https://github.com/octoleo/restic.git synced 2025-01-05 16:12:29 +00:00

chunker: Add test, only pass hash.Hash to New()

This commit is contained in:
Alexander Neumann 2015-02-11 13:10:36 +01:00
parent 869ba83c6d
commit 3bf66d24fa
3 changed files with 57 additions and 20 deletions

View File

@ -67,16 +67,16 @@ type Chunker struct {
digest uint64 digest uint64
h hash.Hash h hash.Hash
hfn func() hash.Hash
} }
// New returns a new Chunker that reads from data from rd. // New returns a new Chunker that reads from data from rd with bufsize and pass
func New(rd io.Reader, bufsize int, hashfn func() hash.Hash) *Chunker { // all data to hash along the way.
func New(rd io.Reader, bufsize int, hash hash.Hash) *Chunker {
once.Do(fill_tables) once.Do(fill_tables)
c := &Chunker{ c := &Chunker{
buf: make([]byte, bufsize), buf: make([]byte, bufsize),
hfn: hashfn, h: hash,
} }
c.Reset(rd) c.Reset(rd)
@ -99,7 +99,9 @@ func (c *Chunker) Reset(rd io.Reader) {
c.count = 0 c.count = 0
c.slide(1) c.slide(1)
c.resetHash() if c.h != nil {
c.h.Reset()
}
// do not start a new chunk unless at least MinSize bytes have been read // do not start a new chunk unless at least MinSize bytes have been read
c.pre = MinSize - WindowSize c.pre = MinSize - WindowSize
@ -232,7 +234,9 @@ func (c *Chunker) Next() (*Chunk, error) {
Digest: c.hashDigest(), Digest: c.hashDigest(),
} }
c.resetHash() if c.h != nil {
c.h.Reset()
}
// reset chunker, but keep position // reset chunker, but keep position
pos := c.pos pos := c.pos
@ -255,12 +259,6 @@ func (c *Chunker) Next() (*Chunk, error) {
} }
} }
func (c *Chunker) resetHash() {
if c.hfn != nil {
c.h = c.hfn()
}
}
func (c *Chunker) updateHash(data []byte) { func (c *Chunker) updateHash(data []byte) {
if c.h != nil { if c.h != nil {
// the hashes from crypto/sha* do not return an error // the hashes from crypto/sha* do not return an error

View File

@ -8,6 +8,7 @@ import (
"flag" "flag"
"hash" "hash"
"io" "io"
"io/ioutil"
"math/rand" "math/rand"
"os" "os"
"testing" "testing"
@ -104,7 +105,7 @@ func test_with_data(t *testing.T, chnker *chunker.Chunker, testChunks []chunk) [
i, len(chunks)-1, chunk.CutFP, c.Cut) i, len(chunks)-1, chunk.CutFP, c.Cut)
} }
if !bytes.Equal(c.Digest, chunk.Digest) { if c.Digest != nil && !bytes.Equal(c.Digest, chunk.Digest) {
t.Fatalf("Digest fingerprint for chunk %d/%d does not match: expected %02x, got %02x", t.Fatalf("Digest fingerprint for chunk %d/%d does not match: expected %02x, got %02x",
i, len(chunks)-1, chunk.Digest, c.Digest) i, len(chunks)-1, chunk.Digest, c.Digest)
} }
@ -145,7 +146,7 @@ func get_random(seed, count int) []byte {
func TestChunker(t *testing.T) { func TestChunker(t *testing.T) {
// setup data source // setup data source
buf := get_random(23, 32*1024*1024) buf := get_random(23, 32*1024*1024)
ch := chunker.New(bytes.NewReader(buf), *testBufSize, sha256.New) ch := chunker.New(bytes.NewReader(buf), *testBufSize, sha256.New())
chunks := test_with_data(t, ch, chunks1) chunks := test_with_data(t, ch, chunks1)
// test reader // test reader
@ -172,14 +173,52 @@ func TestChunker(t *testing.T) {
// setup nullbyte data source // setup nullbyte data source
buf = bytes.Repeat([]byte{0}, len(chunks2)*chunker.MinSize) buf = bytes.Repeat([]byte{0}, len(chunks2)*chunker.MinSize)
ch = chunker.New(bytes.NewReader(buf), *testBufSize, sha256.New) ch = chunker.New(bytes.NewReader(buf), *testBufSize, sha256.New())
test_with_data(t, ch, chunks2)
}
func TestChunkerWithoutHash(t *testing.T) {
// setup data source
buf := get_random(23, 32*1024*1024)
ch := chunker.New(bytes.NewReader(buf), *testBufSize, nil)
chunks := test_with_data(t, ch, chunks1)
// test reader
for i, c := range chunks {
rd := c.Reader(bytes.NewReader(buf))
buf2, err := ioutil.ReadAll(rd)
if err != nil {
t.Fatalf("io.Copy(): %v", err)
}
if uint(len(buf2)) != chunks1[i].Length {
t.Fatalf("reader returned wrong number of bytes: expected %d, got %d",
chunks1[i].Length, uint(len(buf2)))
}
if uint(len(buf2)) != chunks1[i].Length {
t.Fatalf("wrong number of bytes returned: expected %02x, got %02x",
chunks[i].Length, len(buf2))
}
if !bytes.Equal(buf[c.Start:c.Start+c.Length], buf2) {
t.Fatalf("invalid data for chunk returned: expected %02x, got %02x",
buf[c.Start:c.Start+c.Length], buf2)
}
}
// setup nullbyte data source
buf = bytes.Repeat([]byte{0}, len(chunks2)*chunker.MinSize)
ch = chunker.New(bytes.NewReader(buf), *testBufSize, sha256.New())
test_with_data(t, ch, chunks2) test_with_data(t, ch, chunks2)
} }
func TestChunkerReuse(t *testing.T) { func TestChunkerReuse(t *testing.T) {
// test multiple uses of the same chunker // test multiple uses of the same chunker
ch := chunker.New(nil, *testBufSize, sha256.New) ch := chunker.New(nil, *testBufSize, sha256.New())
buf := get_random(23, 32*1024*1024) buf := get_random(23, 32*1024*1024)
for i := 0; i < 4; i++ { for i := 0; i < 4; i++ {
@ -188,7 +227,7 @@ func TestChunkerReuse(t *testing.T) {
} }
} }
func benchmarkChunker(b *testing.B, hash func() hash.Hash) { func benchmarkChunker(b *testing.B, hash hash.Hash) {
var ( var (
rd io.ReadSeeker rd io.ReadSeeker
size int size int
@ -244,11 +283,11 @@ func benchmarkChunker(b *testing.B, hash func() hash.Hash) {
} }
func BenchmarkChunkerWithSHA256(b *testing.B) { func BenchmarkChunkerWithSHA256(b *testing.B) {
benchmarkChunker(b, sha256.New) benchmarkChunker(b, sha256.New())
} }
func BenchmarkChunkerWithMD5(b *testing.B) { func BenchmarkChunkerWithMD5(b *testing.B) {
benchmarkChunker(b, md5.New) benchmarkChunker(b, md5.New())
} }
func BenchmarkChunker(b *testing.B) { func BenchmarkChunker(b *testing.B) {

View File

@ -99,7 +99,7 @@ func newChunker() interface{} {
chunkStats.new++ chunkStats.new++
// create a new chunker with a nil reader // create a new chunker with a nil reader
return chunker.New(nil, chunkerBufSize, sha256.New) return chunker.New(nil, chunkerBufSize, sha256.New())
} }
func GetChunkBuf(s string) []byte { func GetChunkBuf(s string) []byte {