Improve benchmarks

License: MIT
Signed-off-by: default avatarJakub Sztandera <kubuxu@protocol.ai>
parent b1c398a9
package chunk
import (
"bytes"
"io"
"math/rand"
"testing"
)
type newSplitter func(io.Reader) Splitter
type bencSpec struct {
size int
name string
}
var bSizes = []bencSpec{
{1 << 10, "1K"},
{1 << 20, "1M"},
{16 << 20, "16M"},
{100 << 20, "100M"},
}
func benchmarkChunker(b *testing.B, ns newSplitter) {
for _, s := range bSizes {
s := s
b.Run(s.name, func(b *testing.B) {
benchmarkChunkerSize(b, ns, s.size)
})
}
}
func benchmarkChunkerSize(b *testing.B, ns newSplitter, size int) {
rng := rand.New(rand.NewSource(1))
data := make([]byte, size)
rng.Read(data)
b.SetBytes(int64(size))
b.ReportAllocs()
b.ResetTimer()
var res uint64
for i := 0; i < b.N; i++ {
r := ns(bytes.NewReader(data))
for {
chunk, err := r.NextBytes()
if err != nil {
if err == io.EOF {
break
}
b.Fatal(err)
}
res = res + uint64(len(chunk))
}
}
Res = Res + res
}
...@@ -28,6 +28,10 @@ func NewBuzhash(r io.Reader) *Buzhash { ...@@ -28,6 +28,10 @@ func NewBuzhash(r io.Reader) *Buzhash {
} }
} }
func (b *Buzhash) Reader() io.Reader {
return b.r
}
func (b *Buzhash) NextBytes() ([]byte, error) { func (b *Buzhash) NextBytes() ([]byte, error) {
if b.err != nil { if b.err != nil {
return nil, b.err return nil, b.err
......
...@@ -41,37 +41,16 @@ func TestBuzhashChunking(t *testing.T) { ...@@ -41,37 +41,16 @@ func TestBuzhashChunking(t *testing.T) {
} }
func TestBuzhashChunkReuse(t *testing.T) { func TestBuzhashChunkReuse(t *testing.T) {
newBuzhash := func(r io.Reader) cher { newBuzhash := func(r io.Reader) Splitter {
return NewBuzhash(r) return NewBuzhash(r)
} }
testReuse(t, newBuzhash) testReuse(t, newBuzhash)
} }
func BenchmarkBuzhash(b *testing.B) { func BenchmarkBuzhash2(b *testing.B) {
data := make([]byte, 1<<10) benchmarkChunker(b, func(r io.Reader) Splitter {
util.NewTimeSeededRand().Read(data) return NewBuzhash(r)
})
b.SetBytes(int64(len(data)))
b.ReportAllocs()
b.ResetTimer()
var res uint64
for i := 0; i < b.N; i++ {
r := NewBuzhash(bytes.NewReader(data))
for {
chunk, err := r.NextBytes()
if err != nil {
if err == io.EOF {
break
}
b.Fatal(err)
}
res = res + uint64(len(chunk))
}
}
Res = Res + res
} }
func TestBuzhashBitsHash(t *testing.T) { func TestBuzhashBitsHash(t *testing.T) {
......
...@@ -39,13 +39,7 @@ func TestRabinChunking(t *testing.T) { ...@@ -39,13 +39,7 @@ func TestRabinChunking(t *testing.T) {
} }
} }
type cher interface { func chunkData(t *testing.T, newC newSplitter, data []byte) map[string]blocks.Block {
NextBytes() ([]byte, error)
}
type newChunker func(io.Reader) cher
func chunkData(t *testing.T, newC newChunker, data []byte) map[string]blocks.Block {
r := newC(bytes.NewReader(data)) r := newC(bytes.NewReader(data))
blkmap := make(map[string]blocks.Block) blkmap := make(map[string]blocks.Block)
...@@ -66,7 +60,7 @@ func chunkData(t *testing.T, newC newChunker, data []byte) map[string]blocks.Blo ...@@ -66,7 +60,7 @@ func chunkData(t *testing.T, newC newChunker, data []byte) map[string]blocks.Blo
return blkmap return blkmap
} }
func testReuse(t *testing.T, cr newChunker) { func testReuse(t *testing.T, cr newSplitter) {
data := make([]byte, 1024*1024*16) data := make([]byte, 1024*1024*16)
util.NewTimeSeededRand().Read(data) util.NewTimeSeededRand().Read(data)
...@@ -87,7 +81,7 @@ func testReuse(t *testing.T, cr newChunker) { ...@@ -87,7 +81,7 @@ func testReuse(t *testing.T, cr newChunker) {
} }
func TestRabinChunkReuse(t *testing.T) { func TestRabinChunkReuse(t *testing.T) {
newRabin := func(r io.Reader) cher { newRabin := func(r io.Reader) Splitter {
return NewRabin(r, 256*1024) return NewRabin(r, 256*1024)
} }
testReuse(t, newRabin) testReuse(t, newRabin)
...@@ -96,29 +90,7 @@ func TestRabinChunkReuse(t *testing.T) { ...@@ -96,29 +90,7 @@ func TestRabinChunkReuse(t *testing.T) {
var Res uint64 var Res uint64
func BenchmarkRabin(b *testing.B) { func BenchmarkRabin(b *testing.B) {
const size = 1 << 10 benchmarkChunker(b, func(r io.Reader) Splitter {
data := make([]byte, size) return NewRabin(r, 256<<10)
util.NewTimeSeededRand().Read(data) })
b.SetBytes(size)
b.ReportAllocs()
b.ResetTimer()
var res uint64
for i := 0; i < b.N; i++ {
r := NewRabin(bytes.NewReader(data), 1024*256)
for {
chunk, err := r.NextBytes()
if err != nil {
if err == io.EOF {
break
}
b.Fatal(err)
}
res = res + uint64(len(chunk))
}
}
Res = Res + res
} }
...@@ -6,7 +6,6 @@ import ( ...@@ -6,7 +6,6 @@ import (
"testing" "testing"
u "github.com/ipfs/go-ipfs-util" u "github.com/ipfs/go-ipfs-util"
util "github.com/ipfs/go-ipfs-util"
) )
func randBuf(t *testing.T, size int) []byte { func randBuf(t *testing.T, size int) []byte {
...@@ -121,29 +120,7 @@ func (s *clipReader) Read(buf []byte) (int, error) { ...@@ -121,29 +120,7 @@ func (s *clipReader) Read(buf []byte) (int, error) {
} }
func BenchmarkDefault(b *testing.B) { func BenchmarkDefault(b *testing.B) {
const size = 1 << 10 benchmarkChunker(b, func(r io.Reader) Splitter {
data := make([]byte, size) return DefaultSplitter(r)
util.NewTimeSeededRand().Read(data) })
b.SetBytes(size)
b.ReportAllocs()
b.ResetTimer()
var res uint64
for i := 0; i < b.N; i++ {
r := DefaultSplitter(bytes.NewReader(data))
for {
chunk, err := r.NextBytes()
if err != nil {
if err == io.EOF {
break
}
b.Fatal(err)
}
res = res + uint64(len(chunk))
}
}
Res = Res + res
} }
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment