205 lines
4.6 KiB
Go
205 lines
4.6 KiB
Go
package blockstore
|
|
|
|
import (
|
|
"context"
|
|
"fmt"
|
|
"sync/atomic"
|
|
"time"
|
|
|
|
bloom "github.com/ipfs/bbloom"
|
|
blocks "github.com/ipfs/go-block-format"
|
|
cid "github.com/ipfs/go-cid"
|
|
metrics "github.com/ipfs/go-metrics-interface"
|
|
)
|
|
|
|
// bloomCached returns a Blockstore that caches Has requests using a Bloom
|
|
// filter. bloomSize is size of bloom filter in bytes. hashCount specifies the
|
|
// number of hashing functions in the bloom filter (usually known as k).
|
|
func bloomCached(ctx context.Context, bs Blockstore, bloomSize, hashCount int) (*bloomcache, error) {
|
|
bl, err := bloom.New(float64(bloomSize), float64(hashCount))
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
bc := &bloomcache{
|
|
blockstore: bs,
|
|
bloom: bl,
|
|
hits: metrics.NewCtx(ctx, "bloom.hits_total",
|
|
"Number of cache hits in bloom cache").Counter(),
|
|
total: metrics.NewCtx(ctx, "bloom_total",
|
|
"Total number of requests to bloom cache").Counter(),
|
|
buildChan: make(chan struct{}),
|
|
}
|
|
go func() {
|
|
err := bc.build(ctx)
|
|
if err != nil {
|
|
select {
|
|
case <-ctx.Done():
|
|
log.Warning("Cache rebuild closed by context finishing: ", err)
|
|
default:
|
|
log.Error(err)
|
|
}
|
|
return
|
|
}
|
|
if metrics.Active() {
|
|
fill := metrics.NewCtx(ctx, "bloom_fill_ratio",
|
|
"Ratio of bloom filter fullnes, (updated once a minute)").Gauge()
|
|
|
|
t := time.NewTicker(1 * time.Minute)
|
|
defer t.Stop()
|
|
for {
|
|
select {
|
|
case <-ctx.Done():
|
|
return
|
|
case <-t.C:
|
|
fill.Set(bc.bloom.FillRatio())
|
|
}
|
|
}
|
|
}
|
|
}()
|
|
return bc, nil
|
|
}
|
|
|
|
type bloomcache struct {
|
|
active int32
|
|
|
|
bloom *bloom.Bloom
|
|
buildErr error
|
|
|
|
buildChan chan struct{}
|
|
blockstore Blockstore
|
|
|
|
// Statistics
|
|
hits metrics.Counter
|
|
total metrics.Counter
|
|
}
|
|
|
|
func (b *bloomcache) BloomActive() bool {
|
|
return atomic.LoadInt32(&b.active) != 0
|
|
}
|
|
|
|
func (b *bloomcache) Wait(ctx context.Context) error {
|
|
select {
|
|
case <-ctx.Done():
|
|
return ctx.Err()
|
|
case <-b.buildChan:
|
|
return b.buildErr
|
|
}
|
|
}
|
|
|
|
func (b *bloomcache) build(ctx context.Context) error {
|
|
evt := log.EventBegin(ctx, "bloomcache.build")
|
|
defer evt.Done()
|
|
defer close(b.buildChan)
|
|
|
|
ch, err := b.blockstore.AllKeysChan(ctx)
|
|
if err != nil {
|
|
b.buildErr = fmt.Errorf("AllKeysChan failed in bloomcache rebuild with: %v", err)
|
|
return b.buildErr
|
|
}
|
|
for {
|
|
select {
|
|
case key, ok := <-ch:
|
|
if !ok {
|
|
atomic.StoreInt32(&b.active, 1)
|
|
return nil
|
|
}
|
|
b.bloom.AddTS(key.Bytes()) // Use binary key, the more compact the better
|
|
case <-ctx.Done():
|
|
b.buildErr = ctx.Err()
|
|
return b.buildErr
|
|
}
|
|
}
|
|
}
|
|
|
|
func (b *bloomcache) DeleteBlock(k cid.Cid) error {
|
|
if has, ok := b.hasCached(k); ok && !has {
|
|
return ErrNotFound
|
|
}
|
|
|
|
return b.blockstore.DeleteBlock(k)
|
|
}
|
|
|
|
// if ok == false has is inconclusive
|
|
// if ok == true then has respons to question: is it contained
|
|
func (b *bloomcache) hasCached(k cid.Cid) (has bool, ok bool) {
|
|
b.total.Inc()
|
|
if !k.Defined() {
|
|
log.Error("undefined in bloom cache")
|
|
// Return cache invalid so call to blockstore
|
|
// in case of invalid key is forwarded deeper
|
|
return false, false
|
|
}
|
|
if b.BloomActive() {
|
|
blr := b.bloom.HasTS(k.Bytes())
|
|
if !blr { // not contained in bloom is only conclusive answer bloom gives
|
|
b.hits.Inc()
|
|
return false, true
|
|
}
|
|
}
|
|
return false, false
|
|
}
|
|
|
|
func (b *bloomcache) Has(k cid.Cid) (bool, error) {
|
|
if has, ok := b.hasCached(k); ok {
|
|
return has, nil
|
|
}
|
|
|
|
return b.blockstore.Has(k)
|
|
}
|
|
|
|
func (b *bloomcache) GetSize(k cid.Cid) (int, error) {
|
|
return b.blockstore.GetSize(k)
|
|
}
|
|
|
|
func (b *bloomcache) Get(k cid.Cid) (blocks.Block, error) {
|
|
if has, ok := b.hasCached(k); ok && !has {
|
|
return nil, ErrNotFound
|
|
}
|
|
|
|
return b.blockstore.Get(k)
|
|
}
|
|
|
|
func (b *bloomcache) Put(bl blocks.Block) error {
|
|
// See comment in PutMany
|
|
err := b.blockstore.Put(bl)
|
|
if err == nil {
|
|
b.bloom.AddTS(bl.Cid().Bytes())
|
|
}
|
|
return err
|
|
}
|
|
|
|
func (b *bloomcache) PutMany(bs []blocks.Block) error {
|
|
// bloom cache gives only conclusive resulty if key is not contained
|
|
// to reduce number of puts we need conclusive information if block is contained
|
|
// this means that PutMany can't be improved with bloom cache so we just
|
|
// just do a passthrough.
|
|
err := b.blockstore.PutMany(bs)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
for _, bl := range bs {
|
|
b.bloom.AddTS(bl.Cid().Bytes())
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func (b *bloomcache) HashOnRead(enabled bool) {
|
|
b.blockstore.HashOnRead(enabled)
|
|
}
|
|
|
|
func (b *bloomcache) AllKeysChan(ctx context.Context) (<-chan cid.Cid, error) {
|
|
return b.blockstore.AllKeysChan(ctx)
|
|
}
|
|
|
|
func (b *bloomcache) GCLock() Unlocker {
|
|
return b.blockstore.(GCBlockstore).GCLock()
|
|
}
|
|
|
|
func (b *bloomcache) PinLock() Unlocker {
|
|
return b.blockstore.(GCBlockstore).PinLock()
|
|
}
|
|
|
|
func (b *bloomcache) GCRequested() bool {
|
|
return b.blockstore.(GCBlockstore).GCRequested()
|
|
}
|