9a58a9b91a
* swarm/storage/localstore: most basic database * swarm/storage/localstore: fix typos and comments * swarm/shed: add uint64 field Dec and DecInBatch methods * swarm/storage/localstore: decrement size counter on ModeRemoval update * swarm/storage/localstore: unexport modeAccess and modeRemoval * swarm/storage/localstore: add WithRetrievalCompositeIndex * swarm/storage/localstore: add TestModeSyncing * swarm/storage/localstore: fix test name * swarm/storage/localstore: add TestModeUpload * swarm/storage/localstore: add TestModeRequest * swarm/storage/localstore: add TestModeSynced * swarm/storage/localstore: add TestModeAccess * swarm/storage/localstore: add TestModeRemoval * swarm/storage/localstore: add mock store option for chunk data * swarm/storage/localstore: add TestDB_pullIndex * swarm/storage/localstore: add TestDB_gcIndex * swarm/storage/localstore: change how batches are written * swarm/storage/localstore: add updateOnAccess function * swarm/storage/localhost: add DB.gcSize * swarm/storage/localstore: update comments * swarm/storage/localstore: add BenchmarkNew * swarm/storage/localstore: add retrieval tests benchmarks * swarm/storage/localstore: accessors redesign * swarm/storage/localstore: add semaphore for updateGC goroutine * swarm/storage/localstore: implement basic garbage collection * swarm/storage/localstore: optimize collectGarbage * swarm/storage/localstore: add more garbage collection tests cases * swarm/shed, swarm/storage/localstore: rename IndexItem to Item * swarm/shed: add Index.CountFrom * swarm/storage/localstore: persist gcSize * swarm/storage/localstore: remove composite retrieval index * swarm/shed: IterateWithPrefix and IterateWithPrefixFrom Index functions * swarm/storage/localstore: writeGCSize function with leveldb batch * swarm/storage/localstore: unexport modeSetRemove * swarm/storage/localstore: update writeGCSizeWorker comment * swarm/storage/localstore: add triggerGarbageCollection function * swarm/storage/localstore: call 
writeGCSize on DB Close * swarm/storage/localstore: additional comment in writeGCSizeWorker * swarm/storage/localstore: add MetricsPrefix option * swarm/storage/localstore: fix a typo * swamr/shed: only one Index Iterate function * swarm/storage/localstore: use shed Iterate function * swarm/shed: pass a new byte slice copy to index decode functions * swarm/storage/localstore: implement feed subscriptions * swarm/storage/localstore: add more subscriptions tests * swarm/storage/localsore: add parallel upload test * swarm/storage/localstore: use storage.MaxPO in subscription tests * swarm/storage/localstore: subscription of addresses instead chunks * swarm/storage/localstore: lock item address in collectGarbage iterator * swarm/storage/localstore: fix TestSubscribePull to include MaxPO * swarm/storage/localstore: improve subscriptions * swarm/storage/localstore: add TestDB_SubscribePull_sinceAndUntil test * swarm/storage/localstore: adjust pull sync tests * swarm/storage/localstore: remove writeGCSizeDelay and use literal * swarm/storage/localstore: adjust subscriptions tests delays and comments * swarm/storage/localstore: add godoc package overview * swarm/storage/localstore: fix a typo * swarm/storage/localstore: update package overview * swarm/storage/localstore: remove repeated index change * swarm/storage/localstore: rename ChunkInfo to ChunkDescriptor * swarm/storage/localstore: add comment in collectGarbageWorker * swarm/storage/localstore: replace atomics with mutexes for gcSize and tests * swarm/storage/localstore: protect addrs map in pull subs tests * swarm/storage/localstore: protect slices in push subs test * swarm/storage/localstore: protect chunks in TestModePutUpload_parallel * swarm/storage/localstore: fix a race in TestDB_updateGCSem defers * swarm/storage/localstore: remove parallel flag from tests * swarm/storage/localstore: fix a race in testDB_collectGarbageWorker * swarm/storage/localstore: remove unused code * swarm/storage/localstore: add more 
context to pull sub log messages * swarm/storage/localstore: BenchmarkPutUpload and global lock option * swarm/storage/localstore: pre-generate chunks in BenchmarkPutUpload * swarm/storage/localstore: correct useGlobalLock in collectGarbage * swarm/storage/localstore: fix typos and update comments * swarm/storage/localstore: update writeGCSize comment * swarm/storage/localstore: global batch write lock * swarm/storage/localstore: remove global lock option * swarm/storage/localstore: simplify DB.Close
176 lines
5.1 KiB
Go
176 lines
5.1 KiB
Go
// Copyright 2018 The go-ethereum Authors
|
|
// This file is part of the go-ethereum library.
|
|
//
|
|
// The go-ethereum library is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU Lesser General Public License as published by
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
// (at your option) any later version.
|
|
//
|
|
// The go-ethereum library is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU Lesser General Public License for more details.
|
|
//
|
|
// You should have received a copy of the GNU Lesser General Public License
|
|
// along with the go-ethereum library. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
package localstore
|
|
|
|
import (
|
|
"github.com/ethereum/go-ethereum/log"
|
|
"github.com/ethereum/go-ethereum/swarm/shed"
|
|
"github.com/syndtr/goleveldb/leveldb"
|
|
)
|
|
|
|
var (
	// gcBatchSize is the maximal number of chunks that are
	// removed with a single leveldb batch in one garbage
	// collection run.
	gcBatchSize uint64 = 1000
	// gcTargetRatio is the fraction of the database capacity
	// that is left in the garbage collection index after
	// a garbage collection run. The absolute number of items
	// to keep is calculated from it by the gcTarget function.
	// This value must be in range (0,1]. With 0.9, for example,
	// garbage collection leaves 90% of the defined capacity
	// in the database, which prevents frequent garbage
	// collection runs.
	gcTargetRatio = 0.9
)
|
|
|
|
// collectGarbageWorker is a long running function that waits for
|
|
// collectGarbageTrigger channel to signal a garbage collection
|
|
// run. GC run iterates on gcIndex and removes older items
|
|
// form retrieval and other indexes.
|
|
func (db *DB) collectGarbageWorker() {
|
|
defer close(db.collectGarbageWorkerDone)
|
|
|
|
for {
|
|
select {
|
|
case <-db.collectGarbageTrigger:
|
|
// run a single collect garbage run and
|
|
// if done is false, gcBatchSize is reached and
|
|
// another collect garbage run is needed
|
|
collectedCount, done, err := db.collectGarbage()
|
|
if err != nil {
|
|
log.Error("localstore collect garbage", "err", err)
|
|
}
|
|
// check if another gc run is needed
|
|
if !done {
|
|
db.triggerGarbageCollection()
|
|
}
|
|
|
|
if collectedCount > 0 && testHookCollectGarbage != nil {
|
|
testHookCollectGarbage(collectedCount)
|
|
}
|
|
case <-db.close:
|
|
return
|
|
}
|
|
}
|
|
}
|
|
|
|
// collectGarbage removes chunks from retrieval and other
|
|
// indexes if maximal number of chunks in database is reached.
|
|
// This function returns the number of removed chunks. If done
|
|
// is false, another call to this function is needed to collect
|
|
// the rest of the garbage as the batch size limit is reached.
|
|
// This function is called in collectGarbageWorker.
|
|
func (db *DB) collectGarbage() (collectedCount uint64, done bool, err error) {
|
|
batch := new(leveldb.Batch)
|
|
target := db.gcTarget()
|
|
|
|
// protect database from changing idexes and gcSize
|
|
db.batchMu.Lock()
|
|
defer db.batchMu.Unlock()
|
|
|
|
gcSize, err := db.gcSize.Get()
|
|
if err != nil {
|
|
return 0, true, err
|
|
}
|
|
|
|
done = true
|
|
err = db.gcIndex.Iterate(func(item shed.Item) (stop bool, err error) {
|
|
if gcSize-collectedCount <= target {
|
|
return true, nil
|
|
}
|
|
// delete from retrieve, pull, gc
|
|
db.retrievalDataIndex.DeleteInBatch(batch, item)
|
|
db.retrievalAccessIndex.DeleteInBatch(batch, item)
|
|
db.pullIndex.DeleteInBatch(batch, item)
|
|
db.gcIndex.DeleteInBatch(batch, item)
|
|
collectedCount++
|
|
if collectedCount >= gcBatchSize {
|
|
// bach size limit reached,
|
|
// another gc run is needed
|
|
done = false
|
|
return true, nil
|
|
}
|
|
return false, nil
|
|
}, nil)
|
|
if err != nil {
|
|
return 0, false, err
|
|
}
|
|
|
|
db.gcSize.PutInBatch(batch, gcSize-collectedCount)
|
|
|
|
err = db.shed.WriteBatch(batch)
|
|
if err != nil {
|
|
return 0, false, err
|
|
}
|
|
return collectedCount, done, nil
|
|
}
|
|
|
|
// gcTrigger retruns the absolute value for garbage collection
|
|
// target value, calculated from db.capacity and gcTargetRatio.
|
|
func (db *DB) gcTarget() (target uint64) {
|
|
return uint64(float64(db.capacity) * gcTargetRatio)
|
|
}
|
|
|
|
// triggerGarbageCollection signals collectGarbageWorker
|
|
// to call collectGarbage.
|
|
func (db *DB) triggerGarbageCollection() {
|
|
select {
|
|
case db.collectGarbageTrigger <- struct{}{}:
|
|
case <-db.close:
|
|
default:
|
|
}
|
|
}
|
|
|
|
// incGCSizeInBatch changes gcSize field value
|
|
// by change which can be negative. This function
|
|
// must be called under batchMu lock.
|
|
func (db *DB) incGCSizeInBatch(batch *leveldb.Batch, change int64) (err error) {
|
|
if change == 0 {
|
|
return nil
|
|
}
|
|
gcSize, err := db.gcSize.Get()
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
var new uint64
|
|
if change > 0 {
|
|
new = gcSize + uint64(change)
|
|
} else {
|
|
// 'change' is an int64 and is negative
|
|
// a conversion is needed with correct sign
|
|
c := uint64(-change)
|
|
if c > gcSize {
|
|
// protect uint64 undeflow
|
|
return nil
|
|
}
|
|
new = gcSize - c
|
|
}
|
|
db.gcSize.PutInBatch(batch, new)
|
|
|
|
// trigger garbage collection if we reached the capacity
|
|
if new >= db.capacity {
|
|
db.triggerGarbageCollection()
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// testHookCollectGarbage is a hook that can provide
// information when a garbage collection run is done
// and how many items it removed. It is nil unless set.
// When it is not nil, collectGarbageWorker calls it after
// every run that removed at least one item, passing
// the number of removed items.
var testHookCollectGarbage func(collectedCount uint64)
|