2020-09-16 03:20:48 +00:00
|
|
|
package main
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"fmt"
|
2020-11-01 13:03:21 +00:00
|
|
|
"io"
|
2020-09-16 03:20:48 +00:00
|
|
|
|
|
|
|
"github.com/filecoin-project/go-state-types/abi"
|
|
|
|
"github.com/ipfs/bbloom"
|
|
|
|
"github.com/ipfs/go-cid"
|
|
|
|
"github.com/urfave/cli/v2"
|
|
|
|
"golang.org/x/xerrors"
|
2020-11-01 13:03:21 +00:00
|
|
|
|
2021-01-29 20:01:00 +00:00
|
|
|
badgerbs "github.com/filecoin-project/lotus/blockstore/badger"
|
2020-11-01 13:03:21 +00:00
|
|
|
"github.com/filecoin-project/lotus/chain/store"
|
|
|
|
"github.com/filecoin-project/lotus/chain/vm"
|
|
|
|
"github.com/filecoin-project/lotus/extern/sector-storage/ffiwrapper"
|
|
|
|
"github.com/filecoin-project/lotus/node/repo"
|
2020-09-16 03:20:48 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
type cidSet interface {
|
|
|
|
Add(cid.Cid)
|
|
|
|
Has(cid.Cid) bool
|
|
|
|
HasRaw([]byte) bool
|
|
|
|
Len() int
|
|
|
|
}
|
|
|
|
|
|
|
|
type bloomSet struct {
|
|
|
|
bloom *bbloom.Bloom
|
|
|
|
}
|
|
|
|
|
|
|
|
func newBloomSet(size int64) (*bloomSet, error) {
|
|
|
|
b, err := bbloom.New(float64(size), 3)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return &bloomSet{bloom: b}, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bs *bloomSet) Add(c cid.Cid) {
|
|
|
|
bs.bloom.Add(c.Hash())
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bs *bloomSet) Has(c cid.Cid) bool {
|
|
|
|
return bs.bloom.Has(c.Hash())
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bs *bloomSet) HasRaw(b []byte) bool {
|
|
|
|
return bs.bloom.Has(b)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bs *bloomSet) Len() int {
|
|
|
|
return int(bs.bloom.ElementsAdded())
|
|
|
|
}
|
|
|
|
|
|
|
|
// mapSet is an exact cidSet backed by a Go map. It is the default keep-set
// implementation when "use-bloom-set" is not given.
type mapSet struct {
	// m is keyed by the raw multihash bytes (as a string) of each added CID;
	// the empty-struct value carries no data.
	m map[string]struct{}
}
|
|
|
|
|
|
|
|
func newMapSet() *mapSet {
|
|
|
|
return &mapSet{m: make(map[string]struct{})}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bs *mapSet) Add(c cid.Cid) {
|
|
|
|
bs.m[string(c.Hash())] = struct{}{}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bs *mapSet) Has(c cid.Cid) bool {
|
|
|
|
_, ok := bs.m[string(c.Hash())]
|
|
|
|
return ok
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bs *mapSet) HasRaw(b []byte) bool {
|
|
|
|
_, ok := bs.m[string(b)]
|
|
|
|
return ok
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bs *mapSet) Len() int {
|
|
|
|
return len(bs.m)
|
|
|
|
}
|
|
|
|
|
|
|
|
var stateTreePruneCmd = &cli.Command{
|
|
|
|
Name: "state-prune",
|
|
|
|
Description: "Deletes old state root data from local chainstore",
|
|
|
|
Flags: []cli.Flag{
|
|
|
|
&cli.StringFlag{
|
|
|
|
Name: "repo",
|
|
|
|
Value: "~/.lotus",
|
|
|
|
},
|
|
|
|
&cli.Int64Flag{
|
|
|
|
Name: "keep-from-lookback",
|
|
|
|
Usage: "keep stateroots at or newer than the current height minus this lookback",
|
|
|
|
Value: 1800, // 2 x finality
|
|
|
|
},
|
|
|
|
&cli.IntFlag{
|
|
|
|
Name: "delete-up-to",
|
|
|
|
Usage: "delete up to the given number of objects (used to run a faster 'partial' sync)",
|
|
|
|
},
|
|
|
|
&cli.BoolFlag{
|
|
|
|
Name: "use-bloom-set",
|
|
|
|
Usage: "use a bloom filter for the 'good' set instead of a map, reduces memory usage but may not clean up as much",
|
|
|
|
},
|
|
|
|
&cli.BoolFlag{
|
|
|
|
Name: "dry-run",
|
|
|
|
Usage: "only enumerate the good set, don't do any deletions",
|
|
|
|
},
|
|
|
|
&cli.BoolFlag{
|
|
|
|
Name: "only-ds-gc",
|
|
|
|
Usage: "Only run datastore GC",
|
|
|
|
},
|
|
|
|
&cli.IntFlag{
|
|
|
|
Name: "gc-count",
|
|
|
|
Usage: "number of times to run gc",
|
|
|
|
Value: 20,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
Action: func(cctx *cli.Context) error {
|
|
|
|
ctx := context.TODO()
|
|
|
|
|
|
|
|
fsrepo, err := repo.NewFS(cctx.String("repo"))
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
lkrepo, err := fsrepo.Lock(repo.FullNode)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
defer lkrepo.Close() //nolint:errcheck
|
|
|
|
|
2020-12-30 10:04:00 +00:00
|
|
|
bs, err := lkrepo.Blockstore(ctx, repo.BlockstoreChain)
|
2020-09-16 03:20:48 +00:00
|
|
|
if err != nil {
|
2020-11-01 13:03:21 +00:00
|
|
|
return fmt.Errorf("failed to open blockstore: %w", err)
|
2020-09-16 03:20:48 +00:00
|
|
|
}
|
|
|
|
|
2020-11-01 13:03:21 +00:00
|
|
|
defer func() {
|
|
|
|
if c, ok := bs.(io.Closer); ok {
|
|
|
|
if err := c.Close(); err != nil {
|
|
|
|
log.Warnf("failed to close blockstore: %s", err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
|
|
|
|
// After migrating to native blockstores, this has been made
|
|
|
|
// database-specific.
|
|
|
|
badgbs, ok := bs.(*badgerbs.Blockstore)
|
|
|
|
if !ok {
|
|
|
|
return fmt.Errorf("only badger blockstores are supported")
|
|
|
|
}
|
2020-09-16 03:20:48 +00:00
|
|
|
|
2021-01-26 10:25:34 +00:00
|
|
|
mds, err := lkrepo.Datastore(context.Background(), "/metadata")
|
2020-09-16 03:20:48 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2020-10-02 21:38:54 +00:00
|
|
|
defer mds.Close() //nolint:errcheck
|
2020-09-16 03:20:48 +00:00
|
|
|
|
2020-11-01 13:03:21 +00:00
|
|
|
const DiscardRatio = 0.2
|
2020-09-16 03:20:48 +00:00
|
|
|
if cctx.Bool("only-ds-gc") {
|
2020-11-01 13:03:21 +00:00
|
|
|
fmt.Println("running datastore gc....")
|
|
|
|
for i := 0; i < cctx.Int("gc-count"); i++ {
|
|
|
|
if err := badgbs.DB.RunValueLogGC(DiscardRatio); err != nil {
|
|
|
|
return xerrors.Errorf("datastore GC failed: %w", err)
|
2020-09-16 03:20:48 +00:00
|
|
|
}
|
|
|
|
}
|
2020-11-01 13:03:21 +00:00
|
|
|
fmt.Println("gc complete!")
|
|
|
|
return nil
|
2020-09-16 03:20:48 +00:00
|
|
|
}
|
|
|
|
|
2020-11-16 22:22:08 +00:00
|
|
|
cs := store.NewChainStore(bs, bs, mds, vm.Syscalls(ffiwrapper.ProofVerifier), nil)
|
|
|
|
defer cs.Close() //nolint:errcheck
|
|
|
|
|
2020-09-16 03:20:48 +00:00
|
|
|
if err := cs.Load(); err != nil {
|
|
|
|
return fmt.Errorf("loading chainstore: %w", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
var goodSet cidSet
|
|
|
|
if cctx.Bool("use-bloom-set") {
|
|
|
|
bset, err := newBloomSet(10000000)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
goodSet = bset
|
|
|
|
} else {
|
|
|
|
goodSet = newMapSet()
|
|
|
|
}
|
|
|
|
|
|
|
|
ts := cs.GetHeaviestTipSet()
|
|
|
|
|
|
|
|
rrLb := abi.ChainEpoch(cctx.Int64("keep-from-lookback"))
|
|
|
|
|
|
|
|
if err := cs.WalkSnapshot(ctx, ts, rrLb, true, func(c cid.Cid) error {
|
|
|
|
if goodSet.Len()%20 == 0 {
|
|
|
|
fmt.Printf("\renumerating keep set: %d ", goodSet.Len())
|
|
|
|
}
|
|
|
|
goodSet.Add(c)
|
|
|
|
return nil
|
|
|
|
}); err != nil {
|
|
|
|
return fmt.Errorf("snapshot walk failed: %w", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
fmt.Println()
|
2020-10-02 21:38:54 +00:00
|
|
|
fmt.Printf("Successfully marked keep set! (%d objects)\n", goodSet.Len())
|
2020-09-16 03:20:48 +00:00
|
|
|
|
|
|
|
if cctx.Bool("dry-run") {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2020-11-01 13:03:21 +00:00
|
|
|
b := badgbs.DB.NewWriteBatch()
|
|
|
|
defer b.Cancel()
|
2020-09-16 03:20:48 +00:00
|
|
|
|
2020-11-01 13:03:21 +00:00
|
|
|
markForRemoval := func(c cid.Cid) error {
|
2020-11-02 13:32:07 +00:00
|
|
|
return b.Delete(badgbs.StorageKey(nil, c))
|
2020-09-16 03:20:48 +00:00
|
|
|
}
|
|
|
|
|
2020-11-01 13:03:21 +00:00
|
|
|
keys, err := bs.AllKeysChan(context.Background())
|
2020-09-16 03:20:48 +00:00
|
|
|
if err != nil {
|
2020-11-01 13:03:21 +00:00
|
|
|
return xerrors.Errorf("failed to query blockstore: %w", err)
|
2020-09-16 03:20:48 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
dupTo := cctx.Int("delete-up-to")
|
|
|
|
|
|
|
|
var deleteCount int
|
|
|
|
var goodHits int
|
2020-11-01 13:03:21 +00:00
|
|
|
for k := range keys {
|
|
|
|
if goodSet.HasRaw(k.Bytes()) {
|
2020-09-16 03:20:48 +00:00
|
|
|
goodHits++
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
2020-11-01 13:03:21 +00:00
|
|
|
if err := markForRemoval(k); err != nil {
|
|
|
|
return fmt.Errorf("failed to remove cid %s: %w", k, err)
|
2020-09-16 03:20:48 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if deleteCount%20 == 0 {
|
|
|
|
fmt.Printf("\rdeleting %d objects (good hits: %d)... ", deleteCount, goodHits)
|
|
|
|
}
|
|
|
|
|
|
|
|
if dupTo != 0 && deleteCount > dupTo {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-11-01 13:03:21 +00:00
|
|
|
if err := b.Flush(); err != nil {
|
|
|
|
return xerrors.Errorf("failed to flush final batch delete: %w", err)
|
2020-09-16 03:20:48 +00:00
|
|
|
}
|
|
|
|
|
2020-11-01 13:03:21 +00:00
|
|
|
fmt.Println("running datastore gc....")
|
|
|
|
for i := 0; i < cctx.Int("gc-count"); i++ {
|
|
|
|
if err := badgbs.DB.RunValueLogGC(DiscardRatio); err != nil {
|
|
|
|
return xerrors.Errorf("datastore GC failed: %w", err)
|
2020-09-16 03:20:48 +00:00
|
|
|
}
|
|
|
|
}
|
2020-11-01 13:03:21 +00:00
|
|
|
fmt.Println("gc complete!")
|
2020-09-16 03:20:48 +00:00
|
|
|
|
|
|
|
return nil
|
|
|
|
},
|
|
|
|
}
|