package main

import (
	"bytes"
	"context"
	"encoding/json"
	"fmt"
	"io"
	"path"
	"reflect"
	"sort"
	"sync"

	"github.com/docker/go-units"
	lru "github.com/hashicorp/golang-lru/v2"
	"github.com/ipfs/boxo/blockservice"
	offline "github.com/ipfs/boxo/exchange/offline"
	"github.com/ipfs/boxo/ipld/merkledag"
	"github.com/ipfs/go-cid"
	format "github.com/ipfs/go-ipld-format"
	"github.com/urfave/cli/v2"
	"golang.org/x/sync/errgroup"
	"golang.org/x/xerrors"

	"github.com/filecoin-project/go-address"
	"github.com/filecoin-project/go-state-types/abi"
	gstactors "github.com/filecoin-project/go-state-types/actors"
	"github.com/filecoin-project/go-state-types/network"

	"github.com/filecoin-project/lotus/api"
	"github.com/filecoin-project/lotus/blockstore"
	"github.com/filecoin-project/lotus/chain/actors"
	"github.com/filecoin-project/lotus/chain/actors/builtin"
	"github.com/filecoin-project/lotus/chain/consensus"
	"github.com/filecoin-project/lotus/chain/consensus/filcns"
	"github.com/filecoin-project/lotus/chain/index"
	"github.com/filecoin-project/lotus/chain/stmgr"
	"github.com/filecoin-project/lotus/chain/store"
	"github.com/filecoin-project/lotus/chain/types"
	"github.com/filecoin-project/lotus/chain/vm"
	lcli "github.com/filecoin-project/lotus/cli"
	"github.com/filecoin-project/lotus/node/repo"
	"github.com/filecoin-project/lotus/storage/sealer/ffiwrapper"
)
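
// actorStats ties an actor's address and header to the DAG stats collected for
// its state as a whole and for each of its top level fields.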
type actorStats struct {
	Address address.Address
	Actor   *types.Actor
	Fields  []fieldItem
	Stats   api.ObjStat
}
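
// fieldItem records the DAG stats for a single CID field of an actor's state object.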
type fieldItem struct {
	Name  string
	Cid   cid.Cid
	Stats api.ObjStat
}
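
// job is a unit of work for the snapshot pipeline: a CID to walk and the
// summary key under which its stats should be recorded.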
type job struct {
	c   cid.Cid
	key string // prefix path for the region being recorded i.e. "/state/mineractor"
}
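
// cidCall asks the shared cid set goroutine whether a CID has been seen before;
// the answer is delivered on resp.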
type cidCall struct {
	c    cid.Cid
	resp chan bool
}
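
// result carries the stats collected for one summary key back to the aggregator.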
type result struct {
	key   string
	stats api.ObjStat
}
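
// cacheNodeGetter wraps a format.NodeGetter with a 2Q LRU cache to avoid
// repeatedly fetching and decoding the same IPLD nodes.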
type cacheNodeGetter struct {
	ds    format.NodeGetter
	cache *lru.TwoQueueCache[cid.Cid, format.Node]
}
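
// newCacheNodeGetter wraps d with an LRU cache holding up to size nodes.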
func newCacheNodeGetter(d format.NodeGetter, size int) (*cacheNodeGetter, error) {
	cng := &cacheNodeGetter{ds: d}

	cache, err := lru.New2Q[cid.Cid, format.Node](size)
	if err != nil {
		return nil, err
	}

	cng.cache = cache

	return cng, nil
}
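
// Get returns the node for c, serving it from the cache when possible and
// caching it after a fetch from the underlying getter.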
func (cng *cacheNodeGetter) Get(ctx context.Context, c cid.Cid) (format.Node, error) {
	if n, ok := cng.cache.Get(c); ok {
		return n, nil
	}

	n, err := cng.ds.Get(ctx, c)
	if err != nil {
		return nil, err
	}

	cng.cache.Add(c, n)

	return n, nil
}
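
// GetMany fetches the listed nodes one by one through the cache and streams the
// results on the returned channel.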
func (cng *cacheNodeGetter) GetMany(ctx context.Context, list []cid.Cid) <-chan *format.NodeOption {
	out := make(chan *format.NodeOption, len(list))
	go func() {
		for _, c := range list {
			n, err := cng.Get(ctx, c)
			if err != nil {
				out <- &format.NodeOption{Err: err}
				continue
			}

			out <- &format.NodeOption{Node: n}
		}
	}()

	return out
}
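
// dagStatCollector accumulates the total size and block count of every node
// visited during a DAG walk.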
type dagStatCollector struct {
	ds   format.NodeGetter
	walk func(format.Node) ([]*format.Link, error)

	statsLk sync.Mutex
	stats   api.ObjStat
}
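
// record adds nd's serialized size to the running total and counts it as one visited block.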
func (dsc *dagStatCollector) record(ctx context.Context, nd format.Node) error {
	size, err := nd.Size()
	if err != nil {
		return err
	}

	dsc.statsLk.Lock()
	defer dsc.statsLk.Unlock()

	dsc.stats.Size = dsc.stats.Size + size
	dsc.stats.Links = dsc.stats.Links + 1

	return nil
}
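
// walkLinks records the node behind c and returns its outgoing links, making it
// usable as the link-fetching callback of merkledag.Walk.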
func (dsc *dagStatCollector) walkLinks(ctx context.Context, c cid.Cid) ([]*format.Link, error) {
	nd, err := dsc.ds.Get(ctx, c)
	if err != nil {
		return nil, err
	}

	if err := dsc.record(ctx, nd); err != nil {
		return nil, err
	}

	return dsc.walk(nd)
}
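
// ChainStoreTipSetResolver implements the tipset lookup methods that
// lcli.LoadTipSet needs, backed directly by a local ChainStore.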
type ChainStoreTipSetResolver struct {
	Chain *store.ChainStore
}

func (tsr *ChainStoreTipSetResolver) ChainHead(ctx context.Context) (*types.TipSet, error) {
	return tsr.Chain.GetHeaviestTipSet(), nil
}

func (tsr *ChainStoreTipSetResolver) ChainGetTipSetByHeight(ctx context.Context, h abi.ChainEpoch, tsk types.TipSetKey) (*types.TipSet, error) {
	ts, err := tsr.Chain.GetTipSetFromKey(ctx, tsk)
	if err != nil {
		return nil, xerrors.Errorf("loading tipset %s: %w", tsk, err)
	}
	return tsr.Chain.GetTipsetByHeight(ctx, h, ts, true)
}

func (tsr *ChainStoreTipSetResolver) ChainGetTipSet(ctx context.Context, tsk types.TipSetKey) (*types.TipSet, error) {
	return tsr.Chain.LoadTipSet(ctx, tsk)
}

var statObjCmd = &cli.Command{
	Name:  "stat-obj",
	Usage: "calculates the size of any DAG in the blockstore",
	Flags: []cli.Flag{},
	Action: func(cctx *cli.Context) error {
		ctx := lcli.ReqContext(cctx)

		c, err := cid.Parse(cctx.Args().First())
		if err != nil {
			return err
		}

		h, err := loadChainStore(ctx, cctx.String("repo"))
		if err != nil {
			return err
		}
		defer h.closer()

		dag := merkledag.NewDAGService(blockservice.New(h.bs, offline.Exchange(h.bs)))
		dsc := &dagStatCollector{
			ds:   dag,
			walk: carWalkFunc,
		}

		if err := merkledag.Walk(ctx, dsc.walkLinks, c, cid.NewSet().Visit, merkledag.Concurrent()); err != nil {
			return err
		}

		return DumpJSON(dsc.stats)
	},
}
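
// StoreHandle bundles the open blockstore, chain store, and state manager for a
// local lotus repo, along with a closer that releases the underlying resources.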
type StoreHandle struct {
	bs     blockstore.Blockstore
	cs     *store.ChainStore
	sm     *stmgr.StateManager
	closer func()
}
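
// loadChainStore locks the lotus repo at repoPath and wires up the blockstore,
// chain store, and state manager needed to walk chain state offline.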
func loadChainStore(ctx context.Context, repoPath string) (*StoreHandle, error) {
	r, err := repo.NewFS(repoPath)
	if err != nil {
		return nil, xerrors.Errorf("opening fs repo: %w", err)
	}

	exists, err := r.Exists()
	if err != nil {
		return nil, err
	}
	if !exists {
		return nil, xerrors.Errorf("lotus repo doesn't exist")
	}

	lr, err := r.Lock(repo.FullNode)
	if err != nil {
		return nil, err
	}

	bs, err := lr.Blockstore(ctx, repo.UniversalBlockstore)
	if err != nil {
		return nil, fmt.Errorf("failed to open blockstore: %w", err)
	}

	closer := func() {
		if err := lr.Close(); err != nil {
			log.Warnf("failed to close locked repo: %s", err)
		}
		if c, ok := bs.(io.Closer); ok {
			if err := c.Close(); err != nil {
				log.Warnf("failed to close blockstore: %s", err)
			}
		}
	}

	mds, err := lr.Datastore(context.Background(), "/metadata")
	if err != nil {
		return nil, err
	}

	cs := store.NewChainStore(bs, bs, mds, nil, nil)
	if err := cs.Load(ctx); err != nil {
		return nil, fmt.Errorf("failed to load chain store: %w", err)
	}

	tsExec := consensus.NewTipSetExecutor(filcns.RewardFunc)
	sm, err := stmgr.NewStateManager(cs, tsExec, vm.Syscalls(ffiwrapper.ProofVerifier), filcns.DefaultUpgradeSchedule(), nil, mds, index.DummyMsgIndex)
	if err != nil {
		return nil, fmt.Errorf("failed to open state manager: %w", err)
	}
	handle := StoreHandle{
		bs:     bs,
		sm:     sm,
		cs:     cs,
		closer: closer,
	}

	return &handle, nil
}
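
// pipeline runs a fan-out/fan-in flow: createJobs feeds jobCh, numWorkers copies
// of worker drain jobCh and emit to resultCh, and processResults consumes
// resultCh. The result channel is closed once every producer has finished, and
// the first error encountered is returned.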
func pipeline(ctx context.Context, name string, numWorkers int, createJobs func(ctx context.Context, jobCh chan job, resultCh chan result) error,
	worker func(ctx context.Context, id int, jobCh chan job, resultCh chan result) error,
	processResults func(ctx context.Context, resultCh chan result) error) error {

	eg, egctx := errgroup.WithContext(ctx)
	jobCh := make(chan job, numWorkers)
	resultCh := make(chan result)
	var resultWriterWg sync.WaitGroup

	resultWriterWg.Add(1)
	eg.Go(func() error {
		defer resultWriterWg.Done()
		defer func() {
			close(jobCh)
		}()
		return createJobs(ctx, jobCh, resultCh)
	})

	for w := 0; w < numWorkers; w++ {
		id := w // capture the worker id for the closure below

		resultWriterWg.Add(1)
		eg.Go(func() error {
			defer resultWriterWg.Done()
			return worker(egctx, id, jobCh, resultCh)
		})
	}

	eg.Go(func() error {
		return processResults(ctx, resultCh)
	})

	// close result channel when workers are done sending to it.
	eg.Go(func() error {
		resultWriterWg.Wait()
		close(resultCh)
		return nil
	})

	if err := eg.Wait(); err != nil {
		return fmt.Errorf("failed pipeline %s: %w", name, err)
	}
	return nil
}
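
// statSnapshotCmd summarizes how much space a lightweight snapshot of the given
// tipset would occupy, broken down by category and by actor type.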
var statSnapshotCmd = &cli.Command{
	Name:  "stat-snapshot",
	Usage: "calculates the space usage of a snapshot taken from the given tipset",
	Description: `Walk the chain as far back as a lightweight snapshot would reach and break down space usage into high level
categories: headers, messages, receipts, latest state root, and churn from earlier state roots.
State root and churn space is further broken down by actor type and immediate top level fields.
`,
	Flags: []cli.Flag{
		&cli.StringFlag{
			Name:  "tipset",
			Usage: "specify tipset to call method on (pass comma separated array of cids)",
		},
		&cli.IntFlag{
			Name:  "workers",
			Usage: "number of workers to use when processing",
			Value: 10,
		},
		&cli.IntFlag{
			Name:  "dag-cache-size",
			Usage: "cache size per worker (setting to 0 disables)",
			Value: 8092,
		},
		&cli.BoolFlag{
			Name:  "pretty",
			Usage: "print formatted output instead of ldjson",
			Value: false,
		},
	},
	Action: func(cctx *cli.Context) error {
		ctx := lcli.ReqContext(cctx)
		h, err := loadChainStore(ctx, cctx.String("repo"))
		if err != nil {
			return err
		}
		defer h.closer()

		tsr := &ChainStoreTipSetResolver{
			Chain: h.cs,
		}

		ts, err := lcli.LoadTipSet(ctx, cctx, tsr)
		if err != nil {
			return err
		}

		numWorkers := cctx.Int("workers")
		dagCacheSize := cctx.Int("dag-cache-size")

		cidCh := make(chan cidCall, numWorkers)
		summary := make(map[string]api.ObjStat)
		// snapshot root objects with no additional bytes or links
		summary["/"] = api.ObjStat{Size: 0, Links: 0}
		summary["/statetree"] = api.ObjStat{Size: 0, Links: 0}

		combine := func(statsA, statsB api.ObjStat) api.ObjStat {
			return api.ObjStat{
				Size:  statsA.Size + statsB.Size,
				Links: statsA.Links + statsB.Links,
			}
		}

		// Threadsafe cid set lives across different pipelines so not part of error group
		go func() {
			seen := cid.NewSet()
			for {
				select {
				case call := <-cidCh:
					call.resp <- seen.Visit(call.c)
				case <-ctx.Done():
					log.Infof("shutting down cid set goroutine: %s", ctx.Err())
					return
				}
			}
		}()
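
		// visit funnels every CID check through the shared cid set goroutine so
		// walks running in different workers and stages dedupe against one set.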
		visit := func(c cid.Cid) bool {
			ch := make(chan bool)
			cidCh <- cidCall{c: c, resp: ch}
			out := <-ch
			return out
		}

		// Stage 1 walk all actors in latest state root
		createJobsStage1 := func(ctx context.Context, jobCh chan job, _ chan result) error {
			st, err := h.sm.StateTree(ts.ParentState())
			if err != nil {
				return err
			}

			return st.ForEach(func(_ address.Address, act *types.Actor) error {
				actType := builtin.ActorNameByCode(act.Code)
				actType = path.Base(actType) // strip away fil/<nv>
				if actType == "<unknown>" {
					actType = act.Code.String()
				}
				jobCh <- job{c: act.Head, key: fmt.Sprintf("/statetree/latest/%s", actType)}

				return nil
			})
		}
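
		// worker is shared by every stage: it walks each job's DAG (through the
		// per-worker node cache when enabled) and forwards the collected stats.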
		worker := func(ctx context.Context, id int, jobCh chan job, resultCh chan result) error {
			var dag format.NodeGetter = merkledag.NewDAGService(blockservice.New(h.bs, offline.Exchange(h.bs)))
			if dagCacheSize != 0 {
				var err error
				dag, err = newCacheNodeGetter(merkledag.NewDAGService(blockservice.New(h.bs, offline.Exchange(h.bs))), dagCacheSize)
				if err != nil {
					return err
				}
			}

			for job := range jobCh {
				stats, err := collectSnapshotJobStats(ctx, job, dag, visit)
				if err != nil {
					return err
				}
				for _, stat := range stats {
					select {
					case resultCh <- stat:
					case <-ctx.Done():
						return ctx.Err()
					}
				}
			}
			return nil
		}
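
		// processResults folds every per-key stat into the shared summary map.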
		processResults := func(ctx context.Context, resultCh chan result) error {
			for result := range resultCh {
				if stat, ok := summary[result.key]; ok {
					summary[result.key] = combine(stat, result.stats)
				} else {
					summary[result.key] = result.stats
				}
			}
			return nil
		}

		if err := pipeline(ctx, "Latest State Actors", numWorkers, createJobsStage1, worker, processResults); err != nil {
			return err
		}

		// Stage 2: walk the top of the latest state root
		createJobsStage2 := func(ctx context.Context, jobCh chan job, _ chan result) error {
			jobCh <- job{c: ts.ParentState(), key: "/statetree/latest"}
			return nil
		}

		if err := pipeline(ctx, "Latest State HAMT", numWorkers, createJobsStage2, worker, processResults); err != nil {
			return err
		}

		// Stage 3 walk the rest of the chain: headers, messages, churn
		// ordering:
		// for each header send jobs for messages, receipts, state tree churn
		// don't walk header directly as it would just walk everything including parent tipsets

		churnStateRoots := cid.NewSet()
		createJobsStage3 := func(ctx context.Context, jobCh chan job, resultCh chan result) error {
			// walk chain
			var dag format.NodeGetter = merkledag.NewDAGService(blockservice.New(h.bs, offline.Exchange(h.bs)))
			if dagCacheSize != 0 {
				var err error
				dag, err = newCacheNodeGetter(merkledag.NewDAGService(blockservice.New(h.bs, offline.Exchange(h.bs))), dagCacheSize)
				if err != nil {
					return err
				}
			}

			blocksToWalk := ts.Cids()
			startHeight := ts.Height()
			snapshotStateLimit := abi.ChainEpoch(2000)

			churnActorCache := cid.NewSet()
			blocksTracked := cid.NewSet()
			for len(blocksToWalk) > 0 {
				blkCid := blocksToWalk[0]
				blocksToWalk = blocksToWalk[1:]
				nd, err := dag.Get(ctx, blkCid)
				if err != nil {
					return xerrors.Errorf("getting block: %w", err)
				}

				var b types.BlockHeader
				if err := b.UnmarshalCBOR(bytes.NewBuffer(nd.RawData())); err != nil {
					return xerrors.Errorf("unmarshaling block header (cid=%s): %w", blkCid, err)
				}

				// header directly to result channel
				resultCh <- result{key: "/headers", stats: api.ObjStat{Size: uint64(len(nd.RawData())), Links: uint64(len(nd.Links()))}}
				// message job
				if b.Height > startHeight-snapshotStateLimit {
					jobCh <- job{key: "/messages", c: b.Messages}
				}

				// state churn job
				if b.Height > startHeight-snapshotStateLimit {
					if churnStateRoots.Visit(b.ParentStateRoot) {
						st, err := h.sm.StateTree(b.ParentStateRoot)
						if err != nil {
							return err
						}

						err = st.ForEach(func(_ address.Address, act *types.Actor) error {
							if churnActorCache.Visit(act.Head) {
								actType := builtin.ActorNameByCode(act.Code)
								actType = path.Base(actType) // strip away fil/<nv>
								if actType == "<unknown>" {
									actType = act.Code.String()
								}
								jobCh <- job{c: act.Head, key: fmt.Sprintf("/statetree/churn/%s", actType)}
							}

							return nil
						})
						if err != nil {
							return err
						}
					}
				}
				for _, blkCid := range b.Parents {
					if blocksTracked.Visit(blkCid) && b.Height != 0 {
						blocksToWalk = append(blocksToWalk, blkCid)
					}
				}
			}
			return nil
		}

		if err := pipeline(ctx, "Churn, Headers, Messages", numWorkers, createJobsStage3, worker, processResults); err != nil {
			return err
		}

		// TODO: clean things up and get a nice abstraction to reuse
		// Stage 4 walk all actor HAMTs for churn

		createJobsStage4 := func(ctx context.Context, jobCh chan job, _ chan result) error {
			return churnStateRoots.ForEach(func(c cid.Cid) error {
				jobCh <- job{c: c, key: "/statetree/churn"}
				return nil
			})
		}

		if err := pipeline(ctx, "Churn HAMT", numWorkers, createJobsStage4, worker, processResults); err != nil {
			return err
		}

		if cctx.Bool("pretty") {
			DumpSnapshotStats(summary)
		} else {
			if err := DumpJSON(summary); err != nil {
				return err
			}
		}

		return nil
	},
}
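
// statActorCmd reports the size of one or more actors' state DAGs, with a
// per-field breakdown for each actor.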
var statActorCmd = &cli.Command{
	Name:  "stat-actor",
	Usage: "calculates the size of actors and their immediate structures",
	Description: `Any DAG linked by the actor object (field) will have its size calculated independently of all
other linked DAGs. If an actor has two fields containing links to the same DAG the structure size will be counted
twice, included in each field's size individually.

The top level stats reported for an actor are computed independently of all fields and are a more accurate
accounting of the true size of the actor in the state datastore.

The calculation of these stats results in the actor state being traversed twice. The dag-cache-size flag can be used
to reduce the number of decode operations performed by caching the decoded object after first access.`,
	Flags: []cli.Flag{
		&cli.StringFlag{
			Name:  "tipset",
			Usage: "specify tipset to call method on (pass comma separated array of cids)",
		},
		&cli.IntFlag{
			Name:  "workers",
			Usage: "number of workers to use when processing",
			Value: 10,
		},
		&cli.IntFlag{
			Name:  "dag-cache-size",
			Usage: "cache size per worker (setting to 0 disables)",
			Value: 8092,
		},
		&cli.BoolFlag{
			Name:  "all",
			Usage: "process all actors in stateroot of tipset",
			Value: false,
		},
		&cli.BoolFlag{
			Name:  "pretty",
			Usage: "print formatted output instead of ldjson",
			Value: false,
		},
	},
	Action: func(cctx *cli.Context) error {
		ctx := lcli.ReqContext(cctx)

		var addrs []address.Address

		if !cctx.Bool("all") {
			for _, a := range cctx.Args().Slice() {
				addr, err := address.NewFromString(a)
				if err != nil {
					return err
				}

				addrs = append(addrs, addr)
			}
		}
		h, err := loadChainStore(ctx, cctx.String("repo"))
		if err != nil {
			return err
		}
		defer h.closer()

		tsr := &ChainStoreTipSetResolver{
			Chain: h.cs,
		}

		ts, err := lcli.LoadTipSet(ctx, cctx, tsr)
		if err != nil {
			return err
		}

		log.Infow("tipset", "parentstate", ts.ParentState())

		if len(addrs) == 0 && cctx.Bool("all") {
			var err error
			addrs, err = h.sm.ListAllActors(ctx, ts)
			if err != nil {
				return err
			}
		}

		numWorkers := cctx.Int("workers")
		dagCacheSize := cctx.Int("dag-cache-size")

		eg, egctx := errgroup.WithContext(ctx)

		jobs := make(chan address.Address, numWorkers)
		results := make(chan actorStats, numWorkers)
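
		// worker loads each actor from the queue, collects DAG stats for its head
		// and fields, and sends the per-actor summary to the results channel.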
		worker := func(ctx context.Context, id int) error {
			completed := 0
			defer func() {
				log.Infow("worker done", "id", id, "completed", completed)
			}()

			for {
				select {
				case addr, ok := <-jobs:
					if !ok {
						return nil
					}

					actor, err := h.sm.LoadActor(ctx, addr, ts)
					if err != nil {
						return err
					}

					var dag format.NodeGetter = merkledag.NewDAGService(blockservice.New(h.bs, offline.Exchange(h.bs)))
					if dagCacheSize != 0 {
						var err error
						dag, err = newCacheNodeGetter(merkledag.NewDAGService(blockservice.New(h.bs, offline.Exchange(h.bs))), dagCacheSize)
						if err != nil {
							return err
						}
					}

					actStats, err := collectStats(ctx, addr, actor, dag)
					if err != nil {
						return err
					}

					select {
					case results <- actStats:
					case <-ctx.Done():
						return ctx.Err()
					}
				case <-ctx.Done():
					return ctx.Err()
				}

				completed = completed + 1
			}
		}
		for w := 0; w < numWorkers; w++ {
			id := w
			eg.Go(func() error {
				return worker(egctx, id)
			})
		}

		go func() {
			defer close(jobs)
			for _, addr := range addrs {
				jobs <- addr
			}
		}()

		go func() {
			// error is checked later
			eg.Wait() //nolint:errcheck
			close(results)
		}()

		for {
			select {
			case result, ok := <-results:
				if !ok {
					return eg.Wait()
				}

				if cctx.Bool("pretty") {
					DumpStats(result)
				} else {
					if err := DumpJSON(result); err != nil {
						return err
					}
				}
			case <-ctx.Done():
				return ctx.Err()
			}
		}
	},
}
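
// collectSnapshotJobStats walks the DAG for a snapshot job. Plain regions are
// reported as a single result under the job's key; jobs whose key sits under
// /statetree/latest or /statetree/churn are treated as actor heads and are
// additionally broken into one result per CID field of the decoded actor state.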
func collectSnapshotJobStats(ctx context.Context, in job, dag format.NodeGetter, visit func(c cid.Cid) bool) ([]result, error) {
	// only keys under "/statetree/latest" and "/statetree/churn" get a further breakdown by actor type
	if !(path.Dir(in.key) == "/statetree/latest") && !(path.Dir(in.key) == "/statetree/churn") {
		dsc := &dagStatCollector{
			ds:   dag,
			walk: carWalkFunc,
		}

		if err := merkledag.Walk(ctx, dsc.walkLinks, in.c, visit, merkledag.Concurrent()); err != nil {
			return nil, err
		}
		return []result{{key: in.key, stats: dsc.stats}}, nil
	}

	// in.c is an actor head cid, try to unmarshal and create sub keys for different regions of state
	nd, err := dag.Get(ctx, in.c)
	if err != nil {
		return nil, err
	}
	subjobs := make([]job, 0)
	results := make([]result, 0)

	// reconstruct actor for state parsing from key
	av, err := gstactors.VersionForNetwork(network.Version20)
	if err != nil {
		return nil, fmt.Errorf("failed to get actors version for network: %w", err)
	}
	code, ok := actors.GetActorCodeID(av, path.Base(in.key))
	if !ok { // try parsing key directly
		code, err = cid.Parse(path.Base(in.key))
		if err != nil {
			log.Debugf("failed to parse actor string: %s", path.Base(in.key))
		}
	}

	actor := types.ActorV5{Head: in.c, Code: code}
	oif, err := vm.DumpActorState(consensus.NewTipSetExecutor(filcns.RewardFunc).NewActorRegistry(), &actor, nd.RawData())
	if err != nil {
		oif = nil
	}
	// Account actors return nil from DumpActorState as they have no state
	if oif != nil {
		v := reflect.Indirect(reflect.ValueOf(oif))
		for i := 0; i < v.NumField(); i++ {
			varName := v.Type().Field(i).Name
			varType := v.Type().Field(i).Type
			varValue := v.Field(i).Interface()

			if varType == reflect.TypeOf(cid.Cid{}) {
				subjobs = append(subjobs, job{
					key: fmt.Sprintf("%s/%s", in.key, varName),
					c:   varValue.(cid.Cid),
				})
			}
		}
	}

	// Walk subfields
	for _, job := range subjobs {
		dsc := &dagStatCollector{
			ds:   dag,
			walk: carWalkFunc,
		}

		if err := merkledag.Walk(ctx, dsc.walkLinks, job.c, visit, merkledag.Concurrent()); err != nil {
			return nil, err
		}
		var res result
		res.key = job.key
		res.stats = dsc.stats

		results = append(results, res)
	}

	// now walk the top level object of actor state
	dsc := &dagStatCollector{
		ds:   dag,
		walk: carWalkFunc,
	}

	if err := merkledag.Walk(ctx, dsc.walkLinks, in.c, visit, merkledag.Concurrent()); err != nil {
		return nil, err
	}
	results = append(results, result{key: in.key, stats: dsc.stats})
	return results, nil
}
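
// collectStats walks an actor's entire state DAG to produce its top level stats
// and then walks each CID field found in the decoded state object to produce a
// per-field breakdown.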
func collectStats(ctx context.Context, addr address.Address, actor *types.Actor, dag format.NodeGetter) (actorStats, error) {
	log.Infow("actor", "addr", addr, "code", actor.Code, "name", builtin.ActorNameByCode(actor.Code))

	nd, err := dag.Get(ctx, actor.Head)
	if err != nil {
		return actorStats{}, err
	}

	// When it comes to fvm / evm actors this method of inspecting fields will probably not work
	// and we may only be able to collect stats for the top level object. We might be able to iterate
	// over the top level fields for the actors and identify fields that are CIDs, but it is unclear
	// whether we would be able to identify a field name.

	oif, err := vm.DumpActorState(consensus.NewTipSetExecutor(filcns.RewardFunc).NewActorRegistry(), actor, nd.RawData())
	if err != nil {
		oif = nil
	}

	fields := []fieldItem{}

	// Account actors return nil from DumpActorState as they have no state
	if oif != nil {
		v := reflect.Indirect(reflect.ValueOf(oif))
		for i := 0; i < v.NumField(); i++ {
			varName := v.Type().Field(i).Name
			varType := v.Type().Field(i).Type
			varValue := v.Field(i).Interface()

			if varType == reflect.TypeOf(cid.Cid{}) {
				fields = append(fields, fieldItem{
					Name: varName,
					Cid:  varValue.(cid.Cid),
				})
			}
		}
	}

	actStats := actorStats{
		Address: addr,
		Actor:   actor,
	}

	dsc := &dagStatCollector{
		ds:   dag,
		walk: carWalkFunc,
	}

	if err := merkledag.Walk(ctx, dsc.walkLinks, actor.Head, cid.NewSet().Visit, merkledag.Concurrent()); err != nil {
		return actorStats{}, err
	}

	actStats.Stats = dsc.stats

	for _, field := range fields {
		dsc := &dagStatCollector{
			ds:   dag,
			walk: carWalkFunc,
		}

		if err := merkledag.Walk(ctx, dsc.walkLinks, field.Cid, cid.NewSet().Visit, merkledag.Concurrent()); err != nil {
			return actorStats{}, err
		}

		field.Stats = dsc.stats

		actStats.Fields = append(actStats.Fields, field)
	}

	return actStats, nil
}
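
// DumpJSON prints i as a single line of JSON on stdout.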
func DumpJSON(i interface{}) error {
	bs, err := json.Marshal(i)
	if err != nil {
		return err
	}

	fmt.Println(string(bs))

	return nil
}
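
// DumpStats pretty-prints one actor's header info followed by a table of the
// size and block count of its state and of each top level field.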
func DumpStats(actStats actorStats) {
	strtype := builtin.ActorNameByCode(actStats.Actor.Code)
	fmt.Printf("Address:\t%s\n", actStats.Address)
	fmt.Printf("Balance:\t%s\n", types.FIL(actStats.Actor.Balance))
	fmt.Printf("Nonce:\t\t%d\n", actStats.Actor.Nonce)
	fmt.Printf("Code:\t\t%s (%s)\n", actStats.Actor.Code, strtype)
	fmt.Printf("Head:\t\t%s\n", actStats.Actor.Head)
	fmt.Println()

	fmt.Printf("%-*s%-*s%-*s\n", 32, "Field", 24, "Size", 24, "\"Blocks\"")

	stats := actStats.Stats
	sizeStr := units.BytesSize(float64(stats.Size))
	fmt.Printf("%-*s%-*s%-*s%-*d\n", 32, "<self>", 10, sizeStr, 14, fmt.Sprintf("(%d)", stats.Size), 24, stats.Links)

	for _, s := range actStats.Fields {
		stats := s.Stats
		sizeStr := units.BytesSize(float64(stats.Size))
		fmt.Printf("%-*s%-*s%-*s%-*d\n", 32, s.Name, 10, sizeStr, 14, fmt.Sprintf("(%d)", stats.Size), 24, stats.Links)
	}

	fmt.Println("--------------------------------------------------------------------------")
}
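
// DumpSnapshotStats pretty-prints the summary map as a table sorted by key so
// related sub-paths appear next to each other.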
func DumpSnapshotStats(stats map[string]api.ObjStat) {
	// sort keys so we get subkey locality
	keys := make([]string, 0, len(stats))
	for k := range stats {
		keys = append(keys, k)
	}
	sort.Strings(keys)

	fmt.Printf("%-*s%-*s%-*s\n", 32, "Path", 24, "Size", 24, "\"Blocks\"")
	for _, k := range keys {
		stat := stats[k]
		sizeStr := units.BytesSize(float64(stat.Size))
		fmt.Printf("%-*s%-*s%-*s%-*d\n", 32, k, 10, sizeStr, 14, fmt.Sprintf("(%d)", stat.Size), 24, stat.Links)
	}
}