Merge pull request #3437 from filecoin-project/feat/mpool-stats-cmd
add a simple command to watch messages sitting in the mempool
This commit is contained in:
commit
767341b279
@ -33,6 +33,7 @@ func main() {
|
|||||||
mpoolCmd,
|
mpoolCmd,
|
||||||
genesisVerifyCmd,
|
genesisVerifyCmd,
|
||||||
mathCmd,
|
mathCmd,
|
||||||
|
mpoolStatsCmd,
|
||||||
}
|
}
|
||||||
|
|
||||||
app := &cli.App{
|
app := &cli.App{
|
||||||
|
273
cmd/lotus-shed/mempool-stats.go
Normal file
273
cmd/lotus-shed/mempool-stats.go
Normal file
@ -0,0 +1,273 @@
|
|||||||
|
package main
|
||||||
|
|
||||||
|
import (
|
||||||
|
"fmt"
|
||||||
|
"net/http"
|
||||||
|
"sort"
|
||||||
|
"time"
|
||||||
|
|
||||||
|
"contrib.go.opencensus.io/exporter/prometheus"
|
||||||
|
"github.com/ipfs/go-cid"
|
||||||
|
logging "github.com/ipfs/go-log"
|
||||||
|
"github.com/urfave/cli/v2"
|
||||||
|
"go.opencensus.io/stats"
|
||||||
|
"go.opencensus.io/stats/view"
|
||||||
|
"go.opencensus.io/tag"
|
||||||
|
|
||||||
|
"github.com/filecoin-project/go-address"
|
||||||
|
lapi "github.com/filecoin-project/lotus/api"
|
||||||
|
"github.com/filecoin-project/lotus/chain/types"
|
||||||
|
lcli "github.com/filecoin-project/lotus/cli"
|
||||||
|
"github.com/filecoin-project/specs-actors/actors/builtin"
|
||||||
|
)
|
||||||
|
|
||||||
|
var (
|
||||||
|
MpoolAge = stats.Float64("mpoolage", "Age of messages in the mempool", stats.UnitSeconds)
|
||||||
|
MpoolSize = stats.Int64("mpoolsize", "Number of messages in mempool", stats.UnitDimensionless)
|
||||||
|
MpoolInboundRate = stats.Int64("inbound", "Counter for inbound messages", stats.UnitDimensionless)
|
||||||
|
BlockInclusionRate = stats.Int64("inclusion", "Counter for message included in blocks", stats.UnitDimensionless)
|
||||||
|
MsgWaitTime = stats.Float64("msg-wait-time", "Wait time of messages to make it into a block", stats.UnitSeconds)
|
||||||
|
)
|
||||||
|
|
||||||
|
var (
|
||||||
|
LeTag, _ = tag.NewKey("quantile")
|
||||||
|
MTTag, _ = tag.NewKey("msg_type")
|
||||||
|
)
|
||||||
|
|
||||||
|
var (
|
||||||
|
AgeView = &view.View{
|
||||||
|
Name: "mpool-age",
|
||||||
|
Measure: MpoolAge,
|
||||||
|
TagKeys: []tag.Key{LeTag, MTTag},
|
||||||
|
Aggregation: view.LastValue(),
|
||||||
|
}
|
||||||
|
SizeView = &view.View{
|
||||||
|
Name: "mpool-size",
|
||||||
|
Measure: MpoolSize,
|
||||||
|
TagKeys: []tag.Key{MTTag},
|
||||||
|
Aggregation: view.LastValue(),
|
||||||
|
}
|
||||||
|
InboundRate = &view.View{
|
||||||
|
Name: "msg-inbound",
|
||||||
|
Measure: MpoolInboundRate,
|
||||||
|
TagKeys: []tag.Key{MTTag},
|
||||||
|
Aggregation: view.Count(),
|
||||||
|
}
|
||||||
|
InclusionRate = &view.View{
|
||||||
|
Name: "msg-inclusion",
|
||||||
|
Measure: BlockInclusionRate,
|
||||||
|
TagKeys: []tag.Key{MTTag},
|
||||||
|
Aggregation: view.Count(),
|
||||||
|
}
|
||||||
|
MsgWait = &view.View{
|
||||||
|
Name: "msg-wait",
|
||||||
|
Measure: MsgWaitTime,
|
||||||
|
TagKeys: []tag.Key{MTTag},
|
||||||
|
Aggregation: view.Distribution(10, 30, 60, 120, 240, 600, 1800, 3600),
|
||||||
|
}
|
||||||
|
)
|
||||||
|
|
||||||
|
type msgInfo struct {
|
||||||
|
msg *types.SignedMessage
|
||||||
|
seen time.Time
|
||||||
|
}
|
||||||
|
|
||||||
|
var mpoolStatsCmd = &cli.Command{
|
||||||
|
Name: "mpool-stats",
|
||||||
|
Action: func(cctx *cli.Context) error {
|
||||||
|
logging.SetLogLevel("rpc", "ERROR")
|
||||||
|
|
||||||
|
if err := view.Register(AgeView, SizeView, InboundRate, InclusionRate, MsgWait); err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
|
||||||
|
expo, err := prometheus.NewExporter(prometheus.Options{
|
||||||
|
Namespace: "lotusmpool",
|
||||||
|
})
|
||||||
|
if err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
|
||||||
|
http.Handle("/debug/metrics", expo)
|
||||||
|
|
||||||
|
go func() {
|
||||||
|
if err := http.ListenAndServe(":10555", nil); err != nil {
|
||||||
|
panic(err)
|
||||||
|
}
|
||||||
|
}()
|
||||||
|
|
||||||
|
api, closer, err := lcli.GetFullNodeAPI(cctx)
|
||||||
|
if err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
|
||||||
|
defer closer()
|
||||||
|
ctx := lcli.ReqContext(cctx)
|
||||||
|
|
||||||
|
updates, err := api.MpoolSub(ctx)
|
||||||
|
if err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
|
||||||
|
mcache := make(map[address.Address]bool)
|
||||||
|
isMiner := func(addr address.Address) (bool, error) {
|
||||||
|
cache, ok := mcache[addr]
|
||||||
|
if ok {
|
||||||
|
return cache, nil
|
||||||
|
}
|
||||||
|
|
||||||
|
act, err := api.StateGetActor(ctx, addr, types.EmptyTSK)
|
||||||
|
if err != nil {
|
||||||
|
return false, err
|
||||||
|
}
|
||||||
|
|
||||||
|
ism := act.Code == builtin.StorageMinerActorCodeID
|
||||||
|
mcache[addr] = ism
|
||||||
|
return ism, nil
|
||||||
|
}
|
||||||
|
|
||||||
|
wpostTracker := make(map[cid.Cid]*msgInfo)
|
||||||
|
tracker := make(map[cid.Cid]*msgInfo)
|
||||||
|
tick := time.Tick(time.Second)
|
||||||
|
for {
|
||||||
|
select {
|
||||||
|
case u, ok := <-updates:
|
||||||
|
if !ok {
|
||||||
|
return fmt.Errorf("connection with lotus node broke")
|
||||||
|
}
|
||||||
|
switch u.Type {
|
||||||
|
case lapi.MpoolAdd:
|
||||||
|
stats.Record(ctx, MpoolInboundRate.M(1))
|
||||||
|
tracker[u.Message.Cid()] = &msgInfo{
|
||||||
|
msg: u.Message,
|
||||||
|
seen: time.Now(),
|
||||||
|
}
|
||||||
|
|
||||||
|
if u.Message.Message.Method == builtin.MethodsMiner.SubmitWindowedPoSt {
|
||||||
|
|
||||||
|
miner, err := isMiner(u.Message.Message.To)
|
||||||
|
if err != nil {
|
||||||
|
log.Warnf("failed to determine if message target was to a miner: %s", err)
|
||||||
|
continue
|
||||||
|
}
|
||||||
|
|
||||||
|
if miner {
|
||||||
|
wpostTracker[u.Message.Cid()] = &msgInfo{
|
||||||
|
msg: u.Message,
|
||||||
|
seen: time.Now(),
|
||||||
|
}
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(MTTag, "wpost")}, MpoolInboundRate.M(1))
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
case lapi.MpoolRemove:
|
||||||
|
mi, ok := tracker[u.Message.Cid()]
|
||||||
|
if ok {
|
||||||
|
fmt.Printf("%s was in the mempool for %s (feecap=%s, prem=%s)\n", u.Message.Cid(), time.Since(mi.seen), u.Message.Message.GasFeeCap, u.Message.Message.GasPremium)
|
||||||
|
stats.Record(ctx, BlockInclusionRate.M(1))
|
||||||
|
stats.Record(ctx, MsgWaitTime.M(time.Since(mi.seen).Seconds()))
|
||||||
|
delete(tracker, u.Message.Cid())
|
||||||
|
}
|
||||||
|
|
||||||
|
wm, ok := wpostTracker[u.Message.Cid()]
|
||||||
|
if ok {
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(MTTag, "wpost")}, BlockInclusionRate.M(1))
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(MTTag, "wpost")}, MsgWaitTime.M(time.Since(wm.seen).Seconds()))
|
||||||
|
delete(wpostTracker, u.Message.Cid())
|
||||||
|
}
|
||||||
|
default:
|
||||||
|
return fmt.Errorf("unrecognized mpool update state: %d", u.Type)
|
||||||
|
}
|
||||||
|
case <-tick:
|
||||||
|
var ages []time.Duration
|
||||||
|
if len(tracker) > 0 {
|
||||||
|
for _, v := range tracker {
|
||||||
|
age := time.Since(v.seen)
|
||||||
|
ages = append(ages, age)
|
||||||
|
}
|
||||||
|
|
||||||
|
st := ageStats(ages)
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(LeTag, "40")}, MpoolAge.M(st.Perc40.Seconds()))
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(LeTag, "50")}, MpoolAge.M(st.Perc50.Seconds()))
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(LeTag, "60")}, MpoolAge.M(st.Perc60.Seconds()))
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(LeTag, "70")}, MpoolAge.M(st.Perc70.Seconds()))
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(LeTag, "80")}, MpoolAge.M(st.Perc80.Seconds()))
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(LeTag, "90")}, MpoolAge.M(st.Perc90.Seconds()))
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(LeTag, "95")}, MpoolAge.M(st.Perc95.Seconds()))
|
||||||
|
|
||||||
|
stats.Record(ctx, MpoolSize.M(int64(len(tracker))))
|
||||||
|
fmt.Printf("%d messages in mempool for average of %s, (%s / %s / %s)\n", st.Count, st.Average, st.Perc50, st.Perc80, st.Perc95)
|
||||||
|
}
|
||||||
|
|
||||||
|
var wpages []time.Duration
|
||||||
|
if len(wpostTracker) > 0 {
|
||||||
|
for _, v := range wpostTracker {
|
||||||
|
age := time.Since(v.seen)
|
||||||
|
wpages = append(wpages, age)
|
||||||
|
}
|
||||||
|
|
||||||
|
st := ageStats(wpages)
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(LeTag, "40"), tag.Upsert(MTTag, "wpost")}, MpoolAge.M(st.Perc40.Seconds()))
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(LeTag, "50"), tag.Upsert(MTTag, "wpost")}, MpoolAge.M(st.Perc50.Seconds()))
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(LeTag, "60"), tag.Upsert(MTTag, "wpost")}, MpoolAge.M(st.Perc60.Seconds()))
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(LeTag, "70"), tag.Upsert(MTTag, "wpost")}, MpoolAge.M(st.Perc70.Seconds()))
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(LeTag, "80"), tag.Upsert(MTTag, "wpost")}, MpoolAge.M(st.Perc80.Seconds()))
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(LeTag, "90"), tag.Upsert(MTTag, "wpost")}, MpoolAge.M(st.Perc90.Seconds()))
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(LeTag, "95"), tag.Upsert(MTTag, "wpost")}, MpoolAge.M(st.Perc95.Seconds()))
|
||||||
|
|
||||||
|
_ = stats.RecordWithTags(ctx, []tag.Mutator{tag.Upsert(MTTag, "wpost")}, MpoolSize.M(int64(len(wpostTracker))))
|
||||||
|
fmt.Printf("%d wpost messages in mempool for average of %s, (%s / %s / %s)\n", st.Count, st.Average, st.Perc50, st.Perc80, st.Perc95)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
},
|
||||||
|
}
|
||||||
|
|
||||||
|
type ageStat struct {
|
||||||
|
Average time.Duration
|
||||||
|
Max time.Duration
|
||||||
|
Perc40 time.Duration
|
||||||
|
Perc50 time.Duration
|
||||||
|
Perc60 time.Duration
|
||||||
|
Perc70 time.Duration
|
||||||
|
Perc80 time.Duration
|
||||||
|
Perc90 time.Duration
|
||||||
|
Perc95 time.Duration
|
||||||
|
Count int
|
||||||
|
}
|
||||||
|
|
||||||
|
func ageStats(ages []time.Duration) *ageStat {
|
||||||
|
sort.Slice(ages, func(i, j int) bool {
|
||||||
|
return ages[i] < ages[j]
|
||||||
|
})
|
||||||
|
|
||||||
|
st := ageStat{
|
||||||
|
Count: len(ages),
|
||||||
|
}
|
||||||
|
var sum time.Duration
|
||||||
|
for _, a := range ages {
|
||||||
|
sum += a
|
||||||
|
if a > st.Max {
|
||||||
|
st.Max = a
|
||||||
|
}
|
||||||
|
}
|
||||||
|
st.Average = sum / time.Duration(len(ages))
|
||||||
|
|
||||||
|
p40 := (4 * len(ages)) / 10
|
||||||
|
p50 := len(ages) / 2
|
||||||
|
p60 := (6 * len(ages)) / 10
|
||||||
|
p70 := (7 * len(ages)) / 10
|
||||||
|
p80 := (4 * len(ages)) / 5
|
||||||
|
p90 := (9 * len(ages)) / 10
|
||||||
|
p95 := (19 * len(ages)) / 20
|
||||||
|
|
||||||
|
st.Perc40 = ages[p40]
|
||||||
|
st.Perc50 = ages[p50]
|
||||||
|
st.Perc60 = ages[p60]
|
||||||
|
st.Perc70 = ages[p70]
|
||||||
|
st.Perc80 = ages[p80]
|
||||||
|
st.Perc90 = ages[p90]
|
||||||
|
st.Perc95 = ages[p95]
|
||||||
|
|
||||||
|
return &st
|
||||||
|
}
|
Loading…
Reference in New Issue
Block a user