2022-01-18 12:56:24 +00:00
|
|
|
package lp2p
|
|
|
|
|
|
|
|
import (
|
2022-01-20 09:47:39 +00:00
|
|
|
"context"
|
2022-01-18 12:56:24 +00:00
|
|
|
"errors"
|
|
|
|
"fmt"
|
2022-03-15 07:43:18 +00:00
|
|
|
"math/bits"
|
2022-01-18 12:56:24 +00:00
|
|
|
"os"
|
|
|
|
"path/filepath"
|
|
|
|
|
2022-07-05 22:07:56 +00:00
|
|
|
ocprom "contrib.go.opencensus.io/exporter/prometheus"
|
2022-06-14 15:00:51 +00:00
|
|
|
logging "github.com/ipfs/go-log/v2"
|
2022-01-18 12:56:24 +00:00
|
|
|
"github.com/libp2p/go-libp2p"
|
|
|
|
"github.com/libp2p/go-libp2p-core/network"
|
2022-02-14 17:46:05 +00:00
|
|
|
"github.com/libp2p/go-libp2p-core/peer"
|
|
|
|
"github.com/libp2p/go-libp2p-core/protocol"
|
2022-01-18 12:56:24 +00:00
|
|
|
rcmgr "github.com/libp2p/go-libp2p-resource-manager"
|
2022-07-05 22:07:56 +00:00
|
|
|
rcmgrObs "github.com/libp2p/go-libp2p-resource-manager/obs"
|
|
|
|
"github.com/prometheus/client_golang/prometheus"
|
2022-06-14 15:00:51 +00:00
|
|
|
"go.opencensus.io/stats"
|
2022-07-05 22:07:56 +00:00
|
|
|
"go.opencensus.io/stats/view"
|
2022-06-14 15:00:51 +00:00
|
|
|
"go.opencensus.io/tag"
|
|
|
|
"go.uber.org/fx"
|
2022-03-15 07:43:18 +00:00
|
|
|
|
2022-02-14 17:46:05 +00:00
|
|
|
"github.com/filecoin-project/lotus/metrics"
|
2022-01-18 12:56:24 +00:00
|
|
|
"github.com/filecoin-project/lotus/node/repo"
|
|
|
|
)
|
|
|
|
|
2022-03-15 07:43:18 +00:00
|
|
|
func ResourceManager(connMgrHi uint) func(lc fx.Lifecycle, repo repo.LockedRepo) (network.ResourceManager, error) {
|
|
|
|
return func(lc fx.Lifecycle, repo repo.LockedRepo) (network.ResourceManager, error) {
|
2022-05-31 09:03:03 +00:00
|
|
|
isFullNode := repo.RepoType().Type() == "FullNode"
|
2022-03-15 07:43:18 +00:00
|
|
|
envvar := os.Getenv("LOTUS_RCMGR")
|
2022-05-31 09:32:56 +00:00
|
|
|
if (isFullNode && envvar == "0") || // only set NullResourceManager if envvar is explicitly "0"
|
2022-05-31 09:33:08 +00:00
|
|
|
(!isFullNode && envvar != "1") { // set NullResourceManager *unless* envvar is explicitly "1"
|
2022-03-15 07:43:18 +00:00
|
|
|
log.Info("libp2p resource manager is disabled")
|
|
|
|
return network.NullResourceManager, nil
|
|
|
|
}
|
2022-01-18 12:56:24 +00:00
|
|
|
|
2022-03-15 07:43:18 +00:00
|
|
|
log.Info("libp2p resource manager is enabled")
|
|
|
|
// enable debug logs for rcmgr
|
|
|
|
logging.SetLogLevel("rcmgr", "debug")
|
|
|
|
|
2022-07-05 22:07:56 +00:00
|
|
|
// Adjust default defaultLimits
|
2022-03-15 07:43:18 +00:00
|
|
|
// - give it more memory, up to 4G, min of 1G
|
2022-07-05 22:07:56 +00:00
|
|
|
// - if maxconns are too high, adjust Conn/FD/Stream defaultLimits
|
|
|
|
defaultLimits := rcmgr.DefaultLimits
|
|
|
|
|
|
|
|
// TODO: also set appropriate default limits for lotus protocols
|
|
|
|
libp2p.SetDefaultServiceLimits(&defaultLimits)
|
|
|
|
|
|
|
|
// Minimum 1GB of memory
|
|
|
|
defaultLimits.SystemBaseLimit.Memory = 1 << 30
|
|
|
|
// For every extra 1GB of memory we have available, increase our limit by 1GiB
|
|
|
|
defaultLimits.SystemLimitIncrease.Memory = 1 << 30
|
2022-07-06 17:12:09 +00:00
|
|
|
defaultLimitConfig := defaultLimits.AutoScale()
|
2022-07-05 22:07:56 +00:00
|
|
|
if defaultLimitConfig.System.Memory > 4<<30 {
|
|
|
|
// Cap our memory limit
|
|
|
|
defaultLimitConfig.System.Memory = 4 << 30
|
|
|
|
}
|
|
|
|
|
2022-03-15 07:43:18 +00:00
|
|
|
maxconns := int(connMgrHi)
|
2022-07-05 22:07:56 +00:00
|
|
|
if 2*maxconns > defaultLimitConfig.System.ConnsInbound {
|
2022-03-15 07:59:34 +00:00
|
|
|
// adjust conns to 2x to allow for two conns per peer (TCP+QUIC)
|
2022-07-05 22:07:56 +00:00
|
|
|
defaultLimitConfig.System.ConnsInbound = logScale(2 * maxconns)
|
|
|
|
defaultLimitConfig.System.ConnsOutbound = logScale(2 * maxconns)
|
|
|
|
defaultLimitConfig.System.Conns = logScale(4 * maxconns)
|
2022-03-15 07:43:18 +00:00
|
|
|
|
2022-07-05 22:07:56 +00:00
|
|
|
defaultLimitConfig.System.StreamsInbound = logScale(16 * maxconns)
|
|
|
|
defaultLimitConfig.System.StreamsOutbound = logScale(64 * maxconns)
|
|
|
|
defaultLimitConfig.System.Streams = logScale(64 * maxconns)
|
2022-03-15 07:43:18 +00:00
|
|
|
|
2022-07-05 22:07:56 +00:00
|
|
|
if 2*maxconns > defaultLimitConfig.System.FD {
|
|
|
|
defaultLimitConfig.System.FD = logScale(2 * maxconns)
|
2022-03-15 07:43:18 +00:00
|
|
|
}
|
|
|
|
|
2022-07-05 22:07:56 +00:00
|
|
|
defaultLimitConfig.ServiceDefault.StreamsInbound = logScale(8 * maxconns)
|
|
|
|
defaultLimitConfig.ServiceDefault.StreamsOutbound = logScale(32 * maxconns)
|
|
|
|
defaultLimitConfig.ServiceDefault.Streams = logScale(32 * maxconns)
|
2022-03-15 07:43:18 +00:00
|
|
|
|
2022-07-05 22:07:56 +00:00
|
|
|
defaultLimitConfig.ProtocolDefault.StreamsInbound = logScale(8 * maxconns)
|
|
|
|
defaultLimitConfig.ProtocolDefault.StreamsOutbound = logScale(32 * maxconns)
|
|
|
|
defaultLimitConfig.ProtocolDefault.Streams = logScale(32 * maxconns)
|
2022-03-15 07:43:18 +00:00
|
|
|
|
|
|
|
log.Info("adjusted default resource manager limits")
|
2022-01-18 12:56:24 +00:00
|
|
|
}
|
|
|
|
|
2022-03-15 07:43:18 +00:00
|
|
|
// initialize
|
2022-07-05 22:07:56 +00:00
|
|
|
var limiter rcmgr.Limiter
|
2022-03-15 07:43:18 +00:00
|
|
|
var opts []rcmgr.Option
|
2022-01-18 12:56:24 +00:00
|
|
|
|
2022-03-15 07:43:18 +00:00
|
|
|
repoPath := repo.Path()
|
2022-01-18 12:56:24 +00:00
|
|
|
|
2022-03-15 07:43:18 +00:00
|
|
|
// create limiter -- parse $repo/limits.json if exists
|
|
|
|
limitsFile := filepath.Join(repoPath, "limits.json")
|
|
|
|
limitsIn, err := os.Open(limitsFile)
|
|
|
|
switch {
|
|
|
|
case err == nil:
|
|
|
|
defer limitsIn.Close() //nolint:errcheck
|
2022-07-05 22:07:56 +00:00
|
|
|
limiter, err = rcmgr.NewLimiterFromJSON(limitsIn, defaultLimitConfig)
|
2022-03-15 07:43:18 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("error parsing limit file: %w", err)
|
|
|
|
}
|
2022-01-18 12:56:24 +00:00
|
|
|
|
2022-03-15 07:43:18 +00:00
|
|
|
case errors.Is(err, os.ErrNotExist):
|
2022-07-05 22:07:56 +00:00
|
|
|
limiter = rcmgr.NewFixedLimiter(defaultLimitConfig)
|
2022-02-14 17:46:05 +00:00
|
|
|
|
2022-03-15 07:43:18 +00:00
|
|
|
default:
|
|
|
|
return nil, err
|
2022-01-18 12:56:24 +00:00
|
|
|
}
|
|
|
|
|
2022-07-05 22:07:56 +00:00
|
|
|
str, err := rcmgrObs.NewStatsTraceReporter()
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("error creating resource manager stats reporter: %w", err)
|
|
|
|
}
|
2022-03-15 07:43:18 +00:00
|
|
|
|
2022-07-05 22:07:56 +00:00
|
|
|
// Metrics
|
|
|
|
opts = append(opts, rcmgr.WithMetrics(rcmgrMetrics{}), rcmgr.WithTraceReporter(str))
|
2022-01-18 12:56:24 +00:00
|
|
|
|
2022-03-15 07:43:18 +00:00
|
|
|
if os.Getenv("LOTUS_DEBUG_RCMGR") != "" {
|
|
|
|
debugPath := filepath.Join(repoPath, "debug")
|
|
|
|
if err := os.MkdirAll(debugPath, 0755); err != nil {
|
|
|
|
return nil, fmt.Errorf("error creating debug directory: %w", err)
|
|
|
|
}
|
|
|
|
traceFile := filepath.Join(debugPath, "rcmgr.json.gz")
|
|
|
|
opts = append(opts, rcmgr.WithTrace(traceFile))
|
|
|
|
}
|
|
|
|
|
|
|
|
mgr, err := rcmgr.NewResourceManager(limiter, opts...)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("error creating resource manager: %w", err)
|
|
|
|
}
|
|
|
|
|
2022-07-05 22:07:56 +00:00
|
|
|
// Hook up resource manager metrics
|
2022-07-05 23:07:01 +00:00
|
|
|
err = view.Register(rcmgrObs.DefaultViews...)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("error registering metrics: %w", err)
|
|
|
|
}
|
|
|
|
_, err = ocprom.NewExporter(ocprom.Options{
|
2022-07-05 22:07:56 +00:00
|
|
|
Registry: prometheus.DefaultRegisterer.(*prometheus.Registry),
|
|
|
|
Namespace: "rcmgr_trace_metrics",
|
|
|
|
})
|
2022-07-05 23:07:01 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("error registering metrics: %w", err)
|
|
|
|
}
|
2022-07-05 22:07:56 +00:00
|
|
|
|
2022-03-15 07:43:18 +00:00
|
|
|
lc.Append(fx.Hook{
|
|
|
|
OnStop: func(_ context.Context) error {
|
|
|
|
return mgr.Close()
|
|
|
|
}})
|
|
|
|
|
|
|
|
return mgr, nil
|
|
|
|
}
|
|
|
|
}
|
2022-01-20 09:47:39 +00:00
|
|
|
|
2022-03-15 07:43:18 +00:00
|
|
|
// logScale rounds val up to a power of two: it returns 1 shifted left by the
// number of bits needed to represent val. For positive val that is the
// smallest power of two strictly greater than val, so an exact power of two is
// doubled (4 -> 8); 0 maps to 1.
//
// val is converted to uint before its bit length is taken, so callers are
// expected to pass a non-negative value.
func logScale(val int) int {
	return 1 << bits.Len(uint(val))
}
|
|
|
|
|
|
|
|
func ResourceManagerOption(mgr network.ResourceManager) Libp2pOpts {
|
|
|
|
return Libp2pOpts{
|
|
|
|
Opts: []libp2p.Option{libp2p.ResourceManager(mgr)},
|
|
|
|
}
|
|
|
|
}
|
2022-02-14 17:46:05 +00:00
|
|
|
|
|
|
|
// rcmgrMetrics is an empty, stateless type handed to rcmgr.WithMetrics by
// ResourceManager. Each of its methods records a single count of the matching
// metrics.Rcmgr* measure through opencensus stats.
type rcmgrMetrics struct{}
|
|
|
|
|
|
|
|
func (r rcmgrMetrics) AllowConn(dir network.Direction, usefd bool) {
|
|
|
|
ctx := context.Background()
|
|
|
|
if dir == network.DirInbound {
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.Direction, "inbound"))
|
|
|
|
} else {
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.Direction, "outbound"))
|
|
|
|
}
|
|
|
|
if usefd {
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.UseFD, "true"))
|
|
|
|
} else {
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.UseFD, "false"))
|
|
|
|
}
|
|
|
|
stats.Record(ctx, metrics.RcmgrAllowConn.M(1))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r rcmgrMetrics) BlockConn(dir network.Direction, usefd bool) {
|
|
|
|
ctx := context.Background()
|
|
|
|
if dir == network.DirInbound {
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.Direction, "inbound"))
|
|
|
|
} else {
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.Direction, "outbound"))
|
|
|
|
}
|
|
|
|
if usefd {
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.UseFD, "true"))
|
|
|
|
} else {
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.UseFD, "false"))
|
|
|
|
}
|
|
|
|
stats.Record(ctx, metrics.RcmgrBlockConn.M(1))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r rcmgrMetrics) AllowStream(p peer.ID, dir network.Direction) {
|
|
|
|
ctx := context.Background()
|
|
|
|
if dir == network.DirInbound {
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.Direction, "inbound"))
|
|
|
|
} else {
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.Direction, "outbound"))
|
|
|
|
}
|
|
|
|
stats.Record(ctx, metrics.RcmgrAllowStream.M(1))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r rcmgrMetrics) BlockStream(p peer.ID, dir network.Direction) {
|
|
|
|
ctx := context.Background()
|
|
|
|
if dir == network.DirInbound {
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.Direction, "inbound"))
|
|
|
|
} else {
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.Direction, "outbound"))
|
|
|
|
}
|
|
|
|
stats.Record(ctx, metrics.RcmgrBlockStream.M(1))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r rcmgrMetrics) AllowPeer(p peer.ID) {
|
|
|
|
ctx := context.Background()
|
|
|
|
stats.Record(ctx, metrics.RcmgrAllowPeer.M(1))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r rcmgrMetrics) BlockPeer(p peer.ID) {
|
|
|
|
ctx := context.Background()
|
|
|
|
stats.Record(ctx, metrics.RcmgrBlockPeer.M(1))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r rcmgrMetrics) AllowProtocol(proto protocol.ID) {
|
|
|
|
ctx := context.Background()
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.ProtocolID, string(proto)))
|
|
|
|
stats.Record(ctx, metrics.RcmgrAllowProto.M(1))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r rcmgrMetrics) BlockProtocol(proto protocol.ID) {
|
|
|
|
ctx := context.Background()
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.ProtocolID, string(proto)))
|
|
|
|
stats.Record(ctx, metrics.RcmgrBlockProto.M(1))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r rcmgrMetrics) BlockProtocolPeer(proto protocol.ID, p peer.ID) {
|
|
|
|
ctx := context.Background()
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.ProtocolID, string(proto)))
|
|
|
|
stats.Record(ctx, metrics.RcmgrBlockProtoPeer.M(1))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r rcmgrMetrics) AllowService(svc string) {
|
|
|
|
ctx := context.Background()
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.ServiceID, svc))
|
|
|
|
stats.Record(ctx, metrics.RcmgrAllowSvc.M(1))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r rcmgrMetrics) BlockService(svc string) {
|
|
|
|
ctx := context.Background()
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.ServiceID, svc))
|
|
|
|
stats.Record(ctx, metrics.RcmgrBlockSvc.M(1))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r rcmgrMetrics) BlockServicePeer(svc string, p peer.ID) {
|
|
|
|
ctx := context.Background()
|
|
|
|
ctx, _ = tag.New(ctx, tag.Upsert(metrics.ServiceID, svc))
|
|
|
|
stats.Record(ctx, metrics.RcmgrBlockSvcPeer.M(1))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r rcmgrMetrics) AllowMemory(size int) {
|
|
|
|
stats.Record(context.Background(), metrics.RcmgrAllowMem.M(1))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r rcmgrMetrics) BlockMemory(size int) {
|
|
|
|
stats.Record(context.Background(), metrics.RcmgrBlockMem.M(1))
|
|
|
|
}
|