2019-04-18 12:39:37 +00:00
|
|
|
package swarm
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"os"
|
|
|
|
"strconv"
|
|
|
|
"sync"
|
|
|
|
"time"
|
|
|
|
|
2019-06-12 17:36:56 +00:00
|
|
|
"github.com/libp2p/go-libp2p-core/peer"
|
|
|
|
"github.com/libp2p/go-libp2p-core/transport"
|
|
|
|
|
2019-04-18 12:39:37 +00:00
|
|
|
addrutil "github.com/libp2p/go-addr-util"
|
|
|
|
ma "github.com/multiformats/go-multiaddr"
|
|
|
|
)
|
|
|
|
|
|
|
|
type dialResult struct {
|
2019-06-12 17:36:56 +00:00
|
|
|
Conn transport.CapableConn
|
2019-04-18 12:39:37 +00:00
|
|
|
Addr ma.Multiaddr
|
|
|
|
Err error
|
|
|
|
}
|
|
|
|
|
|
|
|
type dialJob struct {
|
|
|
|
addr ma.Multiaddr
|
|
|
|
peer peer.ID
|
|
|
|
ctx context.Context
|
|
|
|
resp chan dialResult
|
|
|
|
}
|
|
|
|
|
|
|
|
func (dj *dialJob) cancelled() bool {
|
|
|
|
return dj.ctx.Err() != nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (dj *dialJob) dialTimeout() time.Duration {
|
|
|
|
timeout := transport.DialTimeout
|
|
|
|
if lowTimeoutFilters.AddrBlocked(dj.addr) {
|
|
|
|
timeout = DialTimeoutLocal
|
|
|
|
}
|
|
|
|
|
|
|
|
return timeout
|
|
|
|
}
|
|
|
|
|
|
|
|
type dialLimiter struct {
|
|
|
|
lk sync.Mutex
|
|
|
|
|
|
|
|
fdConsuming int
|
|
|
|
fdLimit int
|
|
|
|
waitingOnFd []*dialJob
|
|
|
|
|
|
|
|
dialFunc dialfunc
|
|
|
|
|
|
|
|
activePerPeer map[peer.ID]int
|
|
|
|
perPeerLimit int
|
|
|
|
waitingOnPeerLimit map[peer.ID][]*dialJob
|
|
|
|
}
|
|
|
|
|
2019-06-12 17:36:56 +00:00
|
|
|
type dialfunc func(context.Context, peer.ID, ma.Multiaddr) (transport.CapableConn, error)
|
2019-04-18 12:39:37 +00:00
|
|
|
|
|
|
|
func newDialLimiter(df dialfunc) *dialLimiter {
|
|
|
|
fd := ConcurrentFdDials
|
|
|
|
if env := os.Getenv("LIBP2P_SWARM_FD_LIMIT"); env != "" {
|
|
|
|
if n, err := strconv.ParseInt(env, 10, 32); err == nil {
|
|
|
|
fd = int(n)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return newDialLimiterWithParams(df, fd, DefaultPerPeerRateLimit)
|
|
|
|
}
|
|
|
|
|
|
|
|
func newDialLimiterWithParams(df dialfunc, fdLimit, perPeerLimit int) *dialLimiter {
|
|
|
|
return &dialLimiter{
|
|
|
|
fdLimit: fdLimit,
|
|
|
|
perPeerLimit: perPeerLimit,
|
|
|
|
waitingOnPeerLimit: make(map[peer.ID][]*dialJob),
|
|
|
|
activePerPeer: make(map[peer.ID]int),
|
|
|
|
dialFunc: df,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// freeFDToken frees FD token and if there are any schedules another waiting dialJob
|
|
|
|
// in it's place
|
|
|
|
func (dl *dialLimiter) freeFDToken() {
|
|
|
|
log.Debugf("[limiter] freeing FD token; waiting: %d; consuming: %d", len(dl.waitingOnFd), dl.fdConsuming)
|
|
|
|
dl.fdConsuming--
|
|
|
|
|
|
|
|
for len(dl.waitingOnFd) > 0 {
|
|
|
|
next := dl.waitingOnFd[0]
|
|
|
|
dl.waitingOnFd[0] = nil // clear out memory
|
|
|
|
dl.waitingOnFd = dl.waitingOnFd[1:]
|
|
|
|
|
|
|
|
if len(dl.waitingOnFd) == 0 {
|
|
|
|
// clear out memory.
|
|
|
|
dl.waitingOnFd = nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Skip over canceled dials instead of queuing up a goroutine.
|
|
|
|
if next.cancelled() {
|
|
|
|
dl.freePeerToken(next)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
dl.fdConsuming++
|
|
|
|
|
|
|
|
// we already have activePerPeer token at this point so we can just dial
|
|
|
|
go dl.executeDial(next)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (dl *dialLimiter) freePeerToken(dj *dialJob) {
|
|
|
|
log.Debugf("[limiter] freeing peer token; peer %s; addr: %s; active for peer: %d; waiting on peer limit: %d",
|
|
|
|
dj.peer, dj.addr, dl.activePerPeer[dj.peer], len(dl.waitingOnPeerLimit[dj.peer]))
|
|
|
|
// release tokens in reverse order than we take them
|
|
|
|
dl.activePerPeer[dj.peer]--
|
|
|
|
if dl.activePerPeer[dj.peer] == 0 {
|
|
|
|
delete(dl.activePerPeer, dj.peer)
|
|
|
|
}
|
|
|
|
|
|
|
|
waitlist := dl.waitingOnPeerLimit[dj.peer]
|
|
|
|
for len(waitlist) > 0 {
|
|
|
|
next := waitlist[0]
|
|
|
|
waitlist[0] = nil // clear out memory
|
|
|
|
waitlist = waitlist[1:]
|
|
|
|
|
|
|
|
if len(waitlist) == 0 {
|
|
|
|
delete(dl.waitingOnPeerLimit, next.peer)
|
|
|
|
} else {
|
|
|
|
dl.waitingOnPeerLimit[next.peer] = waitlist
|
|
|
|
}
|
|
|
|
|
|
|
|
if next.cancelled() {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
dl.activePerPeer[next.peer]++ // just kidding, we still want this token
|
|
|
|
|
|
|
|
dl.addCheckFdLimit(next)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (dl *dialLimiter) finishedDial(dj *dialJob) {
|
|
|
|
dl.lk.Lock()
|
|
|
|
defer dl.lk.Unlock()
|
|
|
|
|
|
|
|
if addrutil.IsFDCostlyTransport(dj.addr) {
|
|
|
|
dl.freeFDToken()
|
|
|
|
}
|
|
|
|
|
|
|
|
dl.freePeerToken(dj)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (dl *dialLimiter) addCheckFdLimit(dj *dialJob) {
|
|
|
|
if addrutil.IsFDCostlyTransport(dj.addr) {
|
|
|
|
if dl.fdConsuming >= dl.fdLimit {
|
|
|
|
log.Debugf("[limiter] blocked dial waiting on FD token; peer: %s; addr: %s; consuming: %d; "+
|
|
|
|
"limit: %d; waiting: %d", dj.peer, dj.addr, dl.fdConsuming, dl.fdLimit, len(dl.waitingOnFd))
|
|
|
|
dl.waitingOnFd = append(dl.waitingOnFd, dj)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
log.Debugf("[limiter] taking FD token: peer: %s; addr: %s; prev consuming: %d",
|
|
|
|
dj.peer, dj.addr, dl.fdConsuming)
|
|
|
|
// take token
|
|
|
|
dl.fdConsuming++
|
|
|
|
}
|
|
|
|
|
|
|
|
log.Debugf("[limiter] executing dial; peer: %s; addr: %s; FD consuming: %d; waiting: %d",
|
|
|
|
dj.peer, dj.addr, dl.fdConsuming, len(dl.waitingOnFd))
|
|
|
|
go dl.executeDial(dj)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (dl *dialLimiter) addCheckPeerLimit(dj *dialJob) {
|
|
|
|
if dl.activePerPeer[dj.peer] >= dl.perPeerLimit {
|
|
|
|
log.Debugf("[limiter] blocked dial waiting on peer limit; peer: %s; addr: %s; active: %d; "+
|
|
|
|
"peer limit: %d; waiting: %d", dj.peer, dj.addr, dl.activePerPeer[dj.peer], dl.perPeerLimit,
|
|
|
|
len(dl.waitingOnPeerLimit[dj.peer]))
|
|
|
|
wlist := dl.waitingOnPeerLimit[dj.peer]
|
|
|
|
dl.waitingOnPeerLimit[dj.peer] = append(wlist, dj)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
dl.activePerPeer[dj.peer]++
|
|
|
|
|
|
|
|
dl.addCheckFdLimit(dj)
|
|
|
|
}
|
|
|
|
|
|
|
|
// AddDialJob tries to take the needed tokens for starting the given dial job.
|
|
|
|
// If it acquires all needed tokens, it immediately starts the dial, otherwise
|
|
|
|
// it will put it on the waitlist for the requested token.
|
|
|
|
func (dl *dialLimiter) AddDialJob(dj *dialJob) {
|
|
|
|
dl.lk.Lock()
|
|
|
|
defer dl.lk.Unlock()
|
|
|
|
|
|
|
|
log.Debugf("[limiter] adding a dial job through limiter: %v", dj.addr)
|
|
|
|
dl.addCheckPeerLimit(dj)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (dl *dialLimiter) clearAllPeerDials(p peer.ID) {
|
|
|
|
dl.lk.Lock()
|
|
|
|
defer dl.lk.Unlock()
|
|
|
|
delete(dl.waitingOnPeerLimit, p)
|
|
|
|
log.Debugf("[limiter] clearing all peer dials: %v", p)
|
|
|
|
// NB: the waitingOnFd list doesn't need to be cleaned out here, we will
|
|
|
|
// remove them as we encounter them because they are 'cancelled' at this
|
|
|
|
// point
|
|
|
|
}
|
|
|
|
|
|
|
|
// executeDial calls the dialFunc, and reports the result through the response
|
|
|
|
// channel when finished. Once the response is sent it also releases all tokens
|
|
|
|
// it held during the dial.
|
|
|
|
func (dl *dialLimiter) executeDial(j *dialJob) {
|
|
|
|
defer dl.finishedDial(j)
|
|
|
|
if j.cancelled() {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
dctx, cancel := context.WithTimeout(j.ctx, j.dialTimeout())
|
|
|
|
defer cancel()
|
|
|
|
|
|
|
|
con, err := dl.dialFunc(dctx, j.peer, j.addr)
|
|
|
|
select {
|
|
|
|
case j.resp <- dialResult{Conn: con, Addr: j.addr, Err: err}:
|
|
|
|
case <-j.ctx.Done():
|
|
|
|
if err == nil {
|
|
|
|
con.Close()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|