package swarm

import (
	"context"
	"os"
	"strconv"
	"sync"
	"time"

	addrutil "github.com/libp2p/go-addr-util"
	peer "github.com/libp2p/go-libp2p-peer"
	transport "github.com/libp2p/go-libp2p-transport"
	ma "github.com/multiformats/go-multiaddr"
)

type dialResult struct {
Steven Allen's avatar
Steven Allen committed
17
	Conn transport.Conn
Jeromy's avatar
Jeromy committed
18
	Addr ma.Multiaddr
Jeromy's avatar
Jeromy committed
19 20 21 22
	Err  error
}

type dialJob struct {
Steven Allen's avatar
Steven Allen committed
23 24 25 26
	addr ma.Multiaddr
	peer peer.ID
	ctx  context.Context
	resp chan dialResult
Jeromy's avatar
Jeromy committed
27 28
}

// cancelled reports, without blocking, whether the job's context has already
// finished.
func (dj *dialJob) cancelled() bool {
	// Per the context contract Err is non-nil exactly when Done is closed.
	return dj.ctx.Err() != nil
}

func (dj *dialJob) dialTimeout() time.Duration {
39
	timeout := transport.DialTimeout
40 41 42 43 44 45 46
	if lowTimeoutFilters.AddrBlocked(dj.addr) {
		timeout = DialTimeoutLocal
	}

	return timeout
}

type dialLimiter struct {
Łukasz Magiera's avatar
Łukasz Magiera committed
48 49
	lk sync.Mutex

Jeromy's avatar
Jeromy committed
50 51 52 53
	fdConsuming int
	fdLimit     int
	waitingOnFd []*dialJob

Łukasz Magiera's avatar
Łukasz Magiera committed
54
	dialFunc dialfunc
Jeromy's avatar
Jeromy committed
55 56 57 58 59 60

	activePerPeer      map[peer.ID]int
	perPeerLimit       int
	waitingOnPeerLimit map[peer.ID][]*dialJob
}

// dialfunc is the signature of the function the dialLimiter calls to perform
// the actual dial of one address of one peer.
type dialfunc func(context.Context, peer.ID, ma.Multiaddr) (transport.Conn, error)

func newDialLimiter(df dialfunc) *dialLimiter {
64 65 66 67 68 69 70
	fd := ConcurrentFdDials
	if env := os.Getenv("LIBP2P_SWARM_FD_LIMIT"); env != "" {
		if n, err := strconv.ParseInt(env, 10, 32); err == nil {
			fd = int(n)
		}
	}
	return newDialLimiterWithParams(df, fd, DefaultPerPeerRateLimit)
Jeromy's avatar
Jeromy committed
71 72
}

func newDialLimiterWithParams(df dialfunc, fdLimit, perPeerLimit int) *dialLimiter {
Jeromy's avatar
Jeromy committed
74
	return &dialLimiter{
75 76
		fdLimit:            fdLimit,
		perPeerLimit:       perPeerLimit,
Jeromy's avatar
Jeromy committed
77 78 79 80 81 82
		waitingOnPeerLimit: make(map[peer.ID][]*dialJob),
		activePerPeer:      make(map[peer.ID]int),
		dialFunc:           df,
	}
}

// freeFDToken frees FD token and if there are any schedules another waiting dialJob
// in it's place
func (dl *dialLimiter) freeFDToken() {
86
	log.Debugf("[limiter] freeing FD token; waiting: %d; consuming: %d", len(dl.waitingOnFd), dl.fdConsuming)
Łukasz Magiera's avatar
Łukasz Magiera committed
87 88
	dl.fdConsuming--

89
	for len(dl.waitingOnFd) > 0 {
Łukasz Magiera's avatar
Łukasz Magiera committed
90 91 92
		next := dl.waitingOnFd[0]
		dl.waitingOnFd[0] = nil // clear out memory
		dl.waitingOnFd = dl.waitingOnFd[1:]
93

Łukasz Magiera's avatar
Łukasz Magiera committed
94
		if len(dl.waitingOnFd) == 0 {
95 96 97 98 99 100 101 102
			// clear out memory.
			dl.waitingOnFd = nil
		}

		// Skip over canceled dials instead of queuing up a goroutine.
		if next.cancelled() {
			dl.freePeerToken(next)
			continue
Jeromy's avatar
Jeromy committed
103
		}
Łukasz Magiera's avatar
Łukasz Magiera committed
104 105 106 107
		dl.fdConsuming++

		// we already have activePerPeer token at this point so we can just dial
		go dl.executeDial(next)
108
		return
Jeromy's avatar
Jeromy committed
109
	}
Łukasz Magiera's avatar
Łukasz Magiera committed
110
}

func (dl *dialLimiter) freePeerToken(dj *dialJob) {
113 114
	log.Debugf("[limiter] freeing peer token; peer %s; addr: %s; active for peer: %d; waiting on peer limit: %d",
		dj.peer, dj.addr, dl.activePerPeer[dj.peer], len(dl.waitingOnPeerLimit[dj.peer]))
Jeromy's avatar
Jeromy committed
115 116 117 118 119 120 121
	// release tokens in reverse order than we take them
	dl.activePerPeer[dj.peer]--
	if dl.activePerPeer[dj.peer] == 0 {
		delete(dl.activePerPeer, dj.peer)
	}

	waitlist := dl.waitingOnPeerLimit[dj.peer]
122
	for len(waitlist) > 0 {
Jeromy's avatar
Jeromy committed
123
		next := waitlist[0]
124 125 126 127
		waitlist[0] = nil // clear out memory
		waitlist = waitlist[1:]

		if len(waitlist) == 0 {
Łukasz Magiera's avatar
Łukasz Magiera committed
128
			delete(dl.waitingOnPeerLimit, next.peer)
Jeromy's avatar
Jeromy committed
129
		} else {
130 131 132 133 134
			dl.waitingOnPeerLimit[next.peer] = waitlist
		}

		if next.cancelled() {
			continue
Jeromy's avatar
Jeromy committed
135 136
		}

Łukasz Magiera's avatar
Łukasz Magiera committed
137
		dl.activePerPeer[next.peer]++ // just kidding, we still want this token
138

Łukasz Magiera's avatar
Łukasz Magiera committed
139
		dl.addCheckFdLimit(next)
140
		return
Jeromy's avatar
Jeromy committed
141 142 143
	}
}

func (dl *dialLimiter) finishedDial(dj *dialJob) {
	dl.lk.Lock()
	defer dl.lk.Unlock()
Jeromy's avatar
Jeromy committed
147

Łukasz Magiera's avatar
Łukasz Magiera committed
148 149
	if addrutil.IsFDCostlyTransport(dj.addr) {
		dl.freeFDToken()
Jeromy's avatar
Jeromy committed
150 151
	}

Łukasz Magiera's avatar
Łukasz Magiera committed
152 153 154 155
	dl.freePeerToken(dj)
}

func (dl *dialLimiter) addCheckFdLimit(dj *dialJob) {
Jeromy's avatar
Jeromy committed
156 157
	if addrutil.IsFDCostlyTransport(dj.addr) {
		if dl.fdConsuming >= dl.fdLimit {
158 159
			log.Debugf("[limiter] blocked dial waiting on FD token; peer: %s; addr: %s; consuming: %d; "+
				"limit: %d; waiting: %d", dj.peer, dj.addr, dl.fdConsuming, dl.fdLimit, len(dl.waitingOnFd))
Jeromy's avatar
Jeromy committed
160 161 162 163
			dl.waitingOnFd = append(dl.waitingOnFd, dj)
			return
		}

164 165
		log.Debugf("[limiter] taking FD token: peer: %s; addr: %s; prev consuming: %d",
			dj.peer, dj.addr, dl.fdConsuming)
Jeromy's avatar
Jeromy committed
166 167 168 169
		// take token
		dl.fdConsuming++
	}

170 171
	log.Debugf("[limiter] executing dial; peer: %s; addr: %s; FD consuming: %d; waiting: %d",
		dj.peer, dj.addr, dl.fdConsuming, len(dl.waitingOnFd))
Jeromy's avatar
Jeromy committed
172 173 174
	go dl.executeDial(dj)
}

func (dl *dialLimiter) addCheckPeerLimit(dj *dialJob) {
	if dl.activePerPeer[dj.peer] >= dl.perPeerLimit {
177 178 179
		log.Debugf("[limiter] blocked dial waiting on peer limit; peer: %s; addr: %s; active: %d; "+
			"peer limit: %d; waiting: %d", dj.peer, dj.addr, dl.activePerPeer[dj.peer], dl.perPeerLimit,
			len(dl.waitingOnPeerLimit[dj.peer]))
Łukasz Magiera's avatar
Łukasz Magiera committed
180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195
		wlist := dl.waitingOnPeerLimit[dj.peer]
		dl.waitingOnPeerLimit[dj.peer] = append(wlist, dj)
		return
	}
	dl.activePerPeer[dj.peer]++

	dl.addCheckFdLimit(dj)
}

// AddDialJob tries to take the needed tokens for starting the given dial job.
// If it acquires all needed tokens, it immediately starts the dial, otherwise
// it will put it on the waitlist for the requested token.
func (dl *dialLimiter) AddDialJob(dj *dialJob) {
	dl.lk.Lock()
	defer dl.lk.Unlock()

196
	log.Debugf("[limiter] adding a dial job through limiter: %v", dj.addr)
Łukasz Magiera's avatar
Łukasz Magiera committed
197 198 199
	dl.addCheckPeerLimit(dj)
}

func (dl *dialLimiter) clearAllPeerDials(p peer.ID) {
Łukasz Magiera's avatar
Łukasz Magiera committed
201 202
	dl.lk.Lock()
	defer dl.lk.Unlock()
203
	delete(dl.waitingOnPeerLimit, p)
204
	log.Debugf("[limiter] clearing all peer dials: %v", p)
Łukasz Magiera's avatar
Łukasz Magiera committed
205
	// NB: the waitingOnFd list doesn't need to be cleaned out here, we will
206 207 208 209
	// remove them as we encounter them because they are 'cancelled' at this
	// point
}

// executeDial calls the dialFunc, and reports the result through the response
// channel when finished. Once the response is sent it also releases all tokens
// it held during the dial.
func (dl *dialLimiter) executeDial(j *dialJob) {
	defer dl.finishedDial(j)
Jeromy's avatar
Jeromy committed
215 216 217 218
	if j.cancelled() {
		return
	}

219 220 221 222
	dctx, cancel := context.WithTimeout(j.ctx, j.dialTimeout())
	defer cancel()

	con, err := dl.dialFunc(dctx, j.peer, j.addr)
Jeromy's avatar
Jeromy committed
223
	select {
Jeromy's avatar
Jeromy committed
224
	case j.resp <- dialResult{Conn: con, Addr: j.addr, Err: err}:
Jeromy's avatar
Jeromy committed
225
	case <-j.ctx.Done():
226 227 228
		if err == nil {
			con.Close()
		}
Jeromy's avatar
Jeromy committed
229 230
	}
}