swarm.go 12.9 KB
Newer Older
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
1 2 3
package swarm

import (
4
	"context"
Steven Allen's avatar
Steven Allen committed
5
	"errors"
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
6
	"fmt"
7
	"strings"
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
8
	"sync"
Steven Allen's avatar
Steven Allen committed
9
	"sync/atomic"
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
10 11
	"time"

12
	"github.com/libp2p/go-libp2p-core/connmgr"
13 14 15 16 17 18
	"github.com/libp2p/go-libp2p-core/metrics"
	"github.com/libp2p/go-libp2p-core/network"
	"github.com/libp2p/go-libp2p-core/peer"
	"github.com/libp2p/go-libp2p-core/peerstore"
	"github.com/libp2p/go-libp2p-core/transport"

Jeromy's avatar
Jeromy committed
19 20 21
	logging "github.com/ipfs/go-log"
	"github.com/jbenet/goprocess"
	goprocessctx "github.com/jbenet/goprocess/context"
22

23
	ma "github.com/multiformats/go-multiaddr"
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
24 25
)

26 27
// DialTimeoutLocal is the maximum duration a Dial to local network address
// is allowed to take.
Steven Allen's avatar
Steven Allen committed
28 29
// This includes the time between dialing the raw network connection,
// protocol selection as well as the handshake, if applicable.
30
var DialTimeoutLocal = 5 * time.Second
31

Steven Allen's avatar
Steven Allen committed
32
// log is the package-level logger, registered under the name "swarm2".
var log = logging.Logger("swarm2")
33

Steven Allen's avatar
Steven Allen committed
34 35
// ErrSwarmClosed is returned when one attempts to operate on a closed swarm,
// for example when a connection is registered after teardown has run.
var ErrSwarmClosed = errors.New("swarm closed")
36

Steven Allen's avatar
Steven Allen committed
37 38 39 40
// ErrAddrFiltered is returned when trying to register a connection to a
// filtered address, i.e. one that the connection gater's InterceptAddrDial
// rejects. You shouldn't see this error unless some underlying transport is
// misbehaving.
var ErrAddrFiltered = errors.New("address filtered")
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
41

42 43 44
// ErrDialTimeout is returned when a dial times out due to the global timeout.
var ErrDialTimeout = errors.New("dial timed out")

Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
45 46 47 48 49
// Swarm is a connection muxer, allowing connections to other peers to
// be opened and closed, while still using the same Chan for all
// communication. The Chan sends/receives Messages, which note the
// destination or source Peer.
type Swarm struct {
Steven Allen's avatar
Steven Allen committed
50 51 52 53
	// Close refcount. This allows us to fully wait for the swarm to be torn
	// down before continuing.
	refs sync.WaitGroup

Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
54
	local peer.ID
55
	peers peerstore.Peerstore
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
56

Steven Allen's avatar
Steven Allen committed
57 58 59 60
	conns struct {
		sync.RWMutex
		m map[peer.ID][]*Conn
	}
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
61

Steven Allen's avatar
Steven Allen committed
62 63
	listeners struct {
		sync.RWMutex
64

65 66
		ifaceListenAddres []ma.Multiaddr
		cacheEOL          time.Time
67

Steven Allen's avatar
Steven Allen committed
68 69
		m map[transport.Listener]struct{}
	}
Jeromy's avatar
Jeromy committed
70

Steven Allen's avatar
Steven Allen committed
71 72
	notifs struct {
		sync.RWMutex
73
		m map[network.Notifiee]struct{}
Steven Allen's avatar
Steven Allen committed
74
	}
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
75

Steven Allen's avatar
Steven Allen committed
76 77 78 79
	transports struct {
		sync.RWMutex
		m map[int]transport.Transport
	}
Jeromy's avatar
Jeromy committed
80

Steven Allen's avatar
Steven Allen committed
81 82 83
	// new connection and stream handlers
	connh   atomic.Value
	streamh atomic.Value
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
84

Steven Allen's avatar
Steven Allen committed
85 86 87 88
	// dialing helpers
	dsync   *DialSync
	backf   DialBackoff
	limiter *dialLimiter
89
	gater   connmgr.ConnectionGater
Jeromy's avatar
Jeromy committed
90

Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
91 92 93
	proc goprocess.Process
	ctx  context.Context
	bwc  metrics.Reporter
94 95
}

96 97 98 99 100 101 102
// NewSwarm constructs a Swarm.
//
// NOTE: go-libp2p will be moving to dependency injection soon. The variadic
// `extra` interface{} parameter facilitates the future migration. Supported
// elements are:
//  - connmgr.ConnectionGater
func NewSwarm(ctx context.Context, local peer.ID, peers peerstore.Peerstore, bwc metrics.Reporter, extra ...interface{}) *Swarm {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
103
	s := &Swarm{
104 105 106
		local: local,
		peers: peers,
		bwc:   bwc,
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
107
	}
Steven Allen's avatar
Steven Allen committed
108 109 110 111

	s.conns.m = make(map[peer.ID][]*Conn)
	s.listeners.m = make(map[transport.Listener]struct{})
	s.transports.m = make(map[int]transport.Transport)
112
	s.notifs.m = make(map[network.Notifiee]struct{})
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
113

114 115 116 117 118 119 120
	for _, i := range extra {
		switch v := i.(type) {
		case connmgr.ConnectionGater:
			s.gater = v
		}
	}

121
	s.dsync = NewDialSync(s.doDial)
Aarsh Shah's avatar
Aarsh Shah committed
122
	s.limiter = newDialLimiter(s.dialAddr, s.IsFdConsumingAddr)
123
	s.proc = goprocessctx.WithContext(ctx)
Steven Allen's avatar
Steven Allen committed
124
	s.ctx = goprocessctx.OnClosingContext(s.proc)
Will Scott's avatar
Will Scott committed
125
	s.backf.init(s.ctx)
Jeromy's avatar
Jeromy committed
126

127 128 129 130
	// Set teardown after setting the context/process so we don't start the
	// teardown process early.
	s.proc.SetTeardown(s.teardown)

Steven Allen's avatar
Steven Allen committed
131
	return s
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
132 133
}

Steven Allen's avatar
Steven Allen committed
134
func (s *Swarm) teardown() error {
135 136 137 138 139
	// Wait for the context to be canceled.
	// This allows other parts of the swarm to detect that we're shutting
	// down.
	<-s.ctx.Done()

Steven Allen's avatar
Steven Allen committed
140 141 142 143 144 145 146 147 148 149 150 151
	// Prevents new connections and/or listeners from being added to the swarm.

	s.listeners.Lock()
	listeners := s.listeners.m
	s.listeners.m = nil
	s.listeners.Unlock()

	s.conns.Lock()
	conns := s.conns.m
	s.conns.m = nil
	s.conns.Unlock()

Matt Joiner's avatar
Matt Joiner committed
152 153
	// Lots of goroutines but we might as well do this in parallel. We want to shut down as fast as
	// possible.
Steven Allen's avatar
Steven Allen committed
154 155 156 157 158 159 160

	for l := range listeners {
		go func(l transport.Listener) {
			if err := l.Close(); err != nil {
				log.Errorf("error when shutting down listener: %s", err)
			}
		}(l)
161 162
	}

Steven Allen's avatar
Steven Allen committed
163 164 165 166 167 168 169 170 171
	for _, cs := range conns {
		for _, c := range cs {
			go func(c *Conn) {
				if err := c.Close(); err != nil {
					log.Errorf("error when shutting down connection: %s", err)
				}
			}(c)
		}
	}
172

Steven Allen's avatar
Steven Allen committed
173 174
	// Wait for everything to finish.
	s.refs.Wait()
175

Steven Allen's avatar
Steven Allen committed
176
	return nil
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
177 178
}

Steven Allen's avatar
Steven Allen committed
179 180 181 182 183
// Process returns the goprocess.Process that owns the swarm's lifetime. It is
// the same process that Close closes.
func (s *Swarm) Process() goprocess.Process {
	return s.proc
}

184
func (s *Swarm) addConn(tc transport.CapableConn, dir network.Direction) (*Conn, error) {
185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204
	var (
		p    = tc.RemotePeer()
		addr = tc.RemoteMultiaddr()
	)

	if s.gater != nil {
		if allow := s.gater.InterceptAddrDial(p, addr); !allow {
			err := tc.Close()
			if err != nil {
				log.Warnf("failed to close connection with peer %s and addr %s; err: %s", p.Pretty(), addr, err)
			}
			return nil, ErrAddrFiltered
		}
	}

	stat := network.Stat{Direction: dir}
	c := &Conn{
		conn:  tc,
		swarm: s,
		stat:  stat,
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
205
	}
Jeromy's avatar
Jeromy committed
206

207 208 209 210 211 212 213 214 215 216 217 218
	// we ONLY check upgraded connections here so we can send them a Disconnect message.
	// If we do this in the Upgrader, we will not be able to do this.
	if s.gater != nil {
		if allow, _ := s.gater.InterceptUpgraded(c); !allow {
			// TODO Send disconnect with reason here
			err := tc.Close()
			if err != nil {
				log.Warnf("failed to close connection with peer %s and addr %s; err: %s", p.Pretty(), addr, err)
			}
			return nil, ErrGaterDisallowedConnection
		}
	}
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
219

Steven Allen's avatar
Steven Allen committed
220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245
	// Add the public key.
	if pk := tc.RemotePublicKey(); pk != nil {
		s.peers.AddPubKey(p, pk)
	}

	// Clear any backoffs
	s.backf.Clear(p)

	// Finally, add the peer.
	s.conns.Lock()
	// Check if we're still online
	if s.conns.m == nil {
		s.conns.Unlock()
		tc.Close()
		return nil, ErrSwarmClosed
	}

	// Wrap and register the connection.
	c.streams.m = make(map[*Stream]struct{})
	s.conns.m[p] = append(s.conns.m[p], c)

	// Add two swarm refs:
	// * One will be decremented after the close notifications fire in Conn.doClose
	// * The other will be decremented when Conn.start exits.
	s.refs.Add(2)

246 247 248
	// Take the notification lock before releasing the conns lock to block
	// Disconnect notifications until after the Connect notifications done.
	c.notifyLk.Lock()
Steven Allen's avatar
Steven Allen committed
249 250 251 252
	s.conns.Unlock()

	// We have a connection now. Cancel all other in-progress dials.
	// This should be fast, no reason to wait till later.
253 254 255
	if dir == network.DirOutbound {
		s.dsync.CancelDial(p)
	}
Steven Allen's avatar
Steven Allen committed
256

257
	s.notifyAll(func(f network.Notifiee) {
Steven Allen's avatar
Steven Allen committed
258 259
		f.Connected(s, c)
	})
260
	c.notifyLk.Unlock()
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
261

Steven Allen's avatar
Steven Allen committed
262 263 264 265 266 267 268 269 270 271
	c.start()

	// TODO: Get rid of this. We use it for identify but that happen much
	// earlier (really, inside the transport and, if not then, during the
	// notifications).
	if h := s.ConnHandler(); h != nil {
		go h(c)
	}

	return c, nil
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
272 273
}

Steven Allen's avatar
Steven Allen committed
274
// Peerstore returns this swarms internal Peerstore.
275
func (s *Swarm) Peerstore() peerstore.Peerstore {
Steven Allen's avatar
Steven Allen committed
276
	return s.peers
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
277 278 279 280 281 282 283 284 285 286 287 288
}

// Context returns the context of the swarm. This is the context NewSwarm
// derives from the swarm's process, not the context passed to NewSwarm.
func (s *Swarm) Context() context.Context {
	return s.ctx
}

// Close stops the Swarm by closing its process, and returns the error from
// that call. NewSwarm registers teardown as the process's teardown function.
func (s *Swarm) Close() error {
	return s.proc.Close()
}

Steven Allen's avatar
Steven Allen committed
289
// TODO: We probably don't need the conn handlers.
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
290 291

// SetConnHandler assigns the handler for new connections.
Steven Allen's avatar
Steven Allen committed
292
// You will rarely use this. See SetStreamHandler
293
func (s *Swarm) SetConnHandler(handler network.ConnHandler) {
Steven Allen's avatar
Steven Allen committed
294 295
	s.connh.Store(handler)
}
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
296

Steven Allen's avatar
Steven Allen committed
297
// ConnHandler gets the handler for new connections.
298 299
func (s *Swarm) ConnHandler() network.ConnHandler {
	handler, _ := s.connh.Load().(network.ConnHandler)
Steven Allen's avatar
Steven Allen committed
300
	return handler
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
301 302 303
}

// SetStreamHandler assigns the handler for new streams.
304
func (s *Swarm) SetStreamHandler(handler network.StreamHandler) {
Steven Allen's avatar
Steven Allen committed
305 306 307 308
	s.streamh.Store(handler)
}

// StreamHandler gets the handler for new streams.
309 310
func (s *Swarm) StreamHandler() network.StreamHandler {
	handler, _ := s.streamh.Load().(network.StreamHandler)
Steven Allen's avatar
Steven Allen committed
311 312 313 314 315
	return handler
}

// NewStream creates a new stream on any available connection to peer, dialing
// if necessary.
316
func (s *Swarm) NewStream(ctx context.Context, p peer.ID) (network.Stream, error) {
Steven Allen's avatar
Steven Allen committed
317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334
	log.Debugf("[%s] opening stream to peer [%s]", s.local, p)

	// Algorithm:
	// 1. Find the best connection, otherwise, dial.
	// 2. Try opening a stream.
	// 3. If the underlying connection is, in fact, closed, close the outer
	//    connection and try again. We do this in case we have a closed
	//    connection but don't notice it until we actually try to open a
	//    stream.
	//
	// Note: We only dial once.
	//
	// TODO: Try all connections even if we get an error opening a stream on
	// a non-closed connection.
	dials := 0
	for {
		c := s.bestConnToPeer(p)
		if c == nil {
335 336
			if nodial, _ := network.GetNoDial(ctx); nodial {
				return nil, network.ErrNoConn
337 338
			}

Steven Allen's avatar
Steven Allen committed
339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354
			if dials >= DialAttempts {
				return nil, errors.New("max dial attempts exceeded")
			}
			dials++

			var err error
			c, err = s.dialPeer(ctx, p)
			if err != nil {
				return nil, err
			}
		}
		s, err := c.NewStream()
		if err != nil {
			if c.conn.IsClosed() {
				continue
			}
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
355 356
			return nil, err
		}
Steven Allen's avatar
Steven Allen committed
357
		return s, nil
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
358 359 360
	}
}

Steven Allen's avatar
Steven Allen committed
361
// ConnsToPeer returns all the live connections to peer.
362
func (s *Swarm) ConnsToPeer(p peer.ID) []network.Conn {
Steven Allen's avatar
Steven Allen committed
363 364 365 366 367
	// TODO: Consider sorting the connection list best to worst. Currently,
	// it's sorted oldest to newest.
	s.conns.RLock()
	defer s.conns.RUnlock()
	conns := s.conns.m[p]
368
	output := make([]network.Conn, len(conns))
Steven Allen's avatar
Steven Allen committed
369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392
	for i, c := range conns {
		output[i] = c
	}
	return output
}

// bestConnToPeer returns the best connection to peer.
func (s *Swarm) bestConnToPeer(p peer.ID) *Conn {
	// Selects the best connection we have to the peer.
	// TODO: Prefer some transports over others. Currently, we just select
	// the newest non-closed connection with the most streams.
	s.conns.RLock()
	defer s.conns.RUnlock()

	var best *Conn
	bestLen := 0
	for _, c := range s.conns.m[p] {
		if c.conn.IsClosed() {
			// We *will* garbage collect this soon anyways.
			continue
		}
		c.streams.Lock()
		cLen := len(c.streams.m)
		c.streams.Unlock()
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
393

Steven Allen's avatar
Steven Allen committed
394 395 396 397
		if cLen >= bestLen {
			best = c
			bestLen = cLen
		}
398

Steven Allen's avatar
Steven Allen committed
399 400
	}
	return best
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
401 402
}

Steven Allen's avatar
Steven Allen committed
403 404 405
// Connectedness returns our "connectedness" state with the given peer.
//
// To check if we have an open connection, use `s.Connectedness(p) ==
406 407
// network.Connected`.
func (s *Swarm) Connectedness(p peer.ID) network.Connectedness {
Steven Allen's avatar
Steven Allen committed
408
	if s.bestConnToPeer(p) != nil {
409
		return network.Connected
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
410
	}
411
	return network.NotConnected
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
412 413
}

Steven Allen's avatar
Steven Allen committed
414
// Conns returns a slice of all connections.
415
func (s *Swarm) Conns() []network.Conn {
Steven Allen's avatar
Steven Allen committed
416 417
	s.conns.RLock()
	defer s.conns.RUnlock()
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
418

419
	conns := make([]network.Conn, 0, len(s.conns.m))
Steven Allen's avatar
Steven Allen committed
420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438
	for _, cs := range s.conns.m {
		for _, c := range cs {
			conns = append(conns, c)
		}
	}
	return conns
}

// ClosePeer closes all connections to the given peer.
func (s *Swarm) ClosePeer(p peer.ID) error {
	conns := s.ConnsToPeer(p)
	switch len(conns) {
	case 0:
		return nil
	case 1:
		return conns[0].Close()
	default:
		errCh := make(chan error)
		for _, c := range conns {
439
			go func(c network.Conn) {
Steven Allen's avatar
Steven Allen committed
440 441
				errCh <- c.Close()
			}(c)
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
442 443
		}

Steven Allen's avatar
Steven Allen committed
444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463
		var errs []string
		for _ = range conns {
			err := <-errCh
			if err != nil {
				errs = append(errs, err.Error())
			}
		}
		if len(errs) > 0 {
			return fmt.Errorf("when disconnecting from peer %s: %s", p, strings.Join(errs, ", "))
		}
		return nil
	}
}

// Peers returns a copy of the set of peers swarm is connected to.
func (s *Swarm) Peers() []peer.ID {
	s.conns.RLock()
	defer s.conns.RUnlock()
	peers := make([]peer.ID, 0, len(s.conns.m))
	for p := range s.conns.m {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
464 465
		peers = append(peers, p)
	}
Steven Allen's avatar
Steven Allen committed
466

Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
467 468 469 470 471 472 473 474
	return peers
}

// LocalPeer returns the ID of the local peer this swarm is associated with,
// as passed to NewSwarm.
func (s *Swarm) LocalPeer() peer.ID {
	return s.local
}

Steven Allen's avatar
Steven Allen committed
475 476
// Backoff returns the DialBackoff object for this swarm.
func (s *Swarm) Backoff() *DialBackoff {
Jeromy's avatar
Jeromy committed
477 478 479
	return &s.backf
}

Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
480
// notifyAll sends a signal to all Notifiees
481
func (s *Swarm) notifyAll(notify func(network.Notifiee)) {
482 483
	var wg sync.WaitGroup

Steven Allen's avatar
Steven Allen committed
484
	s.notifs.RLock()
485
	wg.Add(len(s.notifs.m))
Steven Allen's avatar
Steven Allen committed
486
	for f := range s.notifs.m {
487
		go func(f network.Notifiee) {
488 489 490
			defer wg.Done()
			notify(f)
		}(f)
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
491
	}
492 493

	wg.Wait()
Steven Allen's avatar
Steven Allen committed
494
	s.notifs.RUnlock()
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
495 496 497
}

// Notify signs up Notifiee to receive signals when events happen
498
func (s *Swarm) Notify(f network.Notifiee) {
Steven Allen's avatar
Steven Allen committed
499 500 501
	s.notifs.Lock()
	s.notifs.m[f] = struct{}{}
	s.notifs.Unlock()
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
502 503 504
}

// StopNotify unregisters Notifiee fromr receiving signals
505
func (s *Swarm) StopNotify(f network.Notifiee) {
Steven Allen's avatar
Steven Allen committed
506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530
	s.notifs.Lock()
	delete(s.notifs.m, f)
	s.notifs.Unlock()
}

func (s *Swarm) removeConn(c *Conn) {
	p := c.RemotePeer()

	s.conns.Lock()
	defer s.conns.Unlock()
	cs := s.conns.m[p]
	for i, ci := range cs {
		if ci == c {
			if len(cs) == 1 {
				delete(s.conns.m, p)
			} else {
				// NOTE: We're intentionally preserving order.
				// This way, connections to a peer are always
				// sorted oldest to newest.
				copy(cs[i:], cs[i+1:])
				cs[len(cs)-1] = nil
				s.conns.m[p] = cs[:len(cs)-1]
			}
			return
		}
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
531 532 533
	}
}

Steven Allen's avatar
Steven Allen committed
534 535 536
// String returns a string representation of Network.
func (s *Swarm) String() string {
	return fmt.Sprintf("<Swarm %s>", s.LocalPeer())
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
537 538
}

Steven Allen's avatar
Steven Allen committed
539
// Swarm is a Network.
540 541
var _ network.Network = (*Swarm)(nil)
var _ transport.TransportNetwork = (*Swarm)(nil)