// Package bitswap implements the IPFS exchange interface with the BitSwap
// bilateral exchange protocol.
package bitswap

import (
6
	"context"
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
7
	"errors"
dirkmc's avatar
dirkmc committed
8

9
	"sync"
Jeromy's avatar
Jeromy committed
10 11
	"time"

12
	delay "github.com/ipfs/go-ipfs-delay"
13

14 15 16 17 18 19 20 21 22 23 24
	bsbpm "github.com/ipfs/go-bitswap/internal/blockpresencemanager"
	decision "github.com/ipfs/go-bitswap/internal/decision"
	bsgetter "github.com/ipfs/go-bitswap/internal/getter"
	bsmq "github.com/ipfs/go-bitswap/internal/messagequeue"
	notifications "github.com/ipfs/go-bitswap/internal/notifications"
	bspm "github.com/ipfs/go-bitswap/internal/peermanager"
	bspqm "github.com/ipfs/go-bitswap/internal/providerquerymanager"
	bssession "github.com/ipfs/go-bitswap/internal/session"
	bssim "github.com/ipfs/go-bitswap/internal/sessioninterestmanager"
	bssm "github.com/ipfs/go-bitswap/internal/sessionmanager"
	bsspm "github.com/ipfs/go-bitswap/internal/sessionpeermanager"
25 26
	bsmsg "github.com/ipfs/go-bitswap/message"
	bsnet "github.com/ipfs/go-bitswap/network"
Jeromy's avatar
Jeromy committed
27 28 29 30 31 32 33 34
	blocks "github.com/ipfs/go-block-format"
	cid "github.com/ipfs/go-cid"
	blockstore "github.com/ipfs/go-ipfs-blockstore"
	exchange "github.com/ipfs/go-ipfs-exchange-interface"
	logging "github.com/ipfs/go-log"
	metrics "github.com/ipfs/go-metrics-interface"
	process "github.com/jbenet/goprocess"
	procctx "github.com/jbenet/goprocess/context"
Raúl Kripalani's avatar
Raúl Kripalani committed
35
	peer "github.com/libp2p/go-libp2p-core/peer"
36 37
)

Jeromy's avatar
Jeromy committed
38
var log = logging.Logger("bitswap")
39
var sflog = log.Desugar()
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
40

41 42
var _ exchange.SessionExchange = (*Bitswap)(nil)

Brian Tiger Chow's avatar
Brian Tiger Chow committed
43
const (
	// provideTimeout is the time budget for provide requests; these requests
	// take at _least_ two minutes at the moment.
	// NOTE(review): the code that applies this timeout is not in this part of
	// the file — confirm where it is enforced.
	provideTimeout = 3 * time.Minute

	// defaultProvSearchDelay is the provider search delay a new Bitswap
	// starts with unless the ProviderSearchDelay option replaces it.
	defaultProvSearchDelay = time.Second
)
48

Jeromy's avatar
Jeromy committed
49
var (
	// HasBlockBufferSize is the buffer size of the channel for new blocks
	// that need to be provided. They should get pulled over by the
	// provideCollector even before they are actually provided.
	// TODO: Does this need to be this large given that?
	HasBlockBufferSize = 256

	// provideKeysBufferSize is the capacity of the provideKeys channel that
	// feeds the provide workers.
	provideKeysBufferSize = 2048

	// provideWorkerMax is presumably the upper bound on concurrently running
	// provide workers — TODO confirm against the worker code.
	provideWorkerMax = 6

	// metricsBuckets are the histogram bucket boundaries (in bytes) shared by
	// the block-size metrics. The 1<<18+15 bucket is there to observe old file
	// chunks that are 1<<18 + 14 in size.
	metricsBuckets = []float64{1 << 6, 1 << 10, 1 << 14, 1 << 18, 1<<18 + 15, 1 << 22}
)
Jeromy's avatar
Jeromy committed
61

62 63 64 65 66 67 68 69 70 71 72
// Option defines the functional option type that can be used to configure
// bitswap instances. An Option receives the *Bitswap under construction and
// mutates it in place; New applies every supplied Option before the worker
// routines are started.
type Option func(*Bitswap)

// ProvideEnabled returns an Option that switches provide announcements on
// (enabled == true) or off (enabled == false) for the configured instance.
func ProvideEnabled(enabled bool) Option {
	return func(b *Bitswap) { b.provideEnabled = enabled }
}

73 74 75 76 77 78 79 80 81 82 83 84 85 86
// ProviderSearchDelay returns an Option that replaces the default provider
// search delay of the configured instance with newProvSearchDelay.
func ProviderSearchDelay(newProvSearchDelay time.Duration) Option {
	return func(b *Bitswap) { b.provSearchDelay = newProvSearchDelay }
}

// RebroadcastDelay returns an Option that replaces the default provider
// rebroadcast delay of the configured instance with newRebroadcastDelay.
func RebroadcastDelay(newRebroadcastDelay delay.D) Option {
	return func(b *Bitswap) { b.rebroadcastDelay = newRebroadcastDelay }
}

87 88 89 90 91 92 93 94 95 96 97
// SetSendDontHaves returns an Option that tells the engine how to react to a
// want-block for a block that is not in the blockstore:
// - send == true:  send a DONT_HAVE message
// - send == false: simply don't respond
// The setting is forwarded to the instance's engine when the option runs.
// This option is only used for testing.
func SetSendDontHaves(send bool) Option {
	return func(b *Bitswap) { b.engine.SetSendDontHaves(send) }
}

Brian Tiger Chow's avatar
Brian Tiger Chow committed
98 99
// New initializes a BitSwap instance that communicates over the provided
// BitSwapNetwork. This function registers the returned instance as the network
100
// delegate. Runs until context is cancelled or bitswap.Close is called.
Łukasz Magiera's avatar
Łukasz Magiera committed
101
func New(parent context.Context, network bsnet.BitSwapNetwork,
102
	bstore blockstore.Blockstore, options ...Option) exchange.Interface {
103

104 105
	// important to use provided parent context (since it may include important
	// loggable data). It's probably not a good idea to allow bitswap to be
106
	// coupled to the concerns of the ipfs daemon in this way.
107 108 109 110
	//
	// FIXME(btc) Now that bitswap manages itself using a process, it probably
	// shouldn't accept a context anymore. Clients should probably use Close()
	// exclusively. We should probably find another way to share logging data
111
	ctx, cancelFunc := context.WithCancel(parent)
112
	ctx = metrics.CtxSubScope(ctx, "bitswap")
113
	dupHist := metrics.NewCtx(ctx, "recv_dup_blocks_bytes", "Summary of duplicate"+
114
		" data blocks recived").Histogram(metricsBuckets)
115
	allHist := metrics.NewCtx(ctx, "recv_all_blocks_bytes", "Summary of all"+
116
		" data blocks recived").Histogram(metricsBuckets)
117

118 119 120
	sentHistogram := metrics.NewCtx(ctx, "sent_all_blocks_bytes", "Histogram of blocks sent by"+
		" this bitswap").Histogram(metricsBuckets)

121 122 123 124
	px := process.WithTeardown(func() error {
		return nil
	})

125 126
	// onDontHaveTimeout is called when a want-block is sent to a peer that
	// has an old version of Bitswap that doesn't support DONT_HAVE messages,
127
	// or when no response is received within a timeout.
Dirk McCormick's avatar
Dirk McCormick committed
128
	var sm *bssm.SessionManager
129
	onDontHaveTimeout := func(p peer.ID, dontHaves []cid.Cid) {
Dirk McCormick's avatar
Dirk McCormick committed
130 131
		// Simulate a message arriving with DONT_HAVEs
		sm.ReceiveFrom(ctx, p, nil, nil, dontHaves)
132
	}
133
	peerQueueFactory := func(ctx context.Context, p peer.ID) bspm.PeerQueue {
134
		return bsmq.New(ctx, p, network, onDontHaveTimeout)
135 136
	}

dirkmc's avatar
dirkmc committed
137 138 139
	sim := bssim.New()
	bpm := bsbpm.New()
	pm := bspm.New(ctx, peerQueueFactory, network.Self())
140 141
	pqm := bspqm.New(ctx, network)

142 143 144 145 146
	sessionFactory := func(
		sessctx context.Context,
		sessmgr bssession.SessionManager,
		id uint64,
		spm bssession.SessionPeerManager,
dirkmc's avatar
dirkmc committed
147 148 149
		sim *bssim.SessionInterestManager,
		pm bssession.PeerManager,
		bpm *bsbpm.BlockPresenceManager,
150
		notif notifications.PubSub,
151
		provSearchDelay time.Duration,
dirkmc's avatar
dirkmc committed
152 153
		rebroadcastDelay delay.D,
		self peer.ID) bssm.Session {
154
		return bssession.New(sessctx, sessmgr, id, spm, pqm, sim, pm, bpm, notif, provSearchDelay, rebroadcastDelay, self)
155
	}
dirkmc's avatar
dirkmc committed
156
	sessionPeerManagerFactory := func(ctx context.Context, id uint64) bssession.SessionPeerManager {
157
		return bsspm.New(id, network.ConnectionManager())
158
	}
159
	notif := notifications.New()
Dirk McCormick's avatar
Dirk McCormick committed
160
	sm = bssm.New(ctx, sessionFactory, sim, sessionPeerManagerFactory, bpm, pm, notif, network.Self())
dirkmc's avatar
dirkmc committed
161
	engine := decision.NewEngine(ctx, bstore, network.ConnectionManager(), network.Self())
162

163
	bs := &Bitswap{
164
		blockstore:       bstore,
165
		engine:           engine,
166 167 168 169
		network:          network,
		process:          px,
		newBlocks:        make(chan cid.Cid, HasBlockBufferSize),
		provideKeys:      make(chan cid.Cid, provideKeysBufferSize),
dirkmc's avatar
dirkmc committed
170
		pm:               pm,
171
		pqm:              pqm,
dirkmc's avatar
dirkmc committed
172 173
		sm:               sm,
		sim:              sim,
174
		notif:            notif,
175 176 177 178 179 180 181
		counters:         new(counters),
		dupMetric:        dupHist,
		allMetric:        allHist,
		sentHistogram:    sentHistogram,
		provideEnabled:   true,
		provSearchDelay:  defaultProvSearchDelay,
		rebroadcastDelay: delay.Fixed(time.Minute),
182 183 184 185 186
	}

	// apply functional options before starting and running bitswap
	for _, option := range options {
		option(bs)
187
	}
188

189
	bs.pqm.Startup()
Brian Tiger Chow's avatar
Brian Tiger Chow committed
190
	network.SetDelegate(bs)
191

192
	// Start up bitswaps async worker routines
193
	bs.startWorkers(ctx, px)
194
	engine.StartWorkers(ctx, px)
195 196 197 198 199

	// bind the context and process.
	// do it over here to avoid closing before all setup is done.
	go func() {
		<-px.Closing() // process closes first
200
		sm.Shutdown()
201
		cancelFunc()
202
		notif.Shutdown()
203 204 205
	}()
	procctx.CloseAfterContext(px, ctx) // parent cancelled first

206 207 208
	return bs
}

209 210
// Bitswap instances implement the bitswap protocol.
type Bitswap struct {
dirkmc's avatar
dirkmc committed
211 212
	pm *bspm.PeerManager

213 214 215
	// the provider query manager manages requests to find providers
	pqm *bspqm.ProviderQueryManager

216 217
	// the engine is the bit of logic that decides who to send which blocks to
	engine *decision.Engine
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
218

219 220
	// network delivers messages on behalf of the session
	network bsnet.BitSwapNetwork
221 222 223 224 225

	// blockstore is the local database
	// NB: ensure threadsafety
	blockstore blockstore.Blockstore

226 227 228
	// manages channels of outgoing blocks for sessions
	notif notifications.PubSub

229 230 231
	// newBlocks is a channel for newly added blocks to be provided to the
	// network.  blocks pushed down this channel get buffered and fed to the
	// provideKeys channel later on to avoid too much network activity
232
	newBlocks chan cid.Cid
233
	// provideKeys directly feeds provide workers
234
	provideKeys chan cid.Cid
235

236 237 238
	process process.Process

	// Counters for various statistics
239 240
	counterLk sync.Mutex
	counters  *counters
241 242

	// Metrics interface metrics
243 244 245
	dupMetric     metrics.Histogram
	allMetric     metrics.Histogram
	sentHistogram metrics.Histogram
Jeromy's avatar
Jeromy committed
246

dirkmc's avatar
dirkmc committed
247
	// the SessionManager routes requests to interested sessions
248
	sm *bssm.SessionManager
249

dirkmc's avatar
dirkmc committed
250 251 252 253
	// the SessionInterestManager keeps track of which sessions are interested
	// in which CIDs
	sim *bssim.SessionInterestManager

254 255
	// whether or not to make provide announcements
	provideEnabled bool
256 257 258 259 260 261

	// how long to wait before looking for providers in a session
	provSearchDelay time.Duration

	// how often to rebroadcast providing requests to find more optimized providers
	rebroadcastDelay delay.D
262 263
}

264 265 266 267 268 269 270 271 272 273
// counters holds running totals for a Bitswap instance. The Bitswap methods
// in this file update it while holding Bitswap.counterLk.
type counters struct {
	// number of blocks received in incoming messages (duplicates included)
	blocksRecvd    uint64
	// number of received blocks that the blockstore already had
	dupBlocksRecvd uint64
	// total raw-data bytes of those duplicate blocks
	dupDataRecvd   uint64
	// presumably the number of blocks sent to peers — updated outside this
	// part of the file, TODO confirm
	blocksSent     uint64
	// presumably the total bytes of block data sent — updated outside this
	// part of the file, TODO confirm
	dataSent       uint64
	// total raw-data bytes of all received blocks
	dataRecvd      uint64
	// number of messages handed to ReceiveMessage
	messagesRecvd  uint64
}

274
// GetBlock attempts to retrieve a particular block from peers within the
275
// deadline enforced by the context.
276
func (bs *Bitswap) GetBlock(parent context.Context, k cid.Cid) (blocks.Block, error) {
277
	return bsgetter.SyncGetBlock(parent, k, bs.GetBlocks)
278 279
}

280 281
// WantlistForPeer returns the currently understood list of blocks requested by a
// given peer.
282 283
func (bs *Bitswap) WantlistForPeer(p peer.ID) []cid.Cid {
	var out []cid.Cid
284
	for _, e := range bs.engine.WantlistForPeer(p) {
285
		out = append(out, e.Cid)
286 287 288 289
	}
	return out
}

290 291
// LedgerForPeer returns aggregated data about blocks swapped and communication
// with a given peer.
292 293 294 295
func (bs *Bitswap) LedgerForPeer(p peer.ID) *decision.Receipt {
	return bs.engine.LedgerForPeer(p)
}

296 297 298 299 300 301 302
// GetBlocks returns a channel where the caller may receive blocks that
// correspond to the provided |keys|. Returns an error if BitSwap is unable to
// begin this request within the deadline enforced by the context.
//
// NB: Your request remains open until the context expires. To conserve
// resources, provide a context with a reasonably short deadline (ie. not one
// that lasts throughout the lifetime of the server)
303
func (bs *Bitswap) GetBlocks(ctx context.Context, keys []cid.Cid) (<-chan blocks.Block, error) {
304
	session := bs.sm.NewSession(ctx, bs.provSearchDelay, bs.rebroadcastDelay)
305
	return session.GetBlocks(ctx, keys)
Jeromy's avatar
Jeromy committed
306 307
}

Łukasz Magiera's avatar
Łukasz Magiera committed
308
// HasBlock announces the existence of a block to this bitswap service. The
309
// service will potentially notify its peers.
310
func (bs *Bitswap) HasBlock(blk blocks.Block) error {
dirkmc's avatar
dirkmc committed
311
	return bs.receiveBlocksFrom(context.Background(), "", []blocks.Block{blk}, nil, nil)
312 313 314 315 316 317
}

// TODO: Some of this stuff really only needs to be done when adding a block
// from the user, not when receiving it from the network.
// In case you run `git blame` on this comment, I'll save you some time: ask
// @whyrusleeping, I don't know the answers you seek.
dirkmc's avatar
dirkmc committed
318
func (bs *Bitswap) receiveBlocksFrom(ctx context.Context, from peer.ID, blks []blocks.Block, haves []cid.Cid, dontHaves []cid.Cid) error {
319 320 321 322 323
	select {
	case <-bs.process.Closing():
		return errors.New("bitswap is closed")
	default:
	}
324

325 326 327 328
	wanted := blks

	// If blocks came from the network
	if from != "" {
dirkmc's avatar
dirkmc committed
329 330 331 332
		var notWanted []blocks.Block
		wanted, notWanted = bs.sim.SplitWantedUnwanted(blks)
		for _, b := range notWanted {
			log.Debugf("[recv] block not in wantlist; cid=%s, peer=%s", b.Cid(), from)
333 334 335 336
		}
	}

	// Put wanted blocks into blockstore
dirkmc's avatar
dirkmc committed
337 338 339 340 341 342
	if len(wanted) > 0 {
		err := bs.blockstore.PutMany(wanted)
		if err != nil {
			log.Errorf("Error writing %d blocks to datastore: %s", len(wanted), err)
			return err
		}
343
	}
344

345 346 347 348 349
	// NOTE: There exists the possiblity for a race condition here.  If a user
	// creates a node, then adds it to the dagservice while another goroutine
	// is waiting on a GetBlock for that object, they will receive a reference
	// to the same node. We should address this soon, but i'm not going to do
	// it now as it requires more thought and isnt causing immediate problems.
Jeromy's avatar
Jeromy committed
350

351 352 353 354 355
	allKs := make([]cid.Cid, 0, len(blks))
	for _, b := range blks {
		allKs = append(allKs, b.Cid())
	}

356 357 358 359 360 361 362
	// If the message came from the network
	if from != "" {
		// Inform the PeerManager so that we can calculate per-peer latency
		combined := make([]cid.Cid, 0, len(allKs)+len(haves)+len(dontHaves))
		combined = append(combined, allKs...)
		combined = append(combined, haves...)
		combined = append(combined, dontHaves...)
Dirk McCormick's avatar
Dirk McCormick committed
363
		bs.pm.ResponseReceived(from, combined)
364 365
	}

366
	// Send all block keys (including duplicates) to any sessions that want them.
367
	// (The duplicates are needed by sessions for accounting purposes)
Dirk McCormick's avatar
Dirk McCormick committed
368
	bs.sm.ReceiveFrom(ctx, from, allKs, haves, dontHaves)
369

dirkmc's avatar
dirkmc committed
370 371
	// Send wanted blocks to decision engine
	bs.engine.ReceiveFrom(from, wanted, haves)
372

373
	// Publish the block to any Bitswap clients that had requested blocks.
dirkmc's avatar
dirkmc committed
374
	// (the sessions use this pubsub mechanism to inform clients of incoming
375 376 377 378 379
	// blocks)
	for _, b := range wanted {
		bs.notif.Publish(b)
	}

380
	// If the reprovider is enabled, send wanted blocks to reprovider
381
	if bs.provideEnabled {
dirkmc's avatar
dirkmc committed
382
		for _, blk := range wanted {
383
			select {
dirkmc's avatar
dirkmc committed
384
			case bs.newBlocks <- blk.Cid():
385 386 387 388
				// send block off to be reprovided
			case <-bs.process.Closing():
				return bs.process.Close()
			}
389
		}
390
	}
391

392 393
	if from != "" {
		for _, b := range wanted {
394
			log.Debugw("Bitswap.GetBlockRequest.End", "cid", b.Cid())
395 396 397
		}
	}

398
	return nil
399 400
}

401 402
// ReceiveMessage is called by the network interface when a new message is
// received.
403
func (bs *Bitswap) ReceiveMessage(ctx context.Context, p peer.ID, incoming bsmsg.BitSwapMessage) {
Steven Allen's avatar
Steven Allen committed
404 405 406
	bs.counterLk.Lock()
	bs.counters.messagesRecvd++
	bs.counterLk.Unlock()
Jeromy's avatar
Jeromy committed
407

Jeromy's avatar
Jeromy committed
408 409
	// This call records changes to wantlists, blocks received,
	// and number of bytes transfered.
410
	bs.engine.MessageReceived(ctx, p, incoming)
Jeromy's avatar
Jeromy committed
411 412
	// TODO: this is bad, and could be easily abused.
	// Should only track *useful* messages in ledger
413

414 415
	iblocks := incoming.Blocks()

dirkmc's avatar
dirkmc committed
416 417 418 419 420
	if len(iblocks) > 0 {
		bs.updateReceiveCounters(iblocks)
		for _, b := range iblocks {
			log.Debugf("[recv] block; cid=%s, peer=%s", b.Cid(), p)
		}
421
	}
422

dirkmc's avatar
dirkmc committed
423 424 425 426 427 428
	haves := incoming.Haves()
	dontHaves := incoming.DontHaves()
	if len(iblocks) > 0 || len(haves) > 0 || len(dontHaves) > 0 {
		// Process blocks
		err := bs.receiveBlocksFrom(ctx, p, iblocks, haves, dontHaves)
		if err != nil {
429
			log.Warnf("ReceiveMessage recvBlockFrom error: %s", err)
dirkmc's avatar
dirkmc committed
430 431
			return
		}
432
	}
433 434 435 436 437 438 439
}

func (bs *Bitswap) updateReceiveCounters(blocks []blocks.Block) {
	// Check which blocks are in the datastore
	// (Note: any errors from the blockstore are simply logged out in
	// blockstoreHas())
	blocksHas := bs.blockstoreHas(blocks)
440

441 442 443
	bs.counterLk.Lock()
	defer bs.counterLk.Unlock()

444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461
	// Do some accounting for each block
	for i, b := range blocks {
		has := blocksHas[i]

		blkLen := len(b.RawData())
		bs.allMetric.Observe(float64(blkLen))
		if has {
			bs.dupMetric.Observe(float64(blkLen))
		}

		c := bs.counters

		c.blocksRecvd++
		c.dataRecvd += uint64(blkLen)
		if has {
			c.dupBlocksRecvd++
			c.dupDataRecvd += uint64(blkLen)
		}
462 463 464
	}
}

465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487
// blockstoreHas reports, for each block in blks, whether the blockstore
// already contains it. The lookups run concurrently, one goroutine per block,
// and the result slice is index-aligned with blks. A lookup error is logged
// and that block is reported as not present.
func (bs *Bitswap) blockstoreHas(blks []blocks.Block) []bool {
	// Every entry starts out false, which is also the answer on error.
	res := make([]bool, len(blks))

	var wg sync.WaitGroup
	wg.Add(len(blks))
	for idx, blk := range blks {
		go func(idx int, blk blocks.Block) {
			defer wg.Done()

			has, err := bs.blockstore.Has(blk.Cid())
			if err != nil {
				log.Infof("blockstore.Has error: %s", err)
				return
			}
			res[idx] = has
		}(idx, blk)
	}
	wg.Wait()

	return res
}

488 489
// PeerConnected is called by the network interface
// when a peer initiates a new connection to bitswap.
490
func (bs *Bitswap) PeerConnected(p peer.ID) {
Dirk McCormick's avatar
Dirk McCormick committed
491
	bs.pm.Connected(p)
492
	bs.engine.PeerConnected(p)
493 494
}

495 496
// PeerDisconnected is called by the network interface when a peer
// closes a connection
497
func (bs *Bitswap) PeerDisconnected(p peer.ID) {
Dirk McCormick's avatar
Dirk McCormick committed
498
	bs.pm.Disconnected(p)
499
	bs.engine.PeerDisconnected(p)
500 501
}

502 503
// ReceiveError is called by the network interface when an error happens
// at the network layer. Currently just logs error.
504
func (bs *Bitswap) ReceiveError(err error) {
505
	log.Infof("Bitswap ReceiveError: %s", err)
506 507
	// TODO log the network error
	// TODO bubble the network error up to the parent context/error logger
508 509
}

510
// Close is called to shutdown Bitswap
511
func (bs *Bitswap) Close() error {
512
	return bs.process.Close()
513
}
514

515 516
// GetWantlist returns the current local wantlist (both want-blocks and
// want-haves).
517
func (bs *Bitswap) GetWantlist() []cid.Cid {
dirkmc's avatar
dirkmc committed
518 519 520
	return bs.pm.CurrentWants()
}

521 522 523 524 525
// GetWantBlocks returns the current list of want-blocks, as tracked by the
// peer manager.
func (bs *Bitswap) GetWantBlocks() []cid.Cid {
	wantBlocks := bs.pm.CurrentWantBlocks()
	return wantBlocks
}

dirkmc's avatar
dirkmc committed
526 527 528
// GetWantHaves returns the current list of want-haves, as tracked by the peer
// manager.
func (bs *Bitswap) GetWantHaves() []cid.Cid {
	wantHaves := bs.pm.CurrentWantHaves()
	return wantHaves
}
530

531
// IsOnline is needed to match go-ipfs-exchange-interface
532 533 534
func (bs *Bitswap) IsOnline() bool {
	return true
}
535

536 537 538 539 540 541
// NewSession generates a new Bitswap session. You should use this, rather
// that calling Bitswap.GetBlocks, any time you intend to do several related
// block requests in a row. The session returned will have it's own GetBlocks
// method, but the session will use the fact that the requests are related to
// be more efficient in its requests to peers. If you are using a session
// from go-blockservice, it will create a bitswap session automatically.
542
func (bs *Bitswap) NewSession(ctx context.Context) exchange.Fetcher {
543
	return bs.sm.NewSession(ctx, bs.provSearchDelay, bs.rebroadcastDelay)
544
}