query.go 14.2 KB
Newer Older
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
1 2 3
package dht

import (
Jeromy's avatar
Jeromy committed
4
	"context"
Steven Allen's avatar
Steven Allen committed
5
	"errors"
Adin Schmahmann's avatar
Adin Schmahmann committed
6
	"fmt"
7
	"math"
8
	"sync"
Aarsh Shah's avatar
Aarsh Shah committed
9
	"time"
10 11

	"github.com/google/uuid"
Adin Schmahmann's avatar
Adin Schmahmann committed
12

13 14
	"github.com/libp2p/go-libp2p-core/network"
	"github.com/libp2p/go-libp2p-core/peer"
15
	pstore "github.com/libp2p/go-libp2p-core/peerstore"
Adin Schmahmann's avatar
Adin Schmahmann committed
16
	"github.com/libp2p/go-libp2p-core/routing"
17

Adin Schmahmann's avatar
Adin Schmahmann committed
18
	"github.com/libp2p/go-libp2p-kad-dht/qpeerset"
19
	kb "github.com/libp2p/go-libp2p-kbucket"
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
20 21
)

Steven Allen's avatar
Steven Allen committed
22 23 24
// ErrNoPeersQueried is returned when we failed to connect to any peers.
var ErrNoPeersQueried = errors.New("failed to query any peers")

Adin Schmahmann's avatar
Adin Schmahmann committed
25
type queryFn func(context.Context, peer.ID) ([]*peer.AddrInfo, error)
Adin Schmahmann's avatar
Adin Schmahmann committed
26
type stopFn func() bool
27

Aarsh Shah's avatar
Aarsh Shah committed
28
// query represents a single DHT query.
Adin Schmahmann's avatar
Adin Schmahmann committed
29
type query struct {
30 31 32 33 34 35
	// unique identifier for the lookup instance
	id uuid.UUID

	// target key for the lookup
	key string

36 37
	// the query context.
	ctx context.Context
Adin Schmahmann's avatar
Adin Schmahmann committed
38

39
	// the cancellation function for the query context.
Adin Schmahmann's avatar
Adin Schmahmann committed
40
	cancel context.CancelFunc
41

Adin Schmahmann's avatar
Adin Schmahmann committed
42
	dht *IpfsDHT
Jeromy's avatar
Jeromy committed
43

Adin Schmahmann's avatar
Adin Schmahmann committed
44 45 46
	// seedPeers is the set of peers that seed the query
	seedPeers []peer.ID

47 48 49
	// peerTimes contains the duration of each successful query to a peer
	peerTimes map[peer.ID]time.Duration

Adin Schmahmann's avatar
Adin Schmahmann committed
50 51 52 53 54 55
	// queryPeers is the set of peers known by this query and their respective states.
	queryPeers *qpeerset.QueryPeerset

	// terminated is set when the first worker thread encounters the termination condition.
	// Its role is to make sure that once termination is determined, it is sticky.
	terminated bool
56

57 58 59
	// waitGroup ensures lookup does not end until all query goroutines complete.
	waitGroup sync.WaitGroup

60 61 62 63 64
	// the function that will be used to query a single peer.
	queryFn queryFn

	// stopFn is used to determine if we should stop the WHOLE disjoint query.
	stopFn stopFn
65 66
}

Adin Schmahmann's avatar
Adin Schmahmann committed
67
type lookupWithFollowupResult struct {
Aarsh Shah's avatar
Aarsh Shah committed
68 69
	peers []peer.ID            // the top K not unreachable peers at the end of the query
	state []qpeerset.PeerState // the peer states at the end of the query
Adin Schmahmann's avatar
Adin Schmahmann committed
70

Adin Schmahmann's avatar
Adin Schmahmann committed
71 72 73 74 75 76 77 78 79 80 81 82
	// indicates that neither the lookup nor the followup has been prematurely terminated by an external condition such
	// as context cancellation or the stop function being called.
	completed bool
}

// runLookupWithFollowup executes the lookup on the target using the given query function and stopping when either the
// context is cancelled or the stop function returns true. Note: if the stop function is not sticky, i.e. it does not
// return true every time after the first time it returns true, it is not guaranteed to cause a stop to occur just
// because it momentarily returns true.
//
// After the lookup is complete the query function is run (unless stopped) against all of the top K peers from the
// lookup that have not already been successfully queried.
Aarsh Shah's avatar
Aarsh Shah committed
83
func (dht *IpfsDHT) runLookupWithFollowup(ctx context.Context, target string, queryFn queryFn, stopFn stopFn) (*lookupWithFollowupResult, error) {
Adin Schmahmann's avatar
Adin Schmahmann committed
84
	// run the query
Aarsh Shah's avatar
Aarsh Shah committed
85
	lookupRes, err := dht.runQuery(ctx, target, queryFn, stopFn)
Adin Schmahmann's avatar
Adin Schmahmann committed
86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112
	if err != nil {
		return nil, err
	}

	// query all of the top K peers we've either Heard about or have outstanding queries we're Waiting on.
	// This ensures that all of the top K results have been queried which adds to resiliency against churn for query
	// functions that carry state (e.g. FindProviders and GetValue) as well as establish connections that are needed
	// by stateless query functions (e.g. GetClosestPeers and therefore Provide and PutValue)
	queryPeers := make([]peer.ID, 0, len(lookupRes.peers))
	for i, p := range lookupRes.peers {
		if state := lookupRes.state[i]; state == qpeerset.PeerHeard || state == qpeerset.PeerWaiting {
			queryPeers = append(queryPeers, p)
		}
	}

	if len(queryPeers) == 0 {
		return lookupRes, nil
	}

	// return if the lookup has been externally stopped
	if ctx.Err() != nil || stopFn() {
		lookupRes.completed = false
		return lookupRes, nil
	}

	doneCh := make(chan struct{}, len(queryPeers))
	followUpCtx, cancelFollowUp := context.WithCancel(ctx)
113
	defer cancelFollowUp()
Adin Schmahmann's avatar
Adin Schmahmann committed
114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142
	for _, p := range queryPeers {
		qp := p
		go func() {
			_, _ = queryFn(followUpCtx, qp)
			doneCh <- struct{}{}
		}()
	}

	// wait for all queries to complete before returning, aborting ongoing queries if we've been externally stopped
processFollowUp:
	for i := 0; i < len(queryPeers); i++ {
		select {
		case <-doneCh:
			if stopFn() {
				cancelFollowUp()
				if i < len(queryPeers)-1 {
					lookupRes.completed = false
				}
				break processFollowUp
			}
		case <-ctx.Done():
			lookupRes.completed = false
			break processFollowUp
		}
	}

	return lookupRes, nil
}

Aarsh Shah's avatar
Aarsh Shah committed
143
func (dht *IpfsDHT) runQuery(ctx context.Context, target string, queryFn queryFn, stopFn stopFn) (*lookupWithFollowupResult, error) {
144
	// pick the K closest peers to the key in our Routing table and shuffle them.
Adin Schmahmann's avatar
Adin Schmahmann committed
145 146
	targetKadID := kb.ConvertKey(target)
	seedPeers := dht.routingTable.NearestPeers(targetKadID, dht.bucketSize)
147 148 149 150 151 152 153
	if len(seedPeers) == 0 {
		routing.PublishQueryEvent(ctx, &routing.QueryEvent{
			Type:  routing.QueryError,
			Extra: kb.ErrLookupFailure.Error(),
		})
		return nil, kb.ErrLookupFailure
	}
Adin Schmahmann's avatar
Adin Schmahmann committed
154

Aarsh Shah's avatar
Aarsh Shah committed
155
	q := &query{
156 157
		id:         uuid.New(),
		key:        target,
158
		ctx:        ctx,
Aarsh Shah's avatar
Aarsh Shah committed
159 160 161
		dht:        dht,
		queryPeers: qpeerset.NewQueryPeerset(target),
		seedPeers:  seedPeers,
162
		peerTimes:  make(map[peer.ID]time.Duration),
Aarsh Shah's avatar
Aarsh Shah committed
163 164 165
		terminated: false,
		queryFn:    queryFn,
		stopFn:     stopFn,
166 167
	}

Aarsh Shah's avatar
Aarsh Shah committed
168
	// run the query
169 170 171 172 173
	q.run()

	if ctx.Err() == nil {
		q.recordValuablePeers()
	}
174

Aarsh Shah's avatar
Aarsh Shah committed
175
	res := q.constructLookupResult(targetKadID)
Adin Schmahmann's avatar
Adin Schmahmann committed
176
	return res, nil
177 178
}

Aarsh Shah's avatar
Aarsh Shah committed
179 180 181
// recordPeerIsValuable stamps p in the routing table with the current time as
// its last successful outbound query.
func (q *query) recordPeerIsValuable(p peer.ID) {
	now := time.Now()
	q.dht.routingTable.UpdateLastSuccessfulOutboundQuery(p, now)
}
182 183

func (q *query) recordValuablePeers() {
184 185 186 187 188 189 190 191 192 193 194 195 196 197
	// Valuable peers algorithm:
	// Label the seed peer that responded to a query in the shortest amount of time as the "most valuable peer" (MVP)
	// Each seed peer that responded to a query within some range (i.e. 2x) of the MVP's time is a valuable peer
	// Mark the MVP and all the other valuable peers as valuable
	mvpDuration := time.Duration(math.MaxInt64)
	for _, p := range q.seedPeers {
		if queryTime, ok := q.peerTimes[p]; ok && queryTime < mvpDuration {
			mvpDuration = queryTime
		}
	}

	for _, p := range q.seedPeers {
		if queryTime, ok := q.peerTimes[p]; ok && queryTime < mvpDuration*2 {
			q.recordPeerIsValuable(p)
198 199 200 201
		}
	}
}

Adin Schmahmann's avatar
Adin Schmahmann committed
202
// constructLookupResult takes the query information and uses it to construct the lookup result
Aarsh Shah's avatar
Aarsh Shah committed
203 204
func (q *query) constructLookupResult(target kb.ID) *lookupWithFollowupResult {
	// determine if the query terminated early
Adin Schmahmann's avatar
Adin Schmahmann committed
205
	completed := true
Aarsh Shah's avatar
Aarsh Shah committed
206

207 208 209 210
	// Lookup and starvation are both valid ways for a lookup to complete. (Starvation does not imply failure.)
	// Lookup termination (as defined in isLookupTermination) is not possible in small networks.
	// Starvation is a successful query termination in small networks.
	if !(q.isLookupTermination() || q.isStarvationTermination()) {
Aarsh Shah's avatar
Aarsh Shah committed
211
		completed = false
Adin Schmahmann's avatar
Adin Schmahmann committed
212
	}
213

Aarsh Shah's avatar
Aarsh Shah committed
214
	// extract the top K not unreachable peers
Adin Schmahmann's avatar
Adin Schmahmann committed
215 216
	var peers []peer.ID
	peerState := make(map[peer.ID]qpeerset.PeerState)
Aarsh Shah's avatar
Aarsh Shah committed
217 218 219 220 221
	qp := q.queryPeers.GetClosestNotUnreachable(q.dht.bucketSize)
	for _, p := range qp {
		state := q.queryPeers.GetState(p)
		peerState[p] = state
		peers = append(peers, p)
222 223
	}

Adin Schmahmann's avatar
Adin Schmahmann committed
224 225
	// get the top K overall peers
	sortedPeers := kb.SortClosestPeers(peers, target)
Aarsh Shah's avatar
Aarsh Shah committed
226 227
	if len(sortedPeers) > q.dht.bucketSize {
		sortedPeers = sortedPeers[:q.dht.bucketSize]
228 229
	}

Aarsh Shah's avatar
Aarsh Shah committed
230
	// return the top K not unreachable peers as well as their states at the end of the query
Adin Schmahmann's avatar
Adin Schmahmann committed
231 232 233 234 235 236 237 238 239
	res := &lookupWithFollowupResult{
		peers:     sortedPeers,
		state:     make([]qpeerset.PeerState, len(sortedPeers)),
		completed: completed,
	}

	for i, p := range sortedPeers {
		res.state[i] = peerState[p]
	}
240 241

	return res
Adin Schmahmann's avatar
Adin Schmahmann committed
242
}
243

Adin Schmahmann's avatar
Adin Schmahmann committed
244
type queryUpdate struct {
245 246 247 248 249
	cause         peer.ID
	heard         []peer.ID
	queried       []peer.ID
	unreachable   []peer.ID
	queryDuration time.Duration
Adin Schmahmann's avatar
Adin Schmahmann committed
250
}
251

252
func (q *query) run() {
Adin Schmahmann's avatar
Adin Schmahmann committed
253 254
	pathCtx, cancelPath := context.WithCancel(q.ctx)
	defer cancelPath()
255

Adin Schmahmann's avatar
Adin Schmahmann committed
256
	alpha := q.dht.alpha
257

Adin Schmahmann's avatar
Adin Schmahmann committed
258
	ch := make(chan *queryUpdate, alpha)
259
	ch <- &queryUpdate{cause: q.dht.self, heard: q.seedPeers}
260

261 262
	// return only once all outstanding queries have completed.
	defer q.waitGroup.Wait()
Adin Schmahmann's avatar
Adin Schmahmann committed
263
	for {
264
		var cause peer.ID
Adin Schmahmann's avatar
Adin Schmahmann committed
265 266
		select {
		case update := <-ch:
267 268
			q.updateState(pathCtx, update)
			cause = update.cause
Adin Schmahmann's avatar
Adin Schmahmann committed
269
		case <-pathCtx.Done():
270
			q.terminate(pathCtx, cancelPath, LookupCancelled)
Adin Schmahmann's avatar
Adin Schmahmann committed
271 272
		}

Adin Schmahmann's avatar
Adin Schmahmann committed
273
		// termination is triggered on end-of-lookup conditions or starvation of unused peers
274 275 276
		if ready, reason := q.isReadyToTerminate(); ready {
			q.terminate(pathCtx, cancelPath, reason)
		}
Adin Schmahmann's avatar
Adin Schmahmann committed
277

278 279
		if q.terminated {
			return
Adin Schmahmann's avatar
Adin Schmahmann committed
280 281 282 283 284 285 286 287
		}

		// if all "threads" are busy, wait until someone finishes
		if q.queryPeers.NumWaiting() >= alpha {
			continue
		}

		// spawn new queries, up to the parallelism allowance
288 289 290 291 292
		// calculate the maximum number of queries we could be spawning.
		// Note: NumWaiting will be updated in spawnQuery
		maxNumQueriesToSpawn := alpha - q.queryPeers.NumWaiting()
		// try spawning the queries, if there are no available peers to query then we won't spawn them
		for j := 0; j < maxNumQueriesToSpawn; j++ {
293
			q.spawnQuery(pathCtx, cause, ch)
Adin Schmahmann's avatar
Adin Schmahmann committed
294 295 296 297
		}
	}
}

298 299
// spawnQuery starts one query, if an available heard peer is found
func (q *query) spawnQuery(ctx context.Context, cause peer.ID, ch chan<- *queryUpdate) {
Adin Schmahmann's avatar
Adin Schmahmann committed
300 301 302
	if peers := q.queryPeers.GetSortedHeard(); len(peers) == 0 {
		return
	} else {
303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319
		PublishLookupEvent(ctx,
			NewLookupEvent(
				q.dht.self,
				q.id,
				q.key,
				NewLookupUpdateEvent(
					cause,
					q.queryPeers.GetReferrer(peers[0]),
					nil,                 // heard
					[]peer.ID{peers[0]}, // waiting
					nil,                 // queried
					nil,                 // unreachable
				),
				nil,
				nil,
			),
		)
Adin Schmahmann's avatar
Adin Schmahmann committed
320
		q.queryPeers.SetState(peers[0], qpeerset.PeerWaiting)
321 322
		q.waitGroup.Add(1)
		go q.queryPeer(ctx, ch, peers[0])
Adin Schmahmann's avatar
Adin Schmahmann committed
323 324 325
	}
}

326
func (q *query) isReadyToTerminate() (bool, LookupTerminationReason) {
Adin Schmahmann's avatar
Adin Schmahmann committed
327 328
	// give the application logic a chance to terminate
	if q.stopFn() {
329
		return true, LookupStopped
Adin Schmahmann's avatar
Adin Schmahmann committed
330 331
	}
	if q.isStarvationTermination() {
332
		return true, LookupStarvation
Adin Schmahmann's avatar
Adin Schmahmann committed
333 334
	}
	if q.isLookupTermination() {
335
		return true, LookupCompleted
Adin Schmahmann's avatar
Adin Schmahmann committed
336
	}
337
	return false, -1
Adin Schmahmann's avatar
Adin Schmahmann committed
338 339 340 341 342 343 344 345 346 347
}

// From the set of all nodes that are not unreachable,
// if the closest beta nodes are all queried, the lookup can terminate.
func (q *query) isLookupTermination() bool {
	var peers []peer.ID
	peers = q.queryPeers.GetClosestNotUnreachable(q.dht.beta)
	for _, p := range peers {
		if q.queryPeers.GetState(p) != qpeerset.PeerQueried {
			return false
Adin Schmahmann's avatar
Adin Schmahmann committed
348
		}
349
	}
Adin Schmahmann's avatar
Adin Schmahmann committed
350 351 352 353 354
	return true
}

func (q *query) isStarvationTermination() bool {
	return q.queryPeers.NumHeard() == 0 && q.queryPeers.NumWaiting() == 0
355 356
}

357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373
func (q *query) terminate(ctx context.Context, cancel context.CancelFunc, reason LookupTerminationReason) {
	if q.terminated {
		return
	} else {
		PublishLookupEvent(ctx,
			NewLookupEvent(
				q.dht.self,
				q.id,
				q.key,
				nil,
				nil,
				NewLookupTerminateEvent(reason),
			),
		)
		cancel() // abort outstanding queries
		q.terminated = true
	}
374 375
}

Adin Schmahmann's avatar
Adin Schmahmann committed
376 377
// queryPeer queries a single peer and reports its findings on the channel.
// queryPeer does not access the query state in queryPeers!
378 379 380
func (q *query) queryPeer(ctx context.Context, ch chan<- *queryUpdate, p peer.ID) {
	defer q.waitGroup.Done()
	dialCtx, queryCtx := ctx, ctx
Adin Schmahmann's avatar
Adin Schmahmann committed
381

382
	startQuery := time.Now()
383
	// dial the peer
Adin Schmahmann's avatar
Adin Schmahmann committed
384
	if err := q.dht.dialPeer(dialCtx, p); err != nil {
Aarsh Shah's avatar
Aarsh Shah committed
385 386 387 388
		// remove the peer if there was a dial failure..but not because of a context cancellation
		if dialCtx.Err() == nil {
			q.dht.peerStoppedDHT(q.dht.ctx, p)
		}
389
		ch <- &queryUpdate{cause: p, unreachable: []peer.ID{p}}
Adin Schmahmann's avatar
Adin Schmahmann committed
390
		return
Adin Schmahmann's avatar
Adin Schmahmann committed
391
	}
392 393

	// send query RPC to the remote peer
Adin Schmahmann's avatar
Adin Schmahmann committed
394 395
	newPeers, err := q.queryFn(queryCtx, p)
	if err != nil {
Aarsh Shah's avatar
Aarsh Shah committed
396 397 398
		if queryCtx.Err() == nil {
			q.dht.peerStoppedDHT(q.dht.ctx, p)
		}
399
		ch <- &queryUpdate{cause: p, unreachable: []peer.ID{p}}
Adin Schmahmann's avatar
Adin Schmahmann committed
400
		return
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
401
	}
402

403 404
	queryDuration := time.Since(startQuery)

Aarsh Shah's avatar
Aarsh Shah committed
405 406 407
	// query successful, try to add to RT
	q.dht.peerFound(q.dht.ctx, p, true)

Adin Schmahmann's avatar
Adin Schmahmann committed
408 409
	// process new peers
	saw := []peer.ID{}
Adin Schmahmann's avatar
Adin Schmahmann committed
410 411 412 413 414
	for _, next := range newPeers {
		if next.ID == q.dht.self { // don't add self.
			logger.Debugf("PEERS CLOSER -- worker for: %v found self", p)
			continue
		}
415

416 417 418 419
		// add any other know addresses for the candidate peer.
		curInfo := q.dht.peerstore.PeerInfo(next.ID)
		next.Addrs = append(next.Addrs, curInfo.Addrs...)

Adin Schmahmann's avatar
Adin Schmahmann committed
420
		// add their addresses to the dialer's peerstore
421 422 423 424
		if q.dht.queryPeerFilter(q.dht, *next) {
			q.dht.peerstore.AddAddrs(next.ID, next.Addrs, pstore.TempAddrTTL)
			saw = append(saw, next.ID)
		}
425
	}
Adin Schmahmann's avatar
Adin Schmahmann committed
426

427
	ch <- &queryUpdate{cause: p, heard: saw, queried: []peer.ID{p}, queryDuration: queryDuration}
Adin Schmahmann's avatar
Adin Schmahmann committed
428
}
429

430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451
func (q *query) updateState(ctx context.Context, up *queryUpdate) {
	if q.terminated {
		panic("update should not be invoked after the logical lookup termination")
	}
	PublishLookupEvent(ctx,
		NewLookupEvent(
			q.dht.self,
			q.id,
			q.key,
			nil,
			NewLookupUpdateEvent(
				up.cause,
				up.cause,
				up.heard,       // heard
				nil,            // waiting
				up.queried,     // queried
				up.unreachable, // unreachable
			),
			nil,
		),
	)
	for _, p := range up.heard {
Adin Schmahmann's avatar
Adin Schmahmann committed
452 453 454
		if p == q.dht.self { // don't add self.
			continue
		}
455
		q.queryPeers.TryAdd(p, up.cause)
Adin Schmahmann's avatar
Adin Schmahmann committed
456 457 458 459 460 461 462
	}
	for _, p := range up.queried {
		if p == q.dht.self { // don't add self.
			continue
		}
		if st := q.queryPeers.GetState(p); st == qpeerset.PeerWaiting {
			q.queryPeers.SetState(p, qpeerset.PeerQueried)
463
			q.peerTimes[p] = up.queryDuration
Adin Schmahmann's avatar
Adin Schmahmann committed
464 465 466 467 468 469 470 471 472 473 474 475 476
		} else {
			panic(fmt.Errorf("kademlia protocol error: tried to transition to the queried state from state %v", st))
		}
	}
	for _, p := range up.unreachable {
		if p == q.dht.self { // don't add self.
			continue
		}
		if st := q.queryPeers.GetState(p); st == qpeerset.PeerWaiting {
			q.queryPeers.SetState(p, qpeerset.PeerUnreachable)
		} else {
			panic(fmt.Errorf("kademlia protocol error: tried to transition to the unreachable state from state %v", st))
		}
477
	}
478
}
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
479

Adin Schmahmann's avatar
Adin Schmahmann committed
480
func (dht *IpfsDHT) dialPeer(ctx context.Context, p peer.ID) error {
481
	// short-circuit if we're already connected.
Adin Schmahmann's avatar
Adin Schmahmann committed
482
	if dht.host.Network().Connectedness(p) == network.Connected {
483 484 485
		return nil
	}

Matt Joiner's avatar
Matt Joiner committed
486
	logger.Debug("not connected. dialing.")
Adin Schmahmann's avatar
Adin Schmahmann committed
487
	routing.PublishQueryEvent(ctx, &routing.QueryEvent{
488
		Type: routing.DialingPeer,
489 490 491
		ID:   p,
	})

492
	pi := peer.AddrInfo{ID: p}
Adin Schmahmann's avatar
Adin Schmahmann committed
493
	if err := dht.host.Connect(ctx, pi); err != nil {
Matt Joiner's avatar
Matt Joiner committed
494
		logger.Debugf("error connecting: %s", err)
Adin Schmahmann's avatar
Adin Schmahmann committed
495
		routing.PublishQueryEvent(ctx, &routing.QueryEvent{
496
			Type:  routing.QueryError,
497 498 499 500 501 502
			Extra: err.Error(),
			ID:    p,
		})

		return err
	}
Matt Joiner's avatar
Matt Joiner committed
503
	logger.Debugf("connected. dial success.")
504 505
	return nil
}