query.go 13.5 KB
Newer Older
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
1 2 3
package dht

import (
Jeromy's avatar
Jeromy committed
4
	"context"
Steven Allen's avatar
Steven Allen committed
5
	"errors"
Adin Schmahmann's avatar
Adin Schmahmann committed
6
	"fmt"
7
	"sync"
Aarsh Shah's avatar
Aarsh Shah committed
8
	"time"
9 10

	"github.com/google/uuid"
Adin Schmahmann's avatar
Adin Schmahmann committed
11

12 13
	"github.com/libp2p/go-libp2p-core/network"
	"github.com/libp2p/go-libp2p-core/peer"
14
	pstore "github.com/libp2p/go-libp2p-core/peerstore"
Adin Schmahmann's avatar
Adin Schmahmann committed
15
	"github.com/libp2p/go-libp2p-core/routing"
16

Adin Schmahmann's avatar
Adin Schmahmann committed
17
	"github.com/libp2p/go-libp2p-kad-dht/qpeerset"
18
	kb "github.com/libp2p/go-libp2p-kbucket"
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
19 20
)

Steven Allen's avatar
Steven Allen committed
21 22 23
// ErrNoPeersQueried is the sentinel error reporting that no peer could be queried.
// NOTE(review): it is not referenced in the visible part of this file; confirm
// which callers return it before relying on the exact condition.
var ErrNoPeersQueried = errors.New("failed to query any peers")

Adin Schmahmann's avatar
Adin Schmahmann committed
24
// queryFn is the per-peer query callback. It is invoked with a context and the
// peer to query, and returns the peers that the queried peer reported. A
// non-nil error causes the lookup to mark the queried peer as unreachable.
type queryFn func(context.Context, peer.ID) ([]*peer.AddrInfo, error)
Adin Schmahmann's avatar
Adin Schmahmann committed
25
// stopFn is polled by the lookup to learn whether the caller wants it to stop;
// returning true requests termination.
type stopFn func() bool
26

Aarsh Shah's avatar
Aarsh Shah committed
27
// query represents a single DHT query.
Adin Schmahmann's avatar
Adin Schmahmann committed
28
type query struct {
29 30 31 32 33 34
	// unique identifier for the lookup instance
	id uuid.UUID

	// target key for the lookup
	key string

35 36
	// the query context.
	ctx context.Context
Adin Schmahmann's avatar
Adin Schmahmann committed
37

38
	// the cancellation function for the query context.
Adin Schmahmann's avatar
Adin Schmahmann committed
39
	cancel context.CancelFunc
40

Adin Schmahmann's avatar
Adin Schmahmann committed
41
	dht *IpfsDHT
Jeromy's avatar
Jeromy committed
42

Adin Schmahmann's avatar
Adin Schmahmann committed
43 44 45 46 47 48 49 50 51
	// seedPeers is the set of peers that seed the query
	seedPeers []peer.ID

	// queryPeers is the set of peers known by this query and their respective states.
	queryPeers *qpeerset.QueryPeerset

	// terminated is set when the first worker thread encounters the termination condition.
	// Its role is to make sure that once termination is determined, it is sticky.
	terminated bool
52

53 54 55
	// waitGroup ensures lookup does not end until all query goroutines complete.
	waitGroup sync.WaitGroup

56 57 58 59 60
	// the function that will be used to query a single peer.
	queryFn queryFn

	// stopFn is used to determine if we should stop the WHOLE disjoint query.
	stopFn stopFn
61 62
}

Adin Schmahmann's avatar
Adin Schmahmann committed
63
type lookupWithFollowupResult struct {
Aarsh Shah's avatar
Aarsh Shah committed
64 65
	peers []peer.ID            // the top K not unreachable peers at the end of the query
	state []qpeerset.PeerState // the peer states at the end of the query
Adin Schmahmann's avatar
Adin Schmahmann committed
66

Adin Schmahmann's avatar
Adin Schmahmann committed
67 68 69 70 71 72 73 74 75 76 77 78
	// indicates that neither the lookup nor the followup has been prematurely terminated by an external condition such
	// as context cancellation or the stop function being called.
	completed bool
}

// runLookupWithFollowup executes the lookup on the target using the given query function and stopping when either the
// context is cancelled or the stop function returns true. Note: if the stop function is not sticky, i.e. it does not
// return true every time after the first time it returns true, it is not guaranteed to cause a stop to occur just
// because it momentarily returns true.
//
// After the lookup is complete the query function is run (unless stopped) against all of the top K peers from the
// lookup that have not already been successfully queried.
Aarsh Shah's avatar
Aarsh Shah committed
79
func (dht *IpfsDHT) runLookupWithFollowup(ctx context.Context, target string, queryFn queryFn, stopFn stopFn) (*lookupWithFollowupResult, error) {
Adin Schmahmann's avatar
Adin Schmahmann committed
80
	// run the query
Aarsh Shah's avatar
Aarsh Shah committed
81
	lookupRes, err := dht.runQuery(ctx, target, queryFn, stopFn)
Adin Schmahmann's avatar
Adin Schmahmann committed
82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108
	if err != nil {
		return nil, err
	}

	// query all of the top K peers we've either Heard about or have outstanding queries we're Waiting on.
	// This ensures that all of the top K results have been queried which adds to resiliency against churn for query
	// functions that carry state (e.g. FindProviders and GetValue) as well as establish connections that are needed
	// by stateless query functions (e.g. GetClosestPeers and therefore Provide and PutValue)
	queryPeers := make([]peer.ID, 0, len(lookupRes.peers))
	for i, p := range lookupRes.peers {
		if state := lookupRes.state[i]; state == qpeerset.PeerHeard || state == qpeerset.PeerWaiting {
			queryPeers = append(queryPeers, p)
		}
	}

	if len(queryPeers) == 0 {
		return lookupRes, nil
	}

	// return if the lookup has been externally stopped
	if ctx.Err() != nil || stopFn() {
		lookupRes.completed = false
		return lookupRes, nil
	}

	doneCh := make(chan struct{}, len(queryPeers))
	followUpCtx, cancelFollowUp := context.WithCancel(ctx)
109
	defer cancelFollowUp()
Adin Schmahmann's avatar
Adin Schmahmann committed
110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138
	for _, p := range queryPeers {
		qp := p
		go func() {
			_, _ = queryFn(followUpCtx, qp)
			doneCh <- struct{}{}
		}()
	}

	// wait for all queries to complete before returning, aborting ongoing queries if we've been externally stopped
processFollowUp:
	for i := 0; i < len(queryPeers); i++ {
		select {
		case <-doneCh:
			if stopFn() {
				cancelFollowUp()
				if i < len(queryPeers)-1 {
					lookupRes.completed = false
				}
				break processFollowUp
			}
		case <-ctx.Done():
			lookupRes.completed = false
			break processFollowUp
		}
	}

	return lookupRes, nil
}

Aarsh Shah's avatar
Aarsh Shah committed
139
func (dht *IpfsDHT) runQuery(ctx context.Context, target string, queryFn queryFn, stopFn stopFn) (*lookupWithFollowupResult, error) {
140
	// pick the K closest peers to the key in our Routing table and shuffle them.
Adin Schmahmann's avatar
Adin Schmahmann committed
141 142
	targetKadID := kb.ConvertKey(target)
	seedPeers := dht.routingTable.NearestPeers(targetKadID, dht.bucketSize)
143 144 145 146 147 148 149
	if len(seedPeers) == 0 {
		routing.PublishQueryEvent(ctx, &routing.QueryEvent{
			Type:  routing.QueryError,
			Extra: kb.ErrLookupFailure.Error(),
		})
		return nil, kb.ErrLookupFailure
	}
Adin Schmahmann's avatar
Adin Schmahmann committed
150

Aarsh Shah's avatar
Aarsh Shah committed
151
	q := &query{
152 153
		id:         uuid.New(),
		key:        target,
154
		ctx:        ctx,
Aarsh Shah's avatar
Aarsh Shah committed
155 156 157 158 159 160
		dht:        dht,
		queryPeers: qpeerset.NewQueryPeerset(target),
		seedPeers:  seedPeers,
		terminated: false,
		queryFn:    queryFn,
		stopFn:     stopFn,
161 162
	}

Aarsh Shah's avatar
Aarsh Shah committed
163
	// run the query
164 165 166 167 168
	q.run()

	if ctx.Err() == nil {
		q.recordValuablePeers()
	}
169

Aarsh Shah's avatar
Aarsh Shah committed
170
	res := q.constructLookupResult(targetKadID)
Adin Schmahmann's avatar
Adin Schmahmann committed
171
	return res, nil
172 173
}

Aarsh Shah's avatar
Aarsh Shah committed
174 175 176
// recordPeerIsValuable stamps p in the routing table with the current time as
// its last successful outbound query.
func (q *query) recordPeerIsValuable(p peer.ID) {
	q.dht.routingTable.UpdateLastSuccessfulOutboundQuery(
		p,
		time.Now(),
	)
}
177 178 179 180 181 182

func (q *query) recordValuablePeers() {
	closePeers := q.queryPeers.GetClosestNotUnreachable(q.dht.beta)
	for _, p := range closePeers {
		referrer := p
		for {
Aarsh Shah's avatar
Aarsh Shah committed
183
			q.recordPeerIsValuable(referrer)
184 185 186 187 188 189 190 191
			referrer = q.queryPeers.GetReferrer(referrer)
			if referrer == q.dht.self {
				break
			}
		}
	}
}

Adin Schmahmann's avatar
Adin Schmahmann committed
192
// constructLookupResult takes the query information and uses it to construct the lookup result
Aarsh Shah's avatar
Aarsh Shah committed
193 194
func (q *query) constructLookupResult(target kb.ID) *lookupWithFollowupResult {
	// determine if the query terminated early
Adin Schmahmann's avatar
Adin Schmahmann committed
195
	completed := true
Aarsh Shah's avatar
Aarsh Shah committed
196

197 198 199 200
	// Lookup and starvation are both valid ways for a lookup to complete. (Starvation does not imply failure.)
	// Lookup termination (as defined in isLookupTermination) is not possible in small networks.
	// Starvation is a successful query termination in small networks.
	if !(q.isLookupTermination() || q.isStarvationTermination()) {
Aarsh Shah's avatar
Aarsh Shah committed
201
		completed = false
Adin Schmahmann's avatar
Adin Schmahmann committed
202
	}
203

Aarsh Shah's avatar
Aarsh Shah committed
204
	// extract the top K not unreachable peers
Adin Schmahmann's avatar
Adin Schmahmann committed
205 206
	var peers []peer.ID
	peerState := make(map[peer.ID]qpeerset.PeerState)
Aarsh Shah's avatar
Aarsh Shah committed
207 208 209 210 211
	qp := q.queryPeers.GetClosestNotUnreachable(q.dht.bucketSize)
	for _, p := range qp {
		state := q.queryPeers.GetState(p)
		peerState[p] = state
		peers = append(peers, p)
212 213
	}

Adin Schmahmann's avatar
Adin Schmahmann committed
214 215
	// get the top K overall peers
	sortedPeers := kb.SortClosestPeers(peers, target)
Aarsh Shah's avatar
Aarsh Shah committed
216 217
	if len(sortedPeers) > q.dht.bucketSize {
		sortedPeers = sortedPeers[:q.dht.bucketSize]
218 219
	}

Aarsh Shah's avatar
Aarsh Shah committed
220
	// return the top K not unreachable peers as well as their states at the end of the query
Adin Schmahmann's avatar
Adin Schmahmann committed
221 222 223 224 225 226 227 228 229
	res := &lookupWithFollowupResult{
		peers:     sortedPeers,
		state:     make([]qpeerset.PeerState, len(sortedPeers)),
		completed: completed,
	}

	for i, p := range sortedPeers {
		res.state[i] = peerState[p]
	}
230 231

	return res
Adin Schmahmann's avatar
Adin Schmahmann committed
232
}
233

Adin Schmahmann's avatar
Adin Schmahmann committed
234
type queryUpdate struct {
235 236
	cause       peer.ID
	heard       []peer.ID
Adin Schmahmann's avatar
Adin Schmahmann committed
237 238 239
	queried     []peer.ID
	unreachable []peer.ID
}
240

241
func (q *query) run() {
Adin Schmahmann's avatar
Adin Schmahmann committed
242 243
	pathCtx, cancelPath := context.WithCancel(q.ctx)
	defer cancelPath()
244

Adin Schmahmann's avatar
Adin Schmahmann committed
245
	alpha := q.dht.alpha
246

Adin Schmahmann's avatar
Adin Schmahmann committed
247
	ch := make(chan *queryUpdate, alpha)
248
	ch <- &queryUpdate{cause: q.dht.self, heard: q.seedPeers}
249

250 251
	// return only once all outstanding queries have completed.
	defer q.waitGroup.Wait()
Adin Schmahmann's avatar
Adin Schmahmann committed
252
	for {
253
		var cause peer.ID
Adin Schmahmann's avatar
Adin Schmahmann committed
254 255
		select {
		case update := <-ch:
256 257
			q.updateState(pathCtx, update)
			cause = update.cause
Adin Schmahmann's avatar
Adin Schmahmann committed
258
		case <-pathCtx.Done():
259
			q.terminate(pathCtx, cancelPath, LookupCancelled)
Adin Schmahmann's avatar
Adin Schmahmann committed
260 261
		}

Adin Schmahmann's avatar
Adin Schmahmann committed
262
		// termination is triggered on end-of-lookup conditions or starvation of unused peers
263 264 265
		if ready, reason := q.isReadyToTerminate(); ready {
			q.terminate(pathCtx, cancelPath, reason)
		}
Adin Schmahmann's avatar
Adin Schmahmann committed
266

267 268
		if q.terminated {
			return
Adin Schmahmann's avatar
Adin Schmahmann committed
269 270 271 272 273 274 275 276
		}

		// if all "threads" are busy, wait until someone finishes
		if q.queryPeers.NumWaiting() >= alpha {
			continue
		}

		// spawn new queries, up to the parallelism allowance
277 278 279 280 281
		// calculate the maximum number of queries we could be spawning.
		// Note: NumWaiting will be updated in spawnQuery
		maxNumQueriesToSpawn := alpha - q.queryPeers.NumWaiting()
		// try spawning the queries, if there are no available peers to query then we won't spawn them
		for j := 0; j < maxNumQueriesToSpawn; j++ {
282
			q.spawnQuery(pathCtx, cause, ch)
Adin Schmahmann's avatar
Adin Schmahmann committed
283 284 285 286
		}
	}
}

287 288
// spawnQuery starts one query, if an available heard peer is found
func (q *query) spawnQuery(ctx context.Context, cause peer.ID, ch chan<- *queryUpdate) {
Adin Schmahmann's avatar
Adin Schmahmann committed
289 290 291
	if peers := q.queryPeers.GetSortedHeard(); len(peers) == 0 {
		return
	} else {
292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308
		PublishLookupEvent(ctx,
			NewLookupEvent(
				q.dht.self,
				q.id,
				q.key,
				NewLookupUpdateEvent(
					cause,
					q.queryPeers.GetReferrer(peers[0]),
					nil,                 // heard
					[]peer.ID{peers[0]}, // waiting
					nil,                 // queried
					nil,                 // unreachable
				),
				nil,
				nil,
			),
		)
Adin Schmahmann's avatar
Adin Schmahmann committed
309
		q.queryPeers.SetState(peers[0], qpeerset.PeerWaiting)
310 311
		q.waitGroup.Add(1)
		go q.queryPeer(ctx, ch, peers[0])
Adin Schmahmann's avatar
Adin Schmahmann committed
312 313 314
	}
}

315
func (q *query) isReadyToTerminate() (bool, LookupTerminationReason) {
Adin Schmahmann's avatar
Adin Schmahmann committed
316 317
	// give the application logic a chance to terminate
	if q.stopFn() {
318
		return true, LookupStopped
Adin Schmahmann's avatar
Adin Schmahmann committed
319 320
	}
	if q.isStarvationTermination() {
321
		return true, LookupStarvation
Adin Schmahmann's avatar
Adin Schmahmann committed
322 323
	}
	if q.isLookupTermination() {
324
		return true, LookupCompleted
Adin Schmahmann's avatar
Adin Schmahmann committed
325
	}
326
	return false, -1
Adin Schmahmann's avatar
Adin Schmahmann committed
327 328 329 330 331 332 333 334 335 336
}

// From the set of all nodes that are not unreachable,
// if the closest beta nodes are all queried, the lookup can terminate.
func (q *query) isLookupTermination() bool {
	var peers []peer.ID
	peers = q.queryPeers.GetClosestNotUnreachable(q.dht.beta)
	for _, p := range peers {
		if q.queryPeers.GetState(p) != qpeerset.PeerQueried {
			return false
Adin Schmahmann's avatar
Adin Schmahmann committed
337
		}
338
	}
Adin Schmahmann's avatar
Adin Schmahmann committed
339 340 341 342 343
	return true
}

func (q *query) isStarvationTermination() bool {
	return q.queryPeers.NumHeard() == 0 && q.queryPeers.NumWaiting() == 0
344 345
}

346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362
func (q *query) terminate(ctx context.Context, cancel context.CancelFunc, reason LookupTerminationReason) {
	if q.terminated {
		return
	} else {
		PublishLookupEvent(ctx,
			NewLookupEvent(
				q.dht.self,
				q.id,
				q.key,
				nil,
				nil,
				NewLookupTerminateEvent(reason),
			),
		)
		cancel() // abort outstanding queries
		q.terminated = true
	}
363 364
}

Adin Schmahmann's avatar
Adin Schmahmann committed
365 366
// queryPeer queries a single peer and reports its findings on the channel.
// queryPeer does not access the query state in queryPeers!
367 368 369
func (q *query) queryPeer(ctx context.Context, ch chan<- *queryUpdate, p peer.ID) {
	defer q.waitGroup.Done()
	dialCtx, queryCtx := ctx, ctx
Adin Schmahmann's avatar
Adin Schmahmann committed
370

371
	// dial the peer
Adin Schmahmann's avatar
Adin Schmahmann committed
372
	if err := q.dht.dialPeer(dialCtx, p); err != nil {
Aarsh Shah's avatar
Aarsh Shah committed
373 374 375 376
		// remove the peer if there was a dial failure..but not because of a context cancellation
		if dialCtx.Err() == nil {
			q.dht.peerStoppedDHT(q.dht.ctx, p)
		}
377
		ch <- &queryUpdate{cause: p, unreachable: []peer.ID{p}}
Adin Schmahmann's avatar
Adin Schmahmann committed
378
		return
Adin Schmahmann's avatar
Adin Schmahmann committed
379
	}
380 381

	// send query RPC to the remote peer
Adin Schmahmann's avatar
Adin Schmahmann committed
382 383
	newPeers, err := q.queryFn(queryCtx, p)
	if err != nil {
Aarsh Shah's avatar
Aarsh Shah committed
384 385 386
		if queryCtx.Err() == nil {
			q.dht.peerStoppedDHT(q.dht.ctx, p)
		}
387
		ch <- &queryUpdate{cause: p, unreachable: []peer.ID{p}}
Adin Schmahmann's avatar
Adin Schmahmann committed
388
		return
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
389
	}
390

Aarsh Shah's avatar
Aarsh Shah committed
391 392 393
	// query successful, try to add to RT
	q.dht.peerFound(q.dht.ctx, p, true)

Adin Schmahmann's avatar
Adin Schmahmann committed
394 395
	// process new peers
	saw := []peer.ID{}
Adin Schmahmann's avatar
Adin Schmahmann committed
396 397 398 399 400
	for _, next := range newPeers {
		if next.ID == q.dht.self { // don't add self.
			logger.Debugf("PEERS CLOSER -- worker for: %v found self", p)
			continue
		}
401

402 403 404 405
		// add any other know addresses for the candidate peer.
		curInfo := q.dht.peerstore.PeerInfo(next.ID)
		next.Addrs = append(next.Addrs, curInfo.Addrs...)

Adin Schmahmann's avatar
Adin Schmahmann committed
406
		// add their addresses to the dialer's peerstore
407 408 409 410
		if q.dht.queryPeerFilter(q.dht, *next) {
			q.dht.peerstore.AddAddrs(next.ID, next.Addrs, pstore.TempAddrTTL)
			saw = append(saw, next.ID)
		}
411
	}
Adin Schmahmann's avatar
Adin Schmahmann committed
412

413
	ch <- &queryUpdate{cause: p, heard: saw, queried: []peer.ID{p}}
Adin Schmahmann's avatar
Adin Schmahmann committed
414
}
415

416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437
func (q *query) updateState(ctx context.Context, up *queryUpdate) {
	if q.terminated {
		panic("update should not be invoked after the logical lookup termination")
	}
	PublishLookupEvent(ctx,
		NewLookupEvent(
			q.dht.self,
			q.id,
			q.key,
			nil,
			NewLookupUpdateEvent(
				up.cause,
				up.cause,
				up.heard,       // heard
				nil,            // waiting
				up.queried,     // queried
				up.unreachable, // unreachable
			),
			nil,
		),
	)
	for _, p := range up.heard {
Adin Schmahmann's avatar
Adin Schmahmann committed
438 439 440
		if p == q.dht.self { // don't add self.
			continue
		}
441
		q.queryPeers.TryAdd(p, up.cause)
Adin Schmahmann's avatar
Adin Schmahmann committed
442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461
	}
	for _, p := range up.queried {
		if p == q.dht.self { // don't add self.
			continue
		}
		if st := q.queryPeers.GetState(p); st == qpeerset.PeerWaiting {
			q.queryPeers.SetState(p, qpeerset.PeerQueried)
		} else {
			panic(fmt.Errorf("kademlia protocol error: tried to transition to the queried state from state %v", st))
		}
	}
	for _, p := range up.unreachable {
		if p == q.dht.self { // don't add self.
			continue
		}
		if st := q.queryPeers.GetState(p); st == qpeerset.PeerWaiting {
			q.queryPeers.SetState(p, qpeerset.PeerUnreachable)
		} else {
			panic(fmt.Errorf("kademlia protocol error: tried to transition to the unreachable state from state %v", st))
		}
462
	}
463
}
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
464

Adin Schmahmann's avatar
Adin Schmahmann committed
465
func (dht *IpfsDHT) dialPeer(ctx context.Context, p peer.ID) error {
466
	// short-circuit if we're already connected.
Adin Schmahmann's avatar
Adin Schmahmann committed
467
	if dht.host.Network().Connectedness(p) == network.Connected {
468 469 470
		return nil
	}

Matt Joiner's avatar
Matt Joiner committed
471
	logger.Debug("not connected. dialing.")
Adin Schmahmann's avatar
Adin Schmahmann committed
472
	routing.PublishQueryEvent(ctx, &routing.QueryEvent{
473
		Type: routing.DialingPeer,
474 475 476
		ID:   p,
	})

477
	pi := peer.AddrInfo{ID: p}
Adin Schmahmann's avatar
Adin Schmahmann committed
478
	if err := dht.host.Connect(ctx, pi); err != nil {
Matt Joiner's avatar
Matt Joiner committed
479
		logger.Debugf("error connecting: %s", err)
Adin Schmahmann's avatar
Adin Schmahmann committed
480
		routing.PublishQueryEvent(ctx, &routing.QueryEvent{
481
			Type:  routing.QueryError,
482 483 484 485 486 487
			Extra: err.Error(),
			ID:    p,
		})

		return err
	}
Matt Joiner's avatar
Matt Joiner committed
488
	logger.Debugf("connected. dial success.")
489 490
	return nil
}