lbry.go/dht/node_finder.go

373 lines
8.8 KiB
Go
Raw Normal View History

package dht
import (
2018-04-28 02:16:12 +02:00
"sort"
"sync"
2018-04-05 17:35:57 +02:00
"time"
"github.com/lbryio/internal-apis/app/crypto"
"github.com/lbryio/lbry.go/errors"
"github.com/lbryio/lbry.go/stopOnce"
2018-06-14 17:48:02 +02:00
"github.com/lbryio/reflector.go/dht/bits"
"github.com/sirupsen/logrus"
"github.com/uber-go/atomic"
)
// TODO: iterativeFindValue may be stopping early. if it gets a response with one peer, it should keep going because other nodes may know about more peers that have that blob
// TODO: or, it should try a tcp handshake with peers as it finds them, to make sure they are still online and have the blob
var cfLog *logrus.Logger
func init() {
cfLog = logrus.StandardLogger()
}
func NodeFinderUserLogger(l *logrus.Logger) {
cfLog = l
}
2018-04-28 02:16:12 +02:00
type contactFinder struct {
findValue bool // true if we're using findValue
2018-06-14 17:48:02 +02:00
target bits.Bitmap
2018-04-28 02:16:12 +02:00
node *Node
2018-05-24 19:05:05 +02:00
stop *stopOnce.Stopper
findValueMutex *sync.Mutex
2018-04-28 02:16:12 +02:00
findValueResult []Contact
2018-04-28 02:16:12 +02:00
activeContactsMutex *sync.Mutex
activeContacts []Contact
2018-04-05 17:35:57 +02:00
shortlistMutex *sync.Mutex
2018-04-28 02:16:12 +02:00
shortlist []Contact
2018-06-14 17:48:02 +02:00
shortlistAdded map[bits.Bitmap]bool
closestContactMutex *sync.RWMutex
closestContact *Contact
notGettingCloser *atomic.Bool
}
2018-06-14 17:48:02 +02:00
func FindContacts(node *Node, target bits.Bitmap, findValue bool, upstreamStop stopOnce.Chan) ([]Contact, bool, error) {
2018-06-13 18:45:47 +02:00
cf := &contactFinder{
2018-04-28 02:16:12 +02:00
node: node,
target: target,
findValue: findValue,
findValueMutex: &sync.Mutex{},
activeContactsMutex: &sync.Mutex{},
shortlistMutex: &sync.Mutex{},
2018-06-14 17:48:02 +02:00
shortlistAdded: make(map[bits.Bitmap]bool),
2018-05-24 19:05:05 +02:00
stop: stopOnce.New(),
closestContactMutex: &sync.RWMutex{},
notGettingCloser: atomic.NewBool(false),
}
2018-06-13 18:45:47 +02:00
if upstreamStop != nil {
go func() {
select {
case <-upstreamStop:
cf.Stop()
case <-cf.stop.Ch():
}
}()
2018-06-13 18:45:47 +02:00
}
2018-06-13 18:45:47 +02:00
return cf.Find()
}
2018-06-13 18:45:47 +02:00
func (cf *contactFinder) Stop() {
2018-05-24 19:05:05 +02:00
cf.stop.Stop()
cf.stop.Wait()
2018-05-13 22:02:46 +02:00
}
2018-06-13 18:45:47 +02:00
func (cf *contactFinder) Find() ([]Contact, bool, error) {
2018-04-28 02:16:12 +02:00
if cf.findValue {
2018-06-22 15:30:16 +02:00
cf.debug("starting iterativeFindValue")
} else {
2018-06-22 15:30:16 +02:00
cf.debug("starting iterativeFindNode")
}
2018-04-28 02:16:12 +02:00
cf.appendNewToShortlist(cf.node.rt.GetClosest(cf.target, alpha))
if len(cf.shortlist) == 0 {
return nil, false, errors.Err("[%s] find %s: no contacts in routing table", cf.node.id.HexShort(), cf.target.HexShort())
}
go cf.cycle(false)
timeout := 5 * time.Second
CycleLoop:
for {
select {
case <-time.After(timeout):
go cf.cycle(false)
case <-cf.stop.Ch():
break CycleLoop
}
}
// TODO: what to do if we have less than K active contacts, shortlist is empty, but we have other contacts in our routing table whom we have not contacted. prolly contact them
2018-06-13 18:45:47 +02:00
var contacts []Contact
var found bool
2018-04-28 02:16:12 +02:00
if cf.findValue && len(cf.findValueResult) > 0 {
2018-06-13 18:45:47 +02:00
contacts = cf.findValueResult
found = true
} else {
2018-06-13 18:45:47 +02:00
contacts = cf.activeContacts
if len(contacts) > bucketSize {
contacts = contacts[:bucketSize]
}
}
2018-06-13 18:45:47 +02:00
cf.Stop()
return contacts, found, nil
}
// cycle does a single cycle of sending alpha probes and checking results against closestNode
func (cf *contactFinder) cycle(bigCycle bool) {
cycleID := crypto.RandString(6)
if bigCycle {
cf.debug("LAUNCHING CYCLE %s, AND ITS A BIG CYCLE", cycleID)
} else {
cf.debug("LAUNCHING CYCLE %s", cycleID)
}
defer cf.debug("CYCLE %s DONE", cycleID)
cf.closestContactMutex.RLock()
closestContact := cf.closestContact
cf.closestContactMutex.RUnlock()
2018-04-05 17:35:57 +02:00
var wg sync.WaitGroup
ch := make(chan *Contact)
2018-04-05 17:35:57 +02:00
limit := alpha
if bigCycle {
limit = bucketSize
}
for i := 0; i < limit; i++ {
wg.Add(1)
go func() {
defer wg.Done()
ch <- cf.probe(cycleID)
}()
}
2018-04-05 17:35:57 +02:00
go func() {
wg.Wait()
close(ch)
}()
2018-04-05 17:35:57 +02:00
foundCloser := false
for {
c, more := <-ch
if !more {
break
}
if c != nil && (closestContact == nil || cf.target.Closer(c.ID, closestContact.ID)) {
if closestContact != nil {
cf.debug("|%s| best contact improved: %s -> %s", cycleID, closestContact.ID.HexShort(), c.ID.HexShort())
2018-04-05 17:35:57 +02:00
} else {
cf.debug("|%s| best contact starting at %s", cycleID, c.ID.HexShort())
2018-04-05 17:35:57 +02:00
}
foundCloser = true
closestContact = c
}
}
if cf.isSearchFinished() {
cf.stop.Stop()
return
}
if foundCloser {
cf.closestContactMutex.Lock()
// have to check again after locking in case other probes found a closer one in the meantime
if cf.closestContact == nil || cf.target.Closer(closestContact.ID, cf.closestContact.ID) {
cf.closestContact = closestContact
}
cf.closestContactMutex.Unlock()
go cf.cycle(false)
} else if !bigCycle {
cf.debug("|%s| no improvement, running big cycle", cycleID)
go cf.cycle(true)
} else {
// big cycle ran and there was no improvement, so we're done
cf.debug("|%s| big cycle ran, still no improvement", cycleID)
cf.notGettingCloser.Store(true)
}
}
// probe sends a single probe, updates the lists, and returns the closest contact it found
func (cf *contactFinder) probe(cycleID string) *Contact {
maybeContact := cf.popFromShortlist()
if maybeContact == nil {
cf.debug("|%s| no contacts in shortlist, returning", cycleID)
return nil
}
c := *maybeContact
if c.ID.Equals(cf.node.id) {
return nil
}
cf.debug("|%s| probe %s: launching", cycleID, c.ID.HexShort())
req := Request{Arg: &cf.target}
if cf.findValue {
req.Method = findValueMethod
} else {
req.Method = findNodeMethod
}
var res *Response
2018-06-25 21:56:45 +02:00
resCh := cf.node.SendAsync(c, req)
select {
case res = <-resCh:
case <-cf.stop.Ch():
cf.debug("|%s| probe %s: canceled", cycleID, c.ID.HexShort())
return nil
}
if res == nil {
cf.debug("|%s| probe %s: req canceled or timed out", cycleID, c.ID.HexShort())
return nil
}
if cf.findValue && res.FindValueKey != "" {
cf.debug("|%s| probe %s: got value", cycleID, c.ID.HexShort())
cf.findValueMutex.Lock()
cf.findValueResult = res.Contacts
cf.findValueMutex.Unlock()
cf.stop.Stop()
return nil
}
cf.debug("|%s| probe %s: got %s", cycleID, c.ID.HexShort(), res.argsDebug())
cf.insertIntoActiveList(c)
cf.appendNewToShortlist(res.Contacts)
cf.activeContactsMutex.Lock()
contacts := cf.activeContacts
if len(contacts) > bucketSize {
contacts = contacts[:bucketSize]
}
contactsStr := ""
for _, c := range contacts {
contactsStr += c.ID.HexShort() + ", "
}
cf.activeContactsMutex.Unlock()
return cf.closest(res.Contacts...)
}
func (cf *contactFinder) probeClosestOutstanding() {
}
// appendNewToShortlist appends any new contacts to the shortlist and sorts it by distance
// contacts that have already been added to the shortlist in the past are ignored
2018-04-28 02:16:12 +02:00
func (cf *contactFinder) appendNewToShortlist(contacts []Contact) {
cf.shortlistMutex.Lock()
defer cf.shortlistMutex.Unlock()
2018-04-28 02:16:12 +02:00
for _, c := range contacts {
if _, ok := cf.shortlistAdded[c.ID]; !ok {
2018-04-28 02:16:12 +02:00
cf.shortlist = append(cf.shortlist, c)
cf.shortlistAdded[c.ID] = true
}
}
2018-04-28 02:16:12 +02:00
sortInPlace(cf.shortlist, cf.target)
}
// popFromShortlist pops the first contact off the shortlist and returns it
2018-04-28 02:16:12 +02:00
func (cf *contactFinder) popFromShortlist() *Contact {
cf.shortlistMutex.Lock()
defer cf.shortlistMutex.Unlock()
2018-04-28 02:16:12 +02:00
if len(cf.shortlist) == 0 {
return nil
}
2018-04-28 02:16:12 +02:00
first := cf.shortlist[0]
cf.shortlist = cf.shortlist[1:]
return &first
}
// insertIntoActiveList inserts the contact into appropriate place in the list of active contacts (sorted by distance)
2018-04-28 02:16:12 +02:00
func (cf *contactFinder) insertIntoActiveList(contact Contact) {
cf.activeContactsMutex.Lock()
defer cf.activeContactsMutex.Unlock()
inserted := false
2018-04-28 02:16:12 +02:00
for i, n := range cf.activeContacts {
if cf.target.Closer(contact.ID, n.ID) {
2018-04-28 02:16:12 +02:00
cf.activeContacts = append(cf.activeContacts[:i], append([]Contact{contact}, cf.activeContacts[i:]...)...)
inserted = true
2018-04-05 17:35:57 +02:00
break
}
}
if !inserted {
2018-04-28 02:16:12 +02:00
cf.activeContacts = append(cf.activeContacts, contact)
}
}
// isSearchFinished returns true if the search is done and should be stopped
2018-04-28 02:16:12 +02:00
func (cf *contactFinder) isSearchFinished() bool {
if cf.findValue && len(cf.findValueResult) > 0 {
return true
}
select {
2018-05-24 19:05:05 +02:00
case <-cf.stop.Ch():
return true
default:
}
if cf.notGettingCloser.Load() {
return true
}
cf.activeContactsMutex.Lock()
defer cf.activeContactsMutex.Unlock()
if len(cf.activeContacts) >= bucketSize {
return true
}
return false
}
func (cf *contactFinder) debug(format string, args ...interface{}) {
args = append([]interface{}{cf.node.id.HexShort()}, append([]interface{}{cf.target.HexShort()}, args...)...)
cfLog.Debugf("[%s] find %s: "+format, args...)
2018-04-28 02:16:12 +02:00
}
func (cf *contactFinder) closest(contacts ...Contact) *Contact {
if len(contacts) == 0 {
return nil
}
closest := contacts[0]
for _, c := range contacts {
if cf.target.Closer(c.ID, closest.ID) {
closest = c
}
}
return &closest
2018-06-22 15:30:16 +02:00
}
2018-06-14 17:48:02 +02:00
func sortInPlace(contacts []Contact, target bits.Bitmap) {
2018-04-28 02:16:12 +02:00
toSort := make([]sortedContact, len(contacts))
for i, n := range contacts {
toSort[i] = sortedContact{n, n.ID.Xor(target)}
2018-04-28 02:16:12 +02:00
}
sort.Sort(byXorDistance(toSort))
for i, c := range toSort {
contacts[i] = c.contact
}
}