2016-12-13 20:53:24 -06:00
|
|
|
import binascii
|
|
|
|
import hashlib
|
2018-02-21 14:53:12 -05:00
|
|
|
import logging
|
2018-07-20 16:45:58 -03:00
|
|
|
from functools import reduce
|
|
|
|
|
2018-02-20 13:30:56 -05:00
|
|
|
from twisted.internet import defer, error, task
|
2016-12-13 20:53:24 -06:00
|
|
|
|
2018-11-07 15:15:05 -05:00
|
|
|
from lbrynet.utils import generate_id, DeferredDict
|
2018-11-09 14:02:03 -05:00
|
|
|
from lbrynet.dht.call_later_manager import CallLaterManager
|
|
|
|
from lbrynet.dht.error import TimeoutError
|
|
|
|
from lbrynet.dht import constants, routingtable, datastore, protocol
|
|
|
|
from lbrynet.dht.contact import ContactManager
|
|
|
|
from lbrynet.dht.iterativefind import iterativeFind
|
2015-08-20 11:27:15 -04:00
|
|
|
|
2015-09-08 15:42:56 -04:00
|
|
|
log = logging.getLogger(__name__)
|
|
|
|
|
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
def rpcmethod(func):
|
|
|
|
""" Decorator to expose Node methods as remote procedure calls
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
Apply this decorator to methods in the Node class (or a subclass) in order
|
|
|
|
to make them remotely callable via the DHT's RPC mechanism.
|
|
|
|
"""
|
|
|
|
func.rpcmethod = True
|
|
|
|
return func
|
|
|
|
|
2016-12-13 18:11:04 -06:00
|
|
|
|
2018-07-21 18:34:59 -04:00
|
|
|
class MockKademliaHelper:
|
2018-05-23 17:02:25 -04:00
|
|
|
def __init__(self, clock=None, callLater=None, resolve=None, listenUDP=None):
|
|
|
|
if not listenUDP or not resolve or not callLater or not clock:
|
|
|
|
from twisted.internet import reactor
|
|
|
|
listenUDP = listenUDP or reactor.listenUDP
|
|
|
|
resolve = resolve or reactor.resolve
|
|
|
|
callLater = callLater or reactor.callLater
|
|
|
|
clock = clock or reactor
|
|
|
|
|
|
|
|
self.clock = clock
|
2018-05-23 17:32:55 -04:00
|
|
|
self.contact_manager = ContactManager(self.clock.seconds)
|
2018-05-23 17:02:25 -04:00
|
|
|
self.reactor_listenUDP = listenUDP
|
|
|
|
self.reactor_resolve = resolve
|
2018-05-23 20:41:01 -04:00
|
|
|
self.call_later_manager = CallLaterManager(callLater)
|
|
|
|
self.reactor_callLater = self.call_later_manager.call_later
|
|
|
|
self.reactor_callSoon = self.call_later_manager.call_soon
|
2018-05-23 17:02:25 -04:00
|
|
|
|
|
|
|
self._listeningPort = None # object implementing Twisted
|
|
|
|
# IListeningPort This will contain a deferred created when
|
|
|
|
# joining the network, to enable publishing/retrieving
|
|
|
|
# information from the DHT as soon as the node is part of the
|
|
|
|
# network (add callbacks to this deferred if scheduling such
|
|
|
|
# operations before the node has finished joining the network)
|
|
|
|
|
|
|
|
def get_looping_call(self, fn, *args, **kwargs):
|
|
|
|
lc = task.LoopingCall(fn, *args, **kwargs)
|
|
|
|
lc.clock = self.clock
|
|
|
|
return lc
|
|
|
|
|
|
|
|
def safe_stop_looping_call(self, lc):
|
|
|
|
if lc and lc.running:
|
|
|
|
return lc.stop()
|
|
|
|
return defer.succeed(None)
|
|
|
|
|
|
|
|
def safe_start_looping_call(self, lc, t):
|
|
|
|
if lc and not lc.running:
|
|
|
|
lc.start(t)
|
|
|
|
|
|
|
|
|
|
|
|
class Node(MockKademliaHelper):
|
2015-08-20 11:27:15 -04:00
|
|
|
""" Local node in the Kademlia network
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
This class represents a single local node in a Kademlia network; in other
|
|
|
|
words, this class encapsulates an Entangled-using application's "presence"
|
|
|
|
in a Kademlia network.
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
In Entangled, all interactions with the Kademlia network by a client
|
2016-12-13 17:08:29 -06:00
|
|
|
application is performed via this class (or a subclass).
|
2015-08-20 11:27:15 -04:00
|
|
|
"""
|
2017-03-31 13:32:43 -04:00
|
|
|
|
2018-03-27 15:12:44 -04:00
|
|
|
def __init__(self, node_id=None, udpPort=4000, dataStore=None,
|
2017-10-10 13:15:25 -04:00
|
|
|
routingTableClass=None, networkProtocol=None,
|
2018-05-23 17:02:25 -04:00
|
|
|
externalIP=None, peerPort=3333, listenUDP=None,
|
2018-10-30 13:41:38 -04:00
|
|
|
callLater=None, resolve=None, clock=None,
|
|
|
|
interface='', externalUDPPort=None):
|
2015-08-20 11:27:15 -04:00
|
|
|
"""
|
|
|
|
@param dataStore: The data store to use. This must be class inheriting
|
|
|
|
from the C{DataStore} interface (or providing the
|
|
|
|
same API). How the data store manages its data
|
|
|
|
internally is up to the implementation of that data
|
|
|
|
store.
|
|
|
|
@type dataStore: entangled.kademlia.datastore.DataStore
|
|
|
|
@param routingTable: The routing table class to use. Since there exists
|
|
|
|
some ambiguity as to how the routing table should be
|
|
|
|
implemented in Kademlia, a different routing table
|
|
|
|
may be used, as long as the appropriate API is
|
|
|
|
exposed. This should be a class, not an object,
|
|
|
|
in order to allow the Node to pass an
|
|
|
|
auto-generated node ID to the routingtable object
|
2016-12-13 17:08:29 -06:00
|
|
|
upon instantiation (if necessary).
|
2015-08-20 11:27:15 -04:00
|
|
|
@type routingTable: entangled.kademlia.routingtable.RoutingTable
|
|
|
|
@param networkProtocol: The network protocol to use. This can be
|
|
|
|
overridden from the default to (for example)
|
|
|
|
change the format of the physical RPC messages
|
|
|
|
being transmitted.
|
|
|
|
@type networkProtocol: entangled.kademlia.protocol.KademliaProtocol
|
2017-10-27 14:12:52 -04:00
|
|
|
@param externalIP: the IP at which this node can be contacted
|
|
|
|
@param peerPort: the port at which this node announces it has a blob for
|
2015-08-20 11:27:15 -04:00
|
|
|
"""
|
2018-02-20 13:30:56 -05:00
|
|
|
|
2018-07-21 18:34:59 -04:00
|
|
|
super().__init__(clock, callLater, resolve, listenUDP)
|
2017-10-10 13:15:25 -04:00
|
|
|
self.node_id = node_id or self._generateID()
|
2015-08-20 11:27:15 -04:00
|
|
|
self.port = udpPort
|
2018-07-17 17:13:33 -04:00
|
|
|
self._listen_interface = interface
|
2018-05-23 17:02:25 -04:00
|
|
|
self._change_token_lc = self.get_looping_call(self.change_token)
|
|
|
|
self._refresh_node_lc = self.get_looping_call(self._refreshNode)
|
2018-05-29 11:05:33 -04:00
|
|
|
self._refresh_contacts_lc = self.get_looping_call(self._refreshContacts)
|
2018-03-27 15:12:44 -04:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
# Create k-buckets (for storing contacts)
|
2017-04-25 14:21:13 -04:00
|
|
|
if routingTableClass is None:
|
2018-05-23 16:57:27 -04:00
|
|
|
self._routingTable = routingtable.TreeRoutingTable(self.node_id, self.clock.seconds)
|
2015-08-20 11:27:15 -04:00
|
|
|
else:
|
2018-02-20 13:30:56 -05:00
|
|
|
self._routingTable = routingTableClass(self.node_id, self.clock.seconds)
|
2015-08-20 11:27:15 -04:00
|
|
|
|
2018-10-30 13:41:38 -04:00
|
|
|
self._protocol = networkProtocol or protocol.KademliaProtocol(self)
|
2015-08-20 11:27:15 -04:00
|
|
|
self.token_secret = self._generateID()
|
|
|
|
self.old_token_secret = None
|
|
|
|
self.externalIP = externalIP
|
2017-10-27 14:12:52 -04:00
|
|
|
self.peerPort = peerPort
|
2018-08-05 13:12:39 -04:00
|
|
|
self.externalUDPPort = externalUDPPort or self.port
|
2018-05-24 10:23:22 -04:00
|
|
|
self._dataStore = dataStore or datastore.DictDataStore(self.clock.seconds)
|
2018-05-23 17:02:25 -04:00
|
|
|
self._join_deferred = None
|
2018-02-15 17:30:14 -05:00
|
|
|
|
2018-07-17 23:00:34 -03:00
|
|
|
#def __del__(self):
|
|
|
|
# log.warning("unclean shutdown of the dht node")
|
|
|
|
# if hasattr(self, "_listeningPort") and self._listeningPort is not None:
|
|
|
|
# self._listeningPort.stopListening()
|
2015-08-20 11:27:15 -04:00
|
|
|
|
2018-07-24 18:51:41 -03:00
|
|
|
def __str__(self):
|
|
|
|
return '<%s.%s object; ID: %s, IP address: %s, UDP port: %d>' % (
|
|
|
|
self.__module__, self.__class__.__name__, binascii.hexlify(self.node_id), self.externalIP, self.port)
|
|
|
|
|
2018-02-20 13:30:56 -05:00
|
|
|
@defer.inlineCallbacks
|
2015-08-20 11:27:15 -04:00
|
|
|
def stop(self):
|
2017-10-23 13:13:06 -04:00
|
|
|
# stop LoopingCalls:
|
2018-05-23 17:02:25 -04:00
|
|
|
yield self.safe_stop_looping_call(self._refresh_node_lc)
|
|
|
|
yield self.safe_stop_looping_call(self._change_token_lc)
|
2018-05-29 11:05:33 -04:00
|
|
|
yield self.safe_stop_looping_call(self._refresh_contacts_lc)
|
2015-08-20 11:27:15 -04:00
|
|
|
if self._listeningPort is not None:
|
2018-02-20 13:30:56 -05:00
|
|
|
yield self._listeningPort.stopListening()
|
2018-05-23 20:41:41 -04:00
|
|
|
self._listeningPort = None
|
2015-08-20 11:27:15 -04:00
|
|
|
|
2018-02-20 13:37:02 -05:00
|
|
|
def start_listening(self):
|
2018-03-05 13:15:07 -05:00
|
|
|
if not self._listeningPort:
|
|
|
|
try:
|
2018-07-17 17:38:19 -04:00
|
|
|
self._listeningPort = self.reactor_listenUDP(self.port, self._protocol,
|
|
|
|
interface=self._listen_interface)
|
2018-03-05 13:15:07 -05:00
|
|
|
except error.CannotListenError as e:
|
|
|
|
import traceback
|
|
|
|
log.error("Couldn't bind to port %d. %s", self.port, traceback.format_exc())
|
|
|
|
raise ValueError("%s lbrynet may already be running." % str(e))
|
|
|
|
else:
|
2018-05-23 18:01:30 -04:00
|
|
|
log.warning("Already bound to port %s", self._listeningPort)
|
2018-02-20 13:37:02 -05:00
|
|
|
|
2018-05-23 18:01:30 -04:00
|
|
|
@defer.inlineCallbacks
|
|
|
|
def joinNetwork(self, known_node_addresses=(('jack.lbry.tech', 4455), )):
|
2018-03-05 13:14:47 -05:00
|
|
|
"""
|
|
|
|
Attempt to join the dht, retry every 30 seconds if unsuccessful
|
|
|
|
:param known_node_addresses: [(str, int)] list of hostnames and ports for known dht seed nodes
|
|
|
|
"""
|
2018-05-23 18:01:30 -04:00
|
|
|
|
|
|
|
self._join_deferred = defer.Deferred()
|
|
|
|
known_node_resolution = {}
|
|
|
|
|
2018-02-20 13:37:02 -05:00
|
|
|
@defer.inlineCallbacks
|
|
|
|
def _resolve_seeds():
|
2018-05-23 18:01:30 -04:00
|
|
|
result = {}
|
|
|
|
for host, port in known_node_addresses:
|
|
|
|
node_address = yield self.reactor_resolve(host)
|
|
|
|
result[(host, port)] = node_address
|
|
|
|
defer.returnValue(result)
|
|
|
|
|
|
|
|
if not known_node_resolution:
|
|
|
|
known_node_resolution = yield _resolve_seeds()
|
|
|
|
# we are one of the seed nodes, don't add ourselves
|
2018-07-17 23:00:34 -03:00
|
|
|
if (self.externalIP, self.port) in known_node_resolution.values():
|
2018-05-23 18:01:30 -04:00
|
|
|
del known_node_resolution[(self.externalIP, self.port)]
|
|
|
|
known_node_addresses.remove((self.externalIP, self.port))
|
|
|
|
|
|
|
|
def _ping_contacts(contacts):
|
|
|
|
d = DeferredDict({contact: contact.ping() for contact in contacts}, consumeErrors=True)
|
|
|
|
d.addErrback(lambda err: err.trap(TimeoutError))
|
|
|
|
return d
|
|
|
|
|
|
|
|
@defer.inlineCallbacks
|
|
|
|
def _initialize_routing():
|
2018-02-20 13:37:02 -05:00
|
|
|
bootstrap_contacts = []
|
2018-05-23 18:01:30 -04:00
|
|
|
contact_addresses = {(c.address, c.port): c for c in self.contacts}
|
2018-07-17 23:00:34 -03:00
|
|
|
for (host, port), ip_address in known_node_resolution.items():
|
2018-05-23 18:01:30 -04:00
|
|
|
if (host, port) not in contact_addresses:
|
|
|
|
# Create temporary contact information for the list of addresses of known nodes
|
|
|
|
# The contact node id will be set with the responding node id when we initialize it to None
|
|
|
|
contact = self.contact_manager.make_contact(None, ip_address, port, self._protocol)
|
|
|
|
bootstrap_contacts.append(contact)
|
2018-02-20 13:37:02 -05:00
|
|
|
else:
|
2018-05-23 18:01:30 -04:00
|
|
|
for contact in self.contacts:
|
|
|
|
if contact.address == ip_address and contact.port == port:
|
|
|
|
if not contact.id:
|
|
|
|
bootstrap_contacts.append(contact)
|
|
|
|
break
|
|
|
|
if not bootstrap_contacts:
|
|
|
|
log.warning("no bootstrap contacts to ping")
|
|
|
|
ping_result = yield _ping_contacts(bootstrap_contacts)
|
2018-10-01 15:23:50 -03:00
|
|
|
shortlist = list(ping_result.keys())
|
2018-05-23 18:01:30 -04:00
|
|
|
if not shortlist:
|
|
|
|
log.warning("failed to ping %i bootstrap contacts", len(bootstrap_contacts))
|
|
|
|
defer.returnValue(None)
|
|
|
|
else:
|
|
|
|
# find the closest peers to us
|
2018-06-06 17:22:36 -04:00
|
|
|
closest = yield self._iterativeFind(self.node_id, shortlist if not self.contacts else None)
|
2018-05-23 18:01:30 -04:00
|
|
|
yield _ping_contacts(closest)
|
2018-11-13 09:32:56 -05:00
|
|
|
# query random hashes in our bucket key ranges to fill or split them
|
|
|
|
random_ids_in_range = self._routingTable.getRefreshList()
|
|
|
|
while random_ids_in_range:
|
|
|
|
yield self.iterativeFindNode(random_ids_in_range.pop())
|
2018-05-23 18:01:30 -04:00
|
|
|
defer.returnValue(None)
|
|
|
|
|
|
|
|
@defer.inlineCallbacks
|
|
|
|
def _iterative_join(joined_d=None, last_buckets_with_contacts=None):
|
|
|
|
log.info("Attempting to join the DHT network, %i contacts known so far", len(self.contacts))
|
|
|
|
joined_d = joined_d or defer.Deferred()
|
|
|
|
yield _initialize_routing()
|
|
|
|
buckets_with_contacts = self.bucketsWithContacts()
|
|
|
|
if last_buckets_with_contacts and last_buckets_with_contacts == buckets_with_contacts:
|
|
|
|
if not joined_d.called:
|
|
|
|
joined_d.callback(True)
|
|
|
|
elif buckets_with_contacts < 4:
|
2018-06-07 12:16:27 -04:00
|
|
|
self.reactor_callLater(0, _iterative_join, joined_d, buckets_with_contacts)
|
2018-05-23 18:01:30 -04:00
|
|
|
elif not joined_d.called:
|
|
|
|
joined_d.callback(None)
|
|
|
|
yield joined_d
|
|
|
|
if not self._join_deferred.called:
|
|
|
|
self._join_deferred.callback(True)
|
|
|
|
defer.returnValue(None)
|
|
|
|
|
|
|
|
yield _iterative_join()
|
2018-02-20 13:37:02 -05:00
|
|
|
|
2018-02-01 17:17:17 +08:00
|
|
|
@defer.inlineCallbacks
|
2018-11-07 18:35:00 -05:00
|
|
|
def start(self, known_node_addresses=None, block_on_join=False):
|
2018-02-01 17:17:17 +08:00
|
|
|
""" Causes the Node to attempt to join the DHT network by contacting the
|
|
|
|
known DHT nodes. This can be called multiple times if the previous attempt
|
|
|
|
has failed or if the Node has lost all the contacts.
|
|
|
|
|
2018-02-15 17:30:14 -05:00
|
|
|
@param known_node_addresses: A sequence of tuples containing IP address
|
2018-02-01 17:17:17 +08:00
|
|
|
information for existing nodes on the
|
|
|
|
Kademlia network, in the format:
|
|
|
|
C{(<ip address>, (udp port>)}
|
2018-02-15 17:30:14 -05:00
|
|
|
@type known_node_addresses: list
|
2018-02-01 17:17:17 +08:00
|
|
|
"""
|
|
|
|
|
2018-02-20 13:37:02 -05:00
|
|
|
self.start_listening()
|
2018-05-23 17:41:56 -04:00
|
|
|
yield self._protocol._listening
|
|
|
|
# TODO: Refresh all k-buckets further away than this node's closest neighbour
|
2018-11-07 18:35:00 -05:00
|
|
|
d = self.joinNetwork(known_node_addresses or [])
|
|
|
|
d.addCallback(lambda _: self.start_looping_calls())
|
|
|
|
d.addCallback(lambda _: log.info("Joined the dht"))
|
|
|
|
if block_on_join:
|
|
|
|
yield d
|
2018-05-23 18:01:30 -04:00
|
|
|
|
2018-07-23 16:13:56 -04:00
|
|
|
def start_looping_calls(self):
|
2018-05-23 17:02:25 -04:00
|
|
|
self.safe_start_looping_call(self._change_token_lc, constants.tokenSecretChangeInterval)
|
2017-10-23 13:13:06 -04:00
|
|
|
# Start refreshing k-buckets periodically, if necessary
|
2018-05-23 17:02:25 -04:00
|
|
|
self.safe_start_looping_call(self._refresh_node_lc, constants.checkRefreshInterval)
|
2018-05-29 11:05:33 -04:00
|
|
|
self.safe_start_looping_call(self._refresh_contacts_lc, 60)
|
2018-02-15 17:30:14 -05:00
|
|
|
|
2017-10-10 13:28:57 -04:00
|
|
|
@property
|
|
|
|
def contacts(self):
|
|
|
|
def _inner():
|
|
|
|
for i in range(len(self._routingTable._buckets)):
|
|
|
|
for contact in self._routingTable._buckets[i]._contacts:
|
|
|
|
yield contact
|
|
|
|
return list(_inner())
|
|
|
|
|
2018-02-01 17:21:52 +08:00
|
|
|
def hasContacts(self):
|
|
|
|
for bucket in self._routingTable._buckets:
|
|
|
|
if bucket._contacts:
|
|
|
|
return True
|
|
|
|
return False
|
|
|
|
|
2018-05-23 18:01:30 -04:00
|
|
|
def bucketsWithContacts(self):
|
|
|
|
return self._routingTable.bucketsWithContacts()
|
2015-08-20 11:27:15 -04:00
|
|
|
|
2018-06-05 15:08:49 -04:00
|
|
|
@defer.inlineCallbacks
|
|
|
|
def storeToContact(self, blob_hash, contact):
|
|
|
|
try:
|
2018-09-28 14:19:51 -03:00
|
|
|
if not contact.token:
|
|
|
|
yield contact.findValue(blob_hash)
|
|
|
|
res = yield contact.store(blob_hash, contact.token, self.peerPort, self.node_id, 0)
|
2018-07-24 18:51:41 -03:00
|
|
|
if res != b"OK":
|
2018-06-05 15:08:49 -04:00
|
|
|
raise ValueError(res)
|
|
|
|
log.debug("Stored %s to %s (%s)", binascii.hexlify(blob_hash), contact.log_id(), contact.address)
|
2018-09-28 14:19:51 -03:00
|
|
|
return True
|
2018-06-05 15:08:49 -04:00
|
|
|
except protocol.TimeoutError:
|
|
|
|
log.debug("Timeout while storing blob_hash %s at %s",
|
|
|
|
binascii.hexlify(blob_hash), contact.log_id())
|
|
|
|
except ValueError as err:
|
2018-07-24 18:51:41 -03:00
|
|
|
log.error("Unexpected response: %s" % err)
|
2018-06-05 15:08:49 -04:00
|
|
|
except Exception as err:
|
2018-09-28 14:19:51 -03:00
|
|
|
if 'Invalid token' in str(err):
|
|
|
|
contact.update_token(None)
|
2018-06-05 15:08:49 -04:00
|
|
|
log.error("Unexpected error while storing blob_hash %s at %s: %s",
|
|
|
|
binascii.hexlify(blob_hash), contact, err)
|
2018-09-28 14:19:51 -03:00
|
|
|
return False
|
2018-06-05 15:08:49 -04:00
|
|
|
|
2017-10-10 13:12:47 -04:00
|
|
|
@defer.inlineCallbacks
|
2018-05-23 18:09:41 -04:00
|
|
|
def announceHaveBlob(self, blob_hash):
|
2018-03-27 15:04:47 -04:00
|
|
|
contacts = yield self.iterativeFindNode(blob_hash)
|
|
|
|
|
2018-06-05 15:08:49 -04:00
|
|
|
if not self.externalIP:
|
|
|
|
raise Exception("Cannot determine external IP: %s" % self.externalIP)
|
|
|
|
stored_to = yield DeferredDict({contact: self.storeToContact(blob_hash, contact) for contact in contacts})
|
2018-07-24 18:51:41 -03:00
|
|
|
contacted_node_ids = [binascii.hexlify(contact.id) for contact in stored_to.keys() if stored_to[contact]]
|
2018-05-31 10:50:11 -04:00
|
|
|
log.debug("Stored %s to %i of %i attempted peers", binascii.hexlify(blob_hash),
|
2018-07-31 13:20:25 -04:00
|
|
|
len(contacted_node_ids), len(contacts))
|
2018-03-27 15:04:47 -04:00
|
|
|
defer.returnValue(contacted_node_ids)
|
2015-08-20 11:27:15 -04:00
|
|
|
|
|
|
|
def change_token(self):
|
|
|
|
self.old_token_secret = self.token_secret
|
|
|
|
self.token_secret = self._generateID()
|
|
|
|
|
|
|
|
def make_token(self, compact_ip):
|
|
|
|
h = hashlib.new('sha384')
|
|
|
|
h.update(self.token_secret + compact_ip)
|
|
|
|
return h.digest()
|
|
|
|
|
|
|
|
def verify_token(self, token, compact_ip):
|
|
|
|
h = hashlib.new('sha384')
|
|
|
|
h.update(self.token_secret + compact_ip)
|
2018-06-14 15:07:10 -04:00
|
|
|
if self.old_token_secret and not token == h.digest(): # TODO: why should we be accepting the previous token?
|
2015-08-20 11:27:15 -04:00
|
|
|
h = hashlib.new('sha384')
|
|
|
|
h.update(self.old_token_secret + compact_ip)
|
|
|
|
if not token == h.digest():
|
|
|
|
return False
|
|
|
|
return True
|
|
|
|
|
|
|
|
def iterativeFindNode(self, key):
|
|
|
|
""" The basic Kademlia node lookup operation
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
Call this to find a remote node in the P2P overlay network.
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
@param key: the n-bit key (i.e. the node or value ID) to search for
|
|
|
|
@type key: str
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
@return: This immediately returns a deferred object, which will return
|
|
|
|
a list of k "closest" contacts (C{kademlia.contact.Contact}
|
|
|
|
objects) to the specified key as soon as the operation is
|
|
|
|
finished.
|
|
|
|
@rtype: twisted.internet.defer.Deferred
|
|
|
|
"""
|
|
|
|
return self._iterativeFind(key)
|
|
|
|
|
2017-05-25 14:01:39 -04:00
|
|
|
@defer.inlineCallbacks
|
2018-07-05 21:38:52 -03:00
|
|
|
def iterativeFindValue(self, key, exclude=None):
|
2015-08-20 11:27:15 -04:00
|
|
|
""" The Kademlia search operation (deterministic)
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
Call this to retrieve data from the DHT.
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
@param key: the n-bit key (i.e. the value ID) to search for
|
|
|
|
@type key: str
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
@return: This immediately returns a deferred object, which will return
|
|
|
|
either one of two things:
|
|
|
|
- If the value was found, it will return a Python
|
|
|
|
dictionary containing the searched-for key (the C{key}
|
|
|
|
parameter passed to this method), and its associated
|
|
|
|
value, in the format:
|
|
|
|
C{<str>key: <str>data_value}
|
|
|
|
- If the value was not found, it will return a list of k
|
|
|
|
"closest" contacts (C{kademlia.contact.Contact} objects)
|
|
|
|
to the specified key
|
|
|
|
@rtype: twisted.internet.defer.Deferred
|
|
|
|
"""
|
|
|
|
|
2018-07-24 18:51:41 -03:00
|
|
|
if len(key) != constants.key_bits // 8:
|
2018-05-23 18:09:41 -04:00
|
|
|
raise ValueError("invalid key length!")
|
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
# Execute the search
|
2018-07-05 21:38:52 -03:00
|
|
|
find_result = yield self._iterativeFind(key, rpc='findValue', exclude=exclude)
|
2018-05-23 18:09:41 -04:00
|
|
|
if isinstance(find_result, dict):
|
2018-02-20 13:39:14 -05:00
|
|
|
# We have found the value; now see who was the closest contact without it...
|
|
|
|
# ...and store the key/value pair
|
2018-05-23 18:09:41 -04:00
|
|
|
pass
|
2018-02-20 13:39:14 -05:00
|
|
|
else:
|
|
|
|
# The value wasn't found, but a list of contacts was returned
|
|
|
|
# Now, see if we have the value (it might seem wasteful to search on the network
|
|
|
|
# first, but it ensures that all values are properly propagated through the
|
|
|
|
# network
|
|
|
|
if self._dataStore.hasPeersForBlob(key):
|
|
|
|
# Ok, we have the value locally, so use that
|
|
|
|
# Send this value to the closest node without it
|
|
|
|
peers = self._dataStore.getPeersForBlob(key)
|
2018-05-23 18:09:41 -04:00
|
|
|
find_result = {key: peers}
|
2018-02-20 13:39:14 -05:00
|
|
|
else:
|
2018-05-23 18:09:41 -04:00
|
|
|
pass
|
|
|
|
|
2018-08-10 18:23:07 -03:00
|
|
|
defer.returnValue(list(set(find_result.get(key, []) if find_result else [])))
|
|
|
|
# TODO: get this working
|
|
|
|
# if 'closestNodeNoValue' in find_result:
|
|
|
|
# closest_node_without_value = find_result['closestNodeNoValue']
|
|
|
|
# try:
|
|
|
|
# response, address = yield closest_node_without_value.findValue(key, rawResponse=True)
|
|
|
|
# yield closest_node_without_value.store(key, response.response['token'], self.peerPort)
|
|
|
|
# except TimeoutError:
|
|
|
|
# pass
|
2015-08-20 11:27:15 -04:00
|
|
|
|
|
|
|
def addContact(self, contact):
|
|
|
|
""" Add/update the given contact; simple wrapper for the same method
|
|
|
|
in this object's RoutingTable object
|
|
|
|
|
|
|
|
@param contact: The contact to add to this node's k-buckets
|
|
|
|
@type contact: kademlia.contact.Contact
|
|
|
|
"""
|
2018-05-23 17:32:55 -04:00
|
|
|
return self._routingTable.addContact(contact)
|
2015-08-20 11:27:15 -04:00
|
|
|
|
2018-05-23 17:32:55 -04:00
|
|
|
def removeContact(self, contact):
|
2015-08-20 11:27:15 -04:00
|
|
|
""" Remove the contact with the specified node ID from this node's
|
|
|
|
table of known nodes. This is a simple wrapper for the same method
|
|
|
|
in this object's RoutingTable object
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2018-05-23 17:32:55 -04:00
|
|
|
@param contact: The Contact object to remove
|
|
|
|
@type contact: _Contact
|
2015-08-20 11:27:15 -04:00
|
|
|
"""
|
2018-05-23 17:32:55 -04:00
|
|
|
self._routingTable.removeContact(contact)
|
2015-08-20 11:27:15 -04:00
|
|
|
|
|
|
|
def findContact(self, contactID):
|
|
|
|
""" Find a entangled.kademlia.contact.Contact object for the specified
|
|
|
|
cotact ID
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
@param contactID: The contact ID of the required Contact object
|
|
|
|
@type contactID: str
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
@return: Contact object of remote node with the specified node ID,
|
|
|
|
or None if the contact was not found
|
|
|
|
@rtype: twisted.internet.defer.Deferred
|
|
|
|
"""
|
|
|
|
try:
|
2018-10-01 02:07:39 -03:00
|
|
|
df = defer.succeed(self._routingTable.getContact(contactID))
|
2018-05-23 17:32:55 -04:00
|
|
|
except (ValueError, IndexError):
|
2015-08-20 11:27:15 -04:00
|
|
|
df = self.iterativeFindNode(contactID)
|
2018-10-01 02:07:39 -03:00
|
|
|
df.addCallback(lambda nodes: ([node for node in nodes if node.id == contactID] or (None,))[0])
|
2015-08-20 11:27:15 -04:00
|
|
|
return df
|
|
|
|
|
|
|
|
@rpcmethod
|
|
|
|
def ping(self):
|
|
|
|
""" Used to verify contact between two Kademlia nodes
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
@rtype: str
|
|
|
|
"""
|
2018-07-20 16:45:58 -03:00
|
|
|
return b'pong'
|
2015-08-20 11:27:15 -04:00
|
|
|
|
|
|
|
@rpcmethod
|
2018-05-31 10:50:11 -04:00
|
|
|
def store(self, rpc_contact, blob_hash, token, port, originalPublisherID, age):
|
2018-05-24 15:52:37 -04:00
|
|
|
""" Store the received data in this node's local datastore
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2018-05-24 15:52:37 -04:00
|
|
|
@param blob_hash: The hash of the data
|
2018-05-23 17:32:55 -04:00
|
|
|
@type blob_hash: str
|
2018-05-24 15:52:37 -04:00
|
|
|
|
|
|
|
@param token: The token we previously returned when this contact sent us a findValue
|
|
|
|
@type token: str
|
|
|
|
|
|
|
|
@param port: The TCP port the contact is listening on for requests for this blob (the peerPort)
|
|
|
|
@type port: int
|
|
|
|
|
|
|
|
@param originalPublisherID: The node ID of the node that is the publisher of the data
|
2015-08-20 11:27:15 -04:00
|
|
|
@type originalPublisherID: str
|
2018-05-24 15:52:37 -04:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
@param age: The relative age of the data (time in seconds since it was
|
|
|
|
originally published). Note that the original publish time
|
|
|
|
isn't actually given, to compensate for clock skew between
|
|
|
|
different nodes.
|
|
|
|
@type age: int
|
|
|
|
|
|
|
|
@rtype: str
|
|
|
|
"""
|
2018-05-24 15:52:37 -04:00
|
|
|
|
2017-04-25 14:21:13 -04:00
|
|
|
if originalPublisherID is None:
|
2018-05-23 17:32:55 -04:00
|
|
|
originalPublisherID = rpc_contact.id
|
|
|
|
compact_ip = rpc_contact.compact_ip()
|
2018-06-29 12:00:52 -04:00
|
|
|
if self.clock.seconds() - self._protocol.started_listening_time < constants.tokenSecretChangeInterval:
|
|
|
|
pass
|
|
|
|
elif not self.verify_token(token, compact_ip):
|
2018-05-23 17:32:55 -04:00
|
|
|
raise ValueError("Invalid token")
|
|
|
|
if 0 <= port <= 65536:
|
2018-08-22 01:12:46 -03:00
|
|
|
compact_port = port.to_bytes(2, 'big')
|
2015-08-20 11:27:15 -04:00
|
|
|
else:
|
2018-10-18 13:42:45 +03:00
|
|
|
raise TypeError(f'Invalid port: {port}')
|
2018-05-23 17:32:55 -04:00
|
|
|
compact_address = compact_ip + compact_port + rpc_contact.id
|
2018-05-24 10:23:22 -04:00
|
|
|
now = int(self.clock.seconds())
|
2018-05-23 17:32:55 -04:00
|
|
|
originallyPublished = now - age
|
2018-05-24 15:52:37 -04:00
|
|
|
self._dataStore.addPeerToBlob(rpc_contact, blob_hash, compact_address, now, originallyPublished,
|
|
|
|
originalPublisherID)
|
2018-07-20 16:45:58 -03:00
|
|
|
return b'OK'
|
2015-08-20 11:27:15 -04:00
|
|
|
|
|
|
|
@rpcmethod
|
2018-05-23 17:32:55 -04:00
|
|
|
def findNode(self, rpc_contact, key):
|
2015-08-20 11:27:15 -04:00
|
|
|
""" Finds a number of known nodes closest to the node/value with the
|
|
|
|
specified key.
|
2016-11-04 15:09:40 -05:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
@param key: the n-bit key (i.e. the node or value ID) to search for
|
|
|
|
@type key: str
|
|
|
|
|
|
|
|
@return: A list of contact triples closest to the specified key.
|
|
|
|
This method will return C{k} (or C{count}, if specified)
|
|
|
|
contacts if at all possible; it will only return fewer if the
|
|
|
|
node is returning all of the contacts that it knows of.
|
|
|
|
@rtype: list
|
|
|
|
"""
|
2018-07-24 18:51:41 -03:00
|
|
|
if len(key) != constants.key_bits // 8:
|
2018-05-23 17:32:55 -04:00
|
|
|
raise ValueError("invalid contact id length: %i" % len(key))
|
2017-10-10 13:29:29 -04:00
|
|
|
|
2018-07-02 10:57:29 -04:00
|
|
|
contacts = self._routingTable.findCloseNodes(key, sender_node_id=rpc_contact.id)
|
2017-04-10 10:51:49 -04:00
|
|
|
contact_triples = []
|
2015-08-20 11:27:15 -04:00
|
|
|
for contact in contacts:
|
2017-04-10 10:51:49 -04:00
|
|
|
contact_triples.append((contact.id, contact.address, contact.port))
|
|
|
|
return contact_triples
|
2015-08-20 11:27:15 -04:00
|
|
|
|
|
|
|
@rpcmethod
|
2018-05-23 17:32:55 -04:00
|
|
|
def findValue(self, rpc_contact, key):
|
2015-08-20 11:27:15 -04:00
|
|
|
""" Return the value associated with the specified key if present in
|
|
|
|
this node's data, otherwise execute FIND_NODE for the key
|
2016-11-04 15:09:40 -05:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
@param key: The hashtable key of the data to return
|
|
|
|
@type key: str
|
2016-11-04 15:09:40 -05:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
@return: A dictionary containing the requested key/value pair,
|
|
|
|
or a list of contact triples closest to the requested key.
|
|
|
|
@rtype: dict or list
|
|
|
|
"""
|
2017-05-25 14:01:39 -04:00
|
|
|
|
2018-07-24 18:51:41 -03:00
|
|
|
if len(key) != constants.key_bits // 8:
|
2018-05-23 17:32:55 -04:00
|
|
|
raise ValueError("invalid blob hash length: %i" % len(key))
|
|
|
|
|
|
|
|
response = {
|
2018-07-20 16:45:58 -03:00
|
|
|
b'token': self.make_token(rpc_contact.compact_ip()),
|
2018-05-23 17:32:55 -04:00
|
|
|
}
|
|
|
|
|
2018-05-31 10:50:11 -04:00
|
|
|
if self._protocol._protocolVersion:
|
2018-07-20 16:45:58 -03:00
|
|
|
response[b'protocolVersion'] = self._protocol._protocolVersion
|
2018-05-31 10:50:11 -04:00
|
|
|
|
2018-06-29 12:01:46 -04:00
|
|
|
# get peers we have stored for this blob
|
|
|
|
has_other_peers = self._dataStore.hasPeersForBlob(key)
|
|
|
|
peers = []
|
|
|
|
if has_other_peers:
|
|
|
|
peers.extend(self._dataStore.getPeersForBlob(key))
|
|
|
|
|
|
|
|
# if we don't have k storing peers to return and we have this hash locally, include our contact information
|
|
|
|
if len(peers) < constants.k and key in self._dataStore.completed_blobs:
|
2018-07-20 16:45:58 -03:00
|
|
|
compact_ip = reduce(lambda buff, x: buff + bytearray([int(x)]), self.externalIP.split('.'), bytearray())
|
2018-08-22 01:12:46 -03:00
|
|
|
compact_port = self.peerPort.to_bytes(2, 'big')
|
2018-06-29 12:01:46 -04:00
|
|
|
compact_address = compact_ip + compact_port + self.node_id
|
|
|
|
peers.append(compact_address)
|
|
|
|
|
|
|
|
if peers:
|
|
|
|
response[key] = peers
|
2015-08-20 11:27:15 -04:00
|
|
|
else:
|
2018-07-20 16:45:58 -03:00
|
|
|
response[b'contacts'] = self.findNode(rpc_contact, key)
|
2018-05-23 17:32:55 -04:00
|
|
|
return response
|
2015-08-20 11:27:15 -04:00
|
|
|
|
|
|
|
def _generateID(self):
|
|
|
|
""" Generates an n-bit pseudo-random identifier
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
@return: A globally unique n-bit pseudo-random identifier
|
|
|
|
@rtype: str
|
|
|
|
"""
|
2017-04-10 10:51:49 -04:00
|
|
|
return generate_id()
|
2015-08-20 11:27:15 -04:00
|
|
|
|
2018-11-04 14:06:29 -05:00
|
|
|
# from lbrynet.p2p.utils import profile_deferred
|
2018-06-06 17:21:56 -04:00
|
|
|
# @profile_deferred()
|
2017-05-25 14:01:39 -04:00
|
|
|
@defer.inlineCallbacks
|
2018-07-05 21:38:52 -03:00
|
|
|
def _iterativeFind(self, key, startupShortlist=None, rpc='findNode', exclude=None):
|
2015-08-20 11:27:15 -04:00
|
|
|
""" The basic Kademlia iterative lookup operation (for nodes/values)
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
This builds a list of k "closest" contacts through iterative use of
|
|
|
|
the "FIND_NODE" RPC, or if C{findValue} is set to C{True}, using the
|
|
|
|
"FIND_VALUE" RPC, in which case the value (if found) may be returned
|
|
|
|
instead of a list of contacts
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
@param key: the n-bit key (i.e. the node or value ID) to search for
|
|
|
|
@type key: str
|
|
|
|
@param startupShortlist: A list of contacts to use as the starting
|
|
|
|
shortlist for this search; this is normally
|
|
|
|
only used when the node joins the network
|
|
|
|
@type startupShortlist: list
|
|
|
|
@param rpc: The name of the RPC to issue to remote nodes during the
|
|
|
|
Kademlia lookup operation (e.g. this sets whether this
|
|
|
|
algorithm should search for a data value (if
|
|
|
|
rpc='findValue') or not. It can thus be used to perform
|
|
|
|
other operations that piggy-back on the basic Kademlia
|
|
|
|
lookup operation (Entangled's "delete" RPC, for instance).
|
|
|
|
@type rpc: str
|
2016-12-13 17:08:29 -06:00
|
|
|
|
2015-08-20 11:27:15 -04:00
|
|
|
@return: If C{findValue} is C{True}, the algorithm will stop as soon
|
|
|
|
as a data value for C{key} is found, and return a dictionary
|
|
|
|
containing the key and the found value. Otherwise, it will
|
|
|
|
return a list of the k closest nodes to the specified key
|
|
|
|
@rtype: twisted.internet.defer.Deferred
|
|
|
|
"""
|
2018-05-23 17:32:55 -04:00
|
|
|
|
2018-07-24 18:51:41 -03:00
|
|
|
if len(key) != constants.key_bits // 8:
|
2018-05-23 17:32:55 -04:00
|
|
|
raise ValueError("invalid key length: %i" % len(key))
|
2017-04-10 10:51:49 -04:00
|
|
|
|
2017-04-25 14:21:13 -04:00
|
|
|
if startupShortlist is None:
|
2018-07-02 10:57:29 -04:00
|
|
|
shortlist = self._routingTable.findCloseNodes(key)
|
2018-05-23 17:32:55 -04:00
|
|
|
# if key != self.node_id:
|
|
|
|
# # Update the "last accessed" timestamp for the appropriate k-bucket
|
|
|
|
# self._routingTable.touchKBucket(key)
|
2015-08-20 11:27:15 -04:00
|
|
|
if len(shortlist) == 0:
|
2018-10-18 14:40:37 +03:00
|
|
|
log.warning("This node doesn't know any other nodes")
|
2015-08-20 11:27:15 -04:00
|
|
|
# This node doesn't know of any other nodes
|
|
|
|
fakeDf = defer.Deferred()
|
|
|
|
fakeDf.callback([])
|
2017-05-25 14:01:39 -04:00
|
|
|
result = yield fakeDf
|
|
|
|
defer.returnValue(result)
|
2015-08-20 11:27:15 -04:00
|
|
|
else:
|
2018-05-23 17:32:55 -04:00
|
|
|
# This is used during the bootstrap process
|
2015-08-20 11:27:15 -04:00
|
|
|
shortlist = startupShortlist
|
|
|
|
|
2018-07-05 21:38:52 -03:00
|
|
|
result = yield iterativeFind(self, shortlist, key, rpc, exclude=exclude)
|
2017-05-25 14:01:39 -04:00
|
|
|
defer.returnValue(result)
|
2015-08-20 11:27:15 -04:00
|
|
|
|
2017-10-23 13:13:06 -04:00
|
|
|
@defer.inlineCallbacks
|
2015-08-20 11:27:15 -04:00
|
|
|
def _refreshNode(self):
|
|
|
|
""" Periodically called to perform k-bucket refreshes and data
|
|
|
|
replication/republishing as necessary """
|
2017-10-23 13:13:06 -04:00
|
|
|
yield self._refreshRoutingTable()
|
|
|
|
self._dataStore.removeExpiredPeers()
|
2018-09-28 10:51:07 -03:00
|
|
|
self._refreshStoringPeers()
|
2017-10-23 13:13:06 -04:00
|
|
|
defer.returnValue(None)
|
2015-08-20 11:27:15 -04:00
|
|
|
|
2018-05-23 18:11:41 -04:00
|
|
|
def _refreshContacts(self):
|
2018-09-30 23:53:32 -03:00
|
|
|
self._protocol._ping_queue.enqueue_maybe_ping(*self.contacts, delay=0)
|
2018-05-23 18:11:41 -04:00
|
|
|
|
2018-05-24 15:52:37 -04:00
|
|
|
def _refreshStoringPeers(self):
|
2018-09-30 23:53:32 -03:00
|
|
|
self._protocol._ping_queue.enqueue_maybe_ping(*self._dataStore.getStoringContacts(), delay=0)
|
2018-05-24 15:52:37 -04:00
|
|
|
|
2017-10-23 15:36:50 -04:00
|
|
|
@defer.inlineCallbacks
|
2015-08-20 11:27:15 -04:00
|
|
|
def _refreshRoutingTable(self):
|
2018-05-29 11:05:33 -04:00
|
|
|
nodeIDs = self._routingTable.getRefreshList(0, False)
|
2017-10-23 15:36:50 -04:00
|
|
|
while nodeIDs:
|
|
|
|
searchID = nodeIDs.pop()
|
|
|
|
yield self.iterativeFindNode(searchID)
|
|
|
|
defer.returnValue(None)
|