2019-01-22 12:49:43 -05:00
|
|
|
import typing
|
|
|
|
import asyncio
|
|
|
|
import logging
|
2019-09-27 04:34:58 -03:00
|
|
|
from dataclasses import dataclass, field
|
|
|
|
from functools import lru_cache
|
2021-12-10 03:48:33 -03:00
|
|
|
|
|
|
|
from prometheus_client import Gauge
|
|
|
|
|
2021-06-04 11:54:37 -03:00
|
|
|
from lbry.utils import is_valid_public_ipv4 as _is_valid_public_ipv4, LRUCache
|
2019-06-20 20:55:47 -04:00
|
|
|
from lbry.dht import constants
|
|
|
|
from lbry.dht.serialization.datagram import make_compact_address, make_compact_ip, decode_compact_address
|
2019-01-22 12:49:43 -05:00
|
|
|
|
2021-01-21 16:20:53 -05:00
|
|
|
# Module-wide override: when truthy, is_valid_public_ipv4() passes allow_localhost=True to the
# underlying validator regardless of the argument its caller supplied.
ALLOW_LOCALHOST = False
|
2022-01-29 14:23:41 -03:00
|
|
|
# Capacity shared by the make_kademlia_peer() lru_cache and by every LRUCache held by PeerManager.
CACHE_SIZE = 16384
|
2019-01-22 12:49:43 -05:00
|
|
|
# Module-level logger, named after this module.
log = logging.getLogger(__name__)
|
2019-09-25 12:39:34 -03:00
|
|
|
|
|
|
|
|
2022-01-07 12:58:52 -03:00
|
|
|
@lru_cache(CACHE_SIZE)
def make_kademlia_peer(node_id: typing.Optional[bytes], address: typing.Optional[str],
                       udp_port: typing.Optional[int] = None,
                       tcp_port: typing.Optional[int] = None,
                       allow_localhost: bool = False) -> 'KademliaPeer':
    """
    Build a KademliaPeer from its contact details.

    Calls are memoized with an LRU cache of CACHE_SIZE entries, so repeating a call with the
    same arguments hands back the same KademliaPeer object for as long as it stays cached.

    :param node_id: node id of the peer, or None when it is not known
    :param address: address of the peer
    :param udp_port: UDP port of the peer, if any
    :param tcp_port: TCP port of the peer, if any
    :param allow_localhost: forwarded to KademliaPeer for its address validation
    :return: the (possibly cached) KademliaPeer
    :raises ValueError: propagated from KademliaPeer validation
    """
    return KademliaPeer(
        address=address,
        _node_id=node_id,
        udp_port=udp_port,
        tcp_port=tcp_port,
        allow_localhost=allow_localhost,
    )
|
2019-01-22 12:49:43 -05:00
|
|
|
|
|
|
|
|
2019-11-29 15:28:41 -05:00
|
|
|
def is_valid_public_ipv4(address, allow_localhost: bool = False):
    """
    Validate `address` with lbry.utils.is_valid_public_ipv4.

    The localhost flag handed to the underlying validator is True when either the
    `allow_localhost` argument or the module-level ALLOW_LOCALHOST switch is truthy.

    :param address: address to check
    :param allow_localhost: per-call request to allow localhost
    :return: whatever the underlying validator returns for the address and effective flag
    """
    return _is_valid_public_ipv4(address, bool(allow_localhost or ALLOW_LOCALHOST))
|
2019-01-22 12:49:43 -05:00
|
|
|
|
|
|
|
|
|
|
|
class PeerManager:
    """
    Bookkeeping about DHT peers, keyed by (address, udp_port) or by node id.

    Every table is an LRUCache of capacity CACHE_SIZE:

    - RPC failure timestamps (previous and most recent) per (address, udp_port)
    - last sent / last replied / last requested timestamps per (address, udp_port)
    - a two-way mapping between (address, udp_port) and node id
    - tokens per node id, stored together with the time they were recorded

    All timestamps come from the event loop clock (`loop.time()`).
    """
    peer_manager_keys_metric = Gauge(
        "peer_manager_keys", "Number of keys tracked by PeerManager dicts (sum)", namespace="dht_node",
        labelnames=("scope",)
    )

    def __init__(self, loop: asyncio.AbstractEventLoop):
        """
        :param loop: event loop whose `time()` is used as the clock for all timestamps
        """
        self._loop = loop
        # (address, udp_port) -> (previous failure time, most recent failure time)
        self._rpc_failures: typing.Dict[
            typing.Tuple[str, int], typing.Tuple[typing.Optional[float], typing.Optional[float]]
        ] = LRUCache(CACHE_SIZE)
        self._last_replied: typing.Dict[typing.Tuple[str, int], float] = LRUCache(CACHE_SIZE)
        self._last_sent: typing.Dict[typing.Tuple[str, int], float] = LRUCache(CACHE_SIZE)
        self._last_requested: typing.Dict[typing.Tuple[str, int], float] = LRUCache(CACHE_SIZE)
        self._node_id_mapping: typing.Dict[typing.Tuple[str, int], bytes] = LRUCache(CACHE_SIZE)
        self._node_id_reverse_mapping: typing.Dict[bytes, typing.Tuple[str, int]] = LRUCache(CACHE_SIZE)
        # node id -> (time the token was recorded, token)
        self._node_tokens: typing.Dict[bytes, typing.Tuple[float, bytes]] = LRUCache(CACHE_SIZE)

    def count_cache_keys(self) -> int:
        """
        :return: total number of keys currently held across all of the internal caches
        """
        caches = (
            self._rpc_failures, self._last_replied, self._last_sent, self._last_requested,
            self._node_id_mapping, self._node_id_reverse_mapping, self._node_tokens,
        )
        return sum(len(cache) for cache in caches)

    def reset(self):
        """
        Clear the failure and last sent/replied/requested statistics.

        The node id mappings and the tokens are left untouched.
        """
        for statistic in (self._rpc_failures, self._last_replied, self._last_sent, self._last_requested):
            statistic.clear()

    def report_failure(self, address: str, udp_port: int):
        """
        Record an RPC failure for the peer at (address, udp_port).

        The previously most recent failure time becomes the "previous" one and the current
        loop time becomes the most recent one.
        """
        now = self._loop.time()
        key = (address, udp_port)
        _, previous = self._rpc_failures.pop(key, (None, None))
        self._rpc_failures[key] = (previous, now)

    def report_last_sent(self, address: str, udp_port: int):
        """Record the current loop time as the last-sent time for (address, udp_port)."""
        self._last_sent[(address, udp_port)] = self._loop.time()

    def report_last_replied(self, address: str, udp_port: int):
        """Record the current loop time as the last-replied time for (address, udp_port)."""
        self._last_replied[(address, udp_port)] = self._loop.time()

    def report_last_requested(self, address: str, udp_port: int):
        """Record the current loop time as the last-requested time for (address, udp_port)."""
        self._last_requested[(address, udp_port)] = self._loop.time()

    def clear_token(self, node_id: bytes):
        """Forget the token stored for `node_id`, if there is one."""
        self._node_tokens.pop(node_id, None)

    def update_token(self, node_id: bytes, token: bytes):
        """Store `token` for `node_id`, stamped with the current loop time."""
        self._node_tokens[node_id] = (self._loop.time(), token)

    def get_node_token(self, node_id: bytes) -> typing.Optional[bytes]:
        """
        :return: the token stored for `node_id` if it was recorded less than
            constants.TOKEN_SECRET_REFRESH_INTERVAL ago, otherwise None
        """
        ts, token = self._node_tokens.get(node_id, (0, None))
        if ts and ts > self._loop.time() - constants.TOKEN_SECRET_REFRESH_INTERVAL:
            return token
        return None

    def get_last_replied(self, address: str, udp_port: int) -> typing.Optional[float]:
        """
        :return: loop time of the last recorded reply from (address, udp_port), or None
        """
        return self._last_replied.get((address, udp_port))

    def update_contact_triple(self, node_id: bytes, address: str, udp_port: int):
        """
        Update the mapping of node_id -> address tuple and that of address tuple -> node_id
        This is to handle peers changing addresses and ids while assuring that we only ever have
        one node id / address tuple mapped to each other
        """
        addr_tup = (address, udp_port)
        # drop whatever node id was previously associated with this address
        if addr_tup in self._node_id_mapping:
            self._node_id_reverse_mapping.pop(self._node_id_mapping.pop(addr_tup))
        # drop whatever address was previously associated with this node id
        if node_id in self._node_id_reverse_mapping:
            self._node_id_mapping.pop(self._node_id_reverse_mapping.pop(node_id))
        self._node_id_mapping[addr_tup] = node_id
        self._node_id_reverse_mapping[node_id] = addr_tup
        self.peer_manager_keys_metric.labels("global").set(self.count_cache_keys())

    def prune(self):  # TODO: periodically call this
        """
        Drop stale entries.

        Removes failure records whose most recent failure is older than
        constants.RPC_ATTEMPTS_PRUNING_WINDOW and tokens recorded more than
        constants.TOKEN_SECRET_REFRESH_INTERVAL ago.
        """
        now = self._loop.time()

        # collect first, delete afterwards: the caches must not change size while being iterated
        failure_cutoff = now - constants.RPC_ATTEMPTS_PRUNING_WINDOW
        stale_failures = [
            key for key, (_, last_failure) in self._rpc_failures.items()
            if last_failure and last_failure < failure_cutoff
        ]
        for key in stale_failures:
            del self._rpc_failures[key]

        token_cutoff = now - constants.TOKEN_SECRET_REFRESH_INTERVAL
        stale_tokens = [
            node_id for node_id, (stored_at, _) in self._node_tokens.items()
            if stored_at < token_cutoff
        ]
        for node_id in stale_tokens:
            del self._node_tokens[node_id]

    def contact_triple_is_good(self, node_id: bytes, address: str, udp_port: int) -> typing.Optional[bool]:  # pylint: disable=too-many-return-statements
        """
        :return: False if peer is bad, None if peer is unknown, or True if peer is good
        """

        delay = self._loop.time() - constants.CHECK_REFRESH_INTERVAL

        # fixme: find a way to re-enable that without breaking other parts
        # if node_id not in self._node_id_reverse_mapping or (address, udp_port) not in self._node_id_mapping:
        #     return
        # addr_tup = (address, udp_port)
        # if self._node_id_reverse_mapping[node_id] != addr_tup or self._node_id_mapping[addr_tup] != node_id:
        #     return
        previous_failure, most_recent_failure = self._rpc_failures.get((address, udp_port), (None, None))
        last_requested = self._last_requested.get((address, udp_port))
        last_replied = self._last_replied.get((address, udp_port))
        if node_id is None:
            return None
        if most_recent_failure and last_replied:
            if delay < last_replied > most_recent_failure:
                # replied after the last failure and within the refresh interval
                return True
            elif last_replied > most_recent_failure:
                # replied after the last failure, but too long ago to still count as good
                return None
            # the most recent event for this peer is a failure
            return False
        elif previous_failure and most_recent_failure and most_recent_failure > delay:
            # at least two failures, the latest within the refresh interval
            return False
        elif last_replied and last_replied > delay:
            return True
        elif last_requested and last_requested > delay:
            return None
        return None

    def peer_is_good(self, peer: 'KademliaPeer') -> typing.Optional[bool]:
        """
        :return: result of contact_triple_is_good for the peer's node id, address and udp port
        """
        return self.contact_triple_is_good(peer.node_id, peer.address, peer.udp_port)

    def decode_tcp_peer_from_compact_address(self, compact_address: bytes) -> 'KademliaPeer':  # pylint: disable=no-self-use
        """
        Decode a compact address into a KademliaPeer that carries a TCP port and no UDP port.
        """
        node_id, address, tcp_port = decode_compact_address(compact_address)
        return make_kademlia_peer(node_id, address, udp_port=None, tcp_port=tcp_port)
|
2019-01-22 12:49:43 -05:00
|
|
|
|
|
|
|
|
2019-09-27 04:34:58 -03:00
|
|
|
@dataclass(unsafe_hash=True)
class KademliaPeer:
    """
    Contact details of a DHT peer.

    Equality and hashing only take `address`, `_node_id` and `udp_port` into account; the
    remaining fields are excluded from both, so `tcp_port` can be updated after creation
    without changing the hash.

    :raises ValueError: on construction, when the node id does not have constants.HASH_LENGTH
        bytes, when a given port is outside 1024-65535, or when the address fails
        is_valid_public_ipv4
    """
    address: str = field(hash=True)
    _node_id: typing.Optional[bytes] = field(hash=True)
    udp_port: typing.Optional[int] = field(hash=True)
    tcp_port: typing.Optional[int] = field(compare=False, hash=False)
    protocol_version: typing.Optional[int] = field(default=1, compare=False, hash=False)
    allow_localhost: bool = field(default=False, compare=False, hash=False)

    def __post_init__(self):
        """Validate node id length, port ranges and the address, in that order."""
        if self._node_id is not None and len(self._node_id) != constants.HASH_LENGTH:
            raise ValueError(f"invalid node_id: {self._node_id.hex()}")
        if self.udp_port is not None and not 1024 <= self.udp_port <= 65535:
            raise ValueError(f"invalid udp port: {self.address}:{self.udp_port}")
        if self.tcp_port is not None and not 1024 <= self.tcp_port <= 65535:
            raise ValueError(f"invalid tcp port: {self.address}:{self.tcp_port}")
        if not is_valid_public_ipv4(self.address, self.allow_localhost):
            raise ValueError(f"invalid ip address: '{self.address}'")

    def update_tcp_port(self, tcp_port: int):
        """Replace the stored TCP port; the new value is not re-validated."""
        self.tcp_port = tcp_port

    @property
    def node_id(self) -> typing.Optional[bytes]:
        """The peer's node id, or None when the peer was created without one."""
        return self._node_id

    def compact_address_udp(self) -> bytearray:
        """
        :return: make_compact_address() of the node id, address and UDP port
        """
        return make_compact_address(self.node_id, self.address, self.udp_port)

    def compact_address_tcp(self) -> bytearray:
        """
        :return: make_compact_address() of the node id, address and TCP port
        """
        return make_compact_address(self.node_id, self.address, self.tcp_port)

    def compact_ip(self):
        """
        :return: make_compact_ip() of the address
        """
        return make_compact_ip(self.address)
|