2019-03-15 14:00:49 -04:00
|
|
|
import contextlib
|
2022-02-18 18:53:10 -03:00
|
|
|
import logging
|
2019-03-15 14:00:49 -04:00
|
|
|
import typing
|
|
|
|
import binascii
|
2019-06-18 20:08:50 -04:00
|
|
|
import socket
|
2019-03-15 14:00:49 -04:00
|
|
|
import asyncio
|
2022-02-18 18:53:10 -03:00
|
|
|
|
2019-12-31 15:30:13 -05:00
|
|
|
from lbry.testcase import AsyncioTestCase
|
2019-03-15 14:00:49 -04:00
|
|
|
from tests import dht_mocks
|
2022-02-18 18:53:10 -03:00
|
|
|
from lbry.dht.protocol.distance import Distance
|
2019-06-20 21:02:58 -04:00
|
|
|
from lbry.conf import Config
|
|
|
|
from lbry.dht import constants
|
|
|
|
from lbry.dht.node import Node
|
2019-09-30 21:00:10 -03:00
|
|
|
from lbry.dht.peer import PeerManager, make_kademlia_peer
|
2019-06-20 21:02:58 -04:00
|
|
|
from lbry.dht.blob_announcer import BlobAnnouncer
|
|
|
|
from lbry.extras.daemon.storage import SQLiteStorage
|
2022-02-18 18:53:10 -03:00
|
|
|
|
2019-03-15 14:00:49 -04:00
|
|
|
|
|
|
|
class TestBlobAnnouncer(AsyncioTestCase):
    """Exercise ``BlobAnnouncer`` against a mocked, in-process DHT network.

    Every test builds one node under test (``self.node``) plus a dictionary
    of peer nodes (``self.nodes``, keyed by insertion order) that communicate
    through ``dht_mocks.mock_network_loop``.
    """

    async def setup_node(self, peer_addresses, address, node_id):
        """Build the node under test, its peers, storage and announcer.

        :param peer_addresses: iterable of ``(node_id, address)`` pairs, one
            per peer node to create.
        :param address: address the node under test listens on.
        :param node_id: id of the node under test.
        """
        self.nodes: typing.Dict[int, Node] = {}
        self.advance = dht_mocks.get_time_accelerator(self.loop)
        self.instant_advance = dht_mocks.get_time_accelerator(self.loop)
        self.conf = Config()
        self.peer_manager = PeerManager(self.loop)
        self.node = Node(self.loop, self.peer_manager, node_id, 4444, 4444, 3333, address)
        await self.node.start_listening(address)
        await asyncio.gather(*[
            self.add_peer(peer_id, peer_address) for peer_id, peer_address in peer_addresses
        ])
        # make every peer know about every other peer, in both directions
        for first_peer in self.nodes.values():
            for second_peer in self.nodes.values():
                if first_peer == second_peer:
                    continue
                self.add_peer_to_routing_table(first_peer, second_peer)
                self.add_peer_to_routing_table(second_peer, first_peer)
        await self.advance(0.1)  # just to make pings go through
        # mark the node as joined and start its refresh loop by hand
        self.node.joined.set()
        self.node._refresh_task = self.loop.create_task(self.node.refresh_node())
        self.storage = SQLiteStorage(self.conf, ":memory:", self.loop, self.loop.time)
        await self.storage.open()
        self.blob_announcer = BlobAnnouncer(self.loop, self.node, self.storage)

    async def add_peer(self, node_id, address, add_to_routing_table=True):
        """Create a listening peer node and register it in ``self.nodes``.

        :param node_id: id of the new peer.
        :param address: address the new peer listens on.
        :param add_to_routing_table: when true, the new peer is also added to
            the routing table of the node under test.
        """
        n = Node(self.loop, PeerManager(self.loop), node_id, 4444, 4444, 3333, address)
        await n.start_listening(address)
        # peers are keyed by insertion order: 0, 1, 2, ...
        self.nodes[len(self.nodes)] = n
        if add_to_routing_table:
            self.add_peer_to_routing_table(self.node, n)

    def add_peer_to_routing_table(self, adder, being_added):
        """Add ``being_added`` as a kademlia peer of ``adder``.

        The peer entry is built from the id, external ip and udp port exposed
        by ``being_added.protocol``.
        """
        adder.protocol.add_peer(
            make_kademlia_peer(
                being_added.protocol.node_id, being_added.protocol.external_ip, being_added.protocol.udp_port
            )
        )

    @contextlib.asynccontextmanager
    async def _test_network_context(self, peer_count=200):
        """Async context manager that runs a mocked network of ``peer_count`` peers.

        On exit (normal or not) the announcer, the node under test and every
        peer node are stopped.
        """
        # peer i gets id generate_id(i) and the IPv4 address 1.0.0.(i + 1)
        self.peer_addresses = [
            (constants.generate_id(i), socket.inet_ntoa((i + 0x01000001).to_bytes(length=4, byteorder='big')))
            for i in range(1, peer_count + 1)
        ]
        try:
            with dht_mocks.mock_network_loop(self.loop):
                await self.setup_node(self.peer_addresses, '1.2.3.1', constants.generate_id(1000))
                yield
        finally:
            self.blob_announcer.stop()
            self.node.stop()
            for n in self.nodes.values():
                n.stop()

    async def chain_peer(self, node_id, address):
        """Add a peer that only pings the previously added peer.

        The new peer is not added to the routing table of the node under
        test; it pings the peer that was last in ``self.nodes`` before the
        call.

        :return: the newly created node.
        """
        previous_last_node = self.nodes[len(self.nodes) - 1]
        await self.add_peer(node_id, address, False)
        last_node = self.nodes[len(self.nodes) - 1]
        peer = last_node.protocol.get_rpc_peer(
            make_kademlia_peer(
                previous_last_node.protocol.node_id, previous_last_node.protocol.external_ip,
                previous_last_node.protocol.udp_port
            )
        )
        await peer.ping()
        return last_node

    async def test_announce_blobs(self):
        """Announce 92 blobs in batches, then find one from a chained peer."""
        blob1 = binascii.hexlify(b'1' * 48).decode()
        blob2 = binascii.hexlify(b'2' * 48).decode()

        async with self._test_network_context(peer_count=100):
            await self.storage.add_blobs((blob1, 1024, 0, True), (blob2, 1024, 0, True), finished=True)
            await self.storage.add_blobs(
                *((constants.generate_id(value).hex(), 1024, 0, True) for value in range(1000, 1090)),
                finished=True)
            await self.storage.db.execute("update blob set next_announce_time=0, should_announce=1")
            to_announce = await self.storage.get_blobs_to_announce()
            self.assertEqual(92, len(to_announce))
            self.blob_announcer.start(batch_size=10)  # so it covers batching logic
            # the announcer takes 60 seconds to start: advance the accelerated
            # clock by that much, then wait until every batch was processed
            ongoing_announcements = asyncio.ensure_future(self.blob_announcer.wait())
            await self.instant_advance(60.0)
            await ongoing_announcements
            to_announce = await self.storage.get_blobs_to_announce()
            self.assertEqual(0, len(to_announce))
            self.blob_announcer.stop()

            # as routing table pollution will cause some peers to be hard to reach, we add a tolerance for CI
            tolerance = 0.8  # at least 80% of the announcements are within the top K
            for blob in await self.storage.get_all_blob_hashes():
                blob_bytes = bytes.fromhex(blob)
                distance = Distance(blob_bytes)
                # the K peers closest to the blob hash are the expected holders
                candidates = list(self.nodes.values())
                candidates.sort(key=lambda sorting_node: distance(sorting_node.protocol.node_id))
                has_it = 0
                for node in candidates[:constants.K]:
                    if node.protocol.data_store.get_peers_for_blob(blob_bytes):
                        has_it += 1
                    else:
                        logging.warning(
                            "blob %s wasnt found between the best K (%s)", blob[:8], node.protocol.node_id.hex()[:8]
                        )
                self.assertGreaterEqual(has_it, int(tolerance * constants.K))

            # test that we can route from a poorly connected peer all the way to the announced blob

            current = len(self.nodes)
            await self.chain_peer(constants.generate_id(current + 1), '1.2.3.10')
            await self.chain_peer(constants.generate_id(current + 2), '1.2.3.11')
            await self.chain_peer(constants.generate_id(current + 3), '1.2.3.12')
            await self.chain_peer(constants.generate_id(current + 4), '1.2.3.13')
            last = await self.chain_peer(constants.generate_id(current + 5), '1.2.3.14')

            # asyncio.Queue no longer accepts ``loop=`` (removed in Python 3.10);
            # the queues are created and used inside the running test loop
            search_q, peer_q = asyncio.Queue(), asyncio.Queue()
            search_q.put_nowait(blob1)

            _, task = last.accumulate_peers(search_q, peer_q)
            found_peers = await asyncio.wait_for(peer_q.get(), 1.0)
            task.cancel()

            # the only announcer of blob1 is the node under test
            self.assertEqual(1, len(found_peers))
            self.assertEqual(self.node.protocol.node_id, found_peers[0].node_id)
            self.assertEqual(self.node.protocol.external_ip, found_peers[0].address)
            self.assertEqual(self.node.protocol.peer_port, found_peers[0].tcp_port)

    async def test_popular_blob(self):
        """Store one blob from many peers on a single node and check paging.

        Every remaining peer stores the same blob hash on ``announced_to`` and
        then queries it back with ``find_value``, page by page.
        """
        peer_count = 150
        blob_hash = constants.generate_id(99999)

        async with self._test_network_context(peer_count=peer_count):
            total_seen = set()
            announced_to = self.nodes.pop(0)
            for i, node in enumerate(self.nodes.values()):
                self.add_peer_to_routing_table(announced_to, node)
                peer = node.protocol.get_rpc_peer(
                    make_kademlia_peer(
                        announced_to.protocol.node_id,
                        announced_to.protocol.external_ip,
                        announced_to.protocol.udp_port
                    )
                )
                response = await peer.store(blob_hash)
                self.assertEqual(response, b'OK')
                peers_for_blob = await peer.find_value(blob_hash, 0)
                if i == 0:
                    # first announcer: nobody else to report yet
                    self.assertNotIn(blob_hash, peers_for_blob)
                    self.assertEqual(peers_for_blob[b'p'], 0)
                else:
                    self.assertEqual(len(peers_for_blob[blob_hash]), min(i, constants.K))
                    self.assertEqual(len(announced_to.protocol.data_store.get_peers_for_blob(blob_hash)), i + 1)
                if i - 1 > constants.K:
                    self.assertEqual(len(peers_for_blob[b'contacts']), constants.K)
                    self.assertEqual(peers_for_blob[b'p'], (i // (constants.K + 1)) + 1)
                    seen = set(peers_for_blob[blob_hash])
                    self.assertEqual(len(seen), constants.K)
                    self.assertEqual(len(peers_for_blob[blob_hash]), len(seen))

                    for pg in range(1, peers_for_blob[b'p']):
                        page_x = await peer.find_value(blob_hash, pg)
                        self.assertNotIn(b'contacts', page_x)
                        page_x_set = set(page_x[blob_hash])
                        self.assertEqual(len(page_x[blob_hash]), len(page_x_set))
                        self.assertGreater(len(page_x_set), 0)
                        self.assertSetEqual(seen.intersection(page_x_set), set())
                        # accumulate this page so later pages are checked
                        # against everything returned so far
                        seen.update(page_x_set)
                        total_seen.update(page_x_set)
                else:
                    self.assertEqual(len(peers_for_blob[b'contacts']), 8)  # we always add 8 on first page
            self.assertEqual(len(total_seen), peer_count - 2)
|