lbry-sdk/lbry/db/database.py

320 lines
12 KiB
Python
Raw Normal View History

2020-05-01 09:29:44 -04:00
import os
2020-04-11 17:27:41 -04:00
import asyncio
2020-05-20 17:59:26 -04:00
import tempfile
2020-06-05 00:35:22 -04:00
import multiprocessing as mp
2020-06-21 19:51:09 -04:00
from typing import List, Optional, Iterable, Iterator, TypeVar, Generic, TYPE_CHECKING, Dict
2020-05-01 09:29:44 -04:00
from concurrent.futures import Executor, ThreadPoolExecutor, ProcessPoolExecutor
from functools import partial
2020-04-11 17:27:41 -04:00
2020-05-01 09:29:44 -04:00
from sqlalchemy import create_engine, text
2020-04-11 17:27:41 -04:00
2020-06-05 00:35:22 -04:00
from lbry.event import EventController
2020-05-01 09:29:44 -04:00
from lbry.crypto.bip32 import PubKey
from lbry.blockchain.transaction import Transaction, Output
2020-06-21 19:51:09 -04:00
from .constants import TXO_TYPES, CLAIM_TYPE_CODES
2020-06-05 00:35:22 -04:00
from .query_context import initialize, ProgressPublisher
2020-05-01 09:29:44 -04:00
from . import queries as q
2020-06-05 00:35:22 -04:00
from . import sync
2020-04-11 17:27:41 -04:00
if TYPE_CHECKING:
from lbry.blockchain.ledger import Ledger
2020-05-01 09:29:44 -04:00
def clean_wallet_account_ids(constraints):
wallet = constraints.pop('wallet', None)
account = constraints.pop('account', None)
2020-04-11 17:27:41 -04:00
accounts = constraints.pop('accounts', [])
2020-05-01 09:29:44 -04:00
if account and not accounts:
accounts = [account]
if wallet:
constraints['wallet_account_ids'] = [account.id for account in wallet.accounts]
if not accounts:
accounts = wallet.accounts
2020-04-11 17:27:41 -04:00
if accounts:
2020-05-01 09:29:44 -04:00
constraints['account_ids'] = [account.id for account in accounts]
2020-04-11 17:27:41 -04:00
async def add_channel_keys_to_txo_results(accounts: List, txos: Iterable[Output]):
2020-05-01 09:29:44 -04:00
sub_channels = set()
for txo in txos:
if txo.claim.is_channel:
for account in accounts:
private_key = await account.get_channel_private_key(
2020-05-01 09:29:44 -04:00
txo.claim.channel.public_key_bytes
)
if private_key:
txo.private_key = private_key
break
if txo.channel is not None:
sub_channels.add(txo.channel)
if sub_channels:
await add_channel_keys_to_txo_results(accounts, sub_channels)
2020-04-11 17:27:41 -04:00
2020-06-05 00:35:22 -04:00
ResultType = TypeVar('ResultType')
class Result(Generic[ResultType]):
__slots__ = 'rows', 'total', 'censor'
def __init__(self, rows: List[ResultType], total, censor=None):
self.rows = rows
self.total = total
self.censor = censor
def __getitem__(self, item: int) -> ResultType:
return self.rows[item]
def __iter__(self) -> Iterator[ResultType]:
return iter(self.rows)
def __len__(self):
return len(self.rows)
def __repr__(self):
return repr(self.rows)
2020-04-11 17:27:41 -04:00
class Database:
2020-06-05 00:35:22 -04:00
def __init__(self, ledger: 'Ledger', processes=-1):
self.url = ledger.conf.db_url_or_default
2020-05-01 09:29:44 -04:00
self.ledger = ledger
2020-06-05 00:35:22 -04:00
self.processes = self._normalize_processes(processes)
2020-05-01 09:29:44 -04:00
self.executor: Optional[Executor] = None
2020-06-05 00:35:22 -04:00
self.message_queue = mp.Queue()
self.stop_event = mp.Event()
self._on_progress_controller = EventController()
self.on_progress = self._on_progress_controller.stream
self.progress_publisher = ProgressPublisher(
self.message_queue, self._on_progress_controller
)
@staticmethod
def _normalize_processes(processes):
if processes == 0:
return os.cpu_count()
elif processes > 0:
return processes
return 1
2020-04-11 20:01:10 -04:00
2020-05-20 17:59:26 -04:00
@classmethod
2020-06-05 00:35:22 -04:00
def temp_sqlite_regtest(cls, lbrycrd_dir=None):
from lbry import Config, RegTestLedger # pylint: disable=import-outside-toplevel
2020-05-20 17:59:26 -04:00
directory = tempfile.mkdtemp()
conf = Config.with_same_dir(directory)
2020-06-05 00:35:22 -04:00
if lbrycrd_dir is not None:
conf.lbrycrd_dir = lbrycrd_dir
2020-05-20 17:59:26 -04:00
ledger = RegTestLedger(conf)
2020-06-05 00:35:22 -04:00
return cls(ledger)
2020-05-20 17:59:26 -04:00
2020-06-19 14:28:34 -04:00
@classmethod
def temp_sqlite(cls):
from lbry import Config, Ledger # pylint: disable=import-outside-toplevel
conf = Config.with_same_dir(tempfile.mkdtemp())
return cls(Ledger(conf))
@classmethod
2020-06-05 00:35:22 -04:00
def in_memory(cls):
from lbry import Config, Ledger # pylint: disable=import-outside-toplevel
conf = Config.with_same_dir('/dev/null')
conf.db_url = 'sqlite:///:memory:'
return cls(Ledger(conf))
2020-05-01 09:29:44 -04:00
def sync_create(self, name):
engine = create_engine(self.url)
db = engine.connect()
db.execute(text("COMMIT"))
db.execute(text(f"CREATE DATABASE {name}"))
2020-04-11 17:27:41 -04:00
2020-05-01 09:29:44 -04:00
async def create(self, name):
return await asyncio.get_event_loop().run_in_executor(None, self.sync_create, name)
2020-04-11 17:27:41 -04:00
2020-05-01 09:29:44 -04:00
def sync_drop(self, name):
engine = create_engine(self.url)
db = engine.connect()
db.execute(text("COMMIT"))
db.execute(text(f"DROP DATABASE IF EXISTS {name}"))
2020-04-11 17:27:41 -04:00
2020-05-01 09:29:44 -04:00
async def drop(self, name):
return await asyncio.get_event_loop().run_in_executor(None, self.sync_drop, name)
2020-04-11 17:27:41 -04:00
async def open(self):
2020-05-01 09:29:44 -04:00
assert self.executor is None, "Database already open."
2020-06-05 00:35:22 -04:00
self.progress_publisher.start()
kwargs = {
"initializer": initialize,
"initargs": (
self.ledger,
self.message_queue, self.stop_event
2020-05-01 09:29:44 -04:00
)
2020-06-05 00:35:22 -04:00
}
if self.processes > 1:
self.executor = ProcessPoolExecutor(max_workers=self.processes, **kwargs)
2020-05-01 09:29:44 -04:00
else:
2020-06-05 00:35:22 -04:00
self.executor = ThreadPoolExecutor(max_workers=1, **kwargs)
2020-05-01 09:29:44 -04:00
return await self.run_in_executor(q.check_version_and_create_tables)
2020-04-11 17:27:41 -04:00
async def close(self):
2020-06-05 00:35:22 -04:00
self.progress_publisher.stop()
2020-05-01 09:29:44 -04:00
if self.executor is not None:
self.executor.shutdown()
self.executor = None
async def run_in_executor(self, func, *args, **kwargs):
if kwargs:
clean_wallet_account_ids(kwargs)
return await asyncio.get_event_loop().run_in_executor(
self.executor, partial(func, *args, **kwargs)
2020-04-11 17:27:41 -04:00
)
2020-06-05 00:35:22 -04:00
async def fetch_result(self, func, *args, **kwargs) -> Result:
rows, total = await self.run_in_executor(func, *args, **kwargs)
return Result(rows, total)
2020-05-18 08:14:30 -04:00
async def execute(self, sql):
return await self.run_in_executor(q.execute, sql)
2020-05-01 09:29:44 -04:00
async def execute_fetchall(self, sql):
return await self.run_in_executor(q.execute_fetchall, sql)
2020-04-11 17:27:41 -04:00
2020-06-19 14:28:34 -04:00
async def process_inputs_outputs(self):
return await self.run_in_executor(sync.process_inputs_outputs)
2020-06-05 00:35:22 -04:00
2020-06-19 14:28:34 -04:00
async def process_all_things_after_sync(self):
return await self.run_in_executor(sync.process_all_things_after_sync)
2020-06-05 00:35:22 -04:00
2020-06-19 14:28:34 -04:00
async def needs_initial_sync(self) -> bool:
return (await self.get_best_tx_height()) == -1
2020-06-05 00:35:22 -04:00
2020-06-19 14:28:34 -04:00
async def get_best_tx_height(self) -> int:
return await self.run_in_executor(q.get_best_tx_height)
2020-04-11 17:27:41 -04:00
2020-06-19 14:28:34 -04:00
async def get_best_block_height_for_file(self, file_number) -> int:
return await self.run_in_executor(q.get_best_block_height_for_file, file_number)
2020-06-05 00:35:22 -04:00
2020-05-01 09:29:44 -04:00
async def get_blocks_without_filters(self):
return await self.run_in_executor(q.get_blocks_without_filters)
2020-04-11 17:27:41 -04:00
2020-05-01 09:29:44 -04:00
async def get_transactions_without_filters(self):
return await self.run_in_executor(q.get_transactions_without_filters)
2020-04-11 17:27:41 -04:00
2020-05-01 09:29:44 -04:00
async def get_block_tx_addresses(self, block_hash=None, tx_hash=None):
return await self.run_in_executor(q.get_block_tx_addresses, block_hash, tx_hash)
2020-04-11 17:27:41 -04:00
2020-05-01 09:29:44 -04:00
async def get_block_address_filters(self):
return await self.run_in_executor(q.get_block_address_filters)
2020-04-11 17:27:41 -04:00
2020-05-01 09:29:44 -04:00
async def get_transaction_address_filters(self, block_hash):
return await self.run_in_executor(q.get_transaction_address_filters, block_hash)
2020-04-11 17:27:41 -04:00
2020-06-19 14:28:34 -04:00
async def insert_block(self, block):
return await self.run_in_executor(q.insert_block, block)
2020-06-05 00:35:22 -04:00
async def insert_transaction(self, block_hash, tx):
return await self.run_in_executor(q.insert_transaction, block_hash, tx)
2020-04-11 17:27:41 -04:00
2020-05-01 09:29:44 -04:00
async def update_address_used_times(self, addresses):
return await self.run_in_executor(q.update_address_used_times, addresses)
2020-04-11 17:27:41 -04:00
async def reserve_outputs(self, txos, is_reserved=True):
txo_hashes = [txo.hash for txo in txos]
if txo_hashes:
2020-05-01 09:29:44 -04:00
return await self.run_in_executor(
q.reserve_outputs, txo_hashes, is_reserved
2020-04-11 17:27:41 -04:00
)
async def release_outputs(self, txos):
2020-05-01 09:29:44 -04:00
return await self.reserve_outputs(txos, is_reserved=False)
2020-04-11 17:27:41 -04:00
2020-05-01 09:29:44 -04:00
async def release_tx(self, tx):
return await self.release_outputs([txi.txo_ref.txo for txi in tx.inputs])
2020-04-11 17:27:41 -04:00
2020-05-01 09:29:44 -04:00
async def release_all_outputs(self, account):
return await self.run_in_executor(q.release_all_outputs, account.id)
2020-04-11 17:27:41 -04:00
2020-05-01 09:29:44 -04:00
async def get_balance(self, **constraints):
return await self.run_in_executor(q.get_balance, **constraints)
2020-04-11 17:27:41 -04:00
async def get_report(self, accounts):
return await self.run_in_executor(q.get_report, accounts=accounts)
2020-04-11 17:27:41 -04:00
2020-06-05 00:35:22 -04:00
async def get_addresses(self, **constraints) -> Result[dict]:
addresses = await self.fetch_result(q.get_addresses, **constraints)
2020-05-01 09:29:44 -04:00
if addresses and 'pubkey' in addresses[0]:
2020-04-11 17:27:41 -04:00
for address in addresses:
address['pubkey'] = PubKey(
self.ledger, bytes(address.pop('pubkey')), bytes(address.pop('chain_code')),
address.pop('n'), address.pop('depth')
)
2020-06-05 00:35:22 -04:00
return addresses
2020-04-11 17:27:41 -04:00
2020-05-01 09:29:44 -04:00
async def get_all_addresses(self):
return await self.run_in_executor(q.get_all_addresses)
2020-04-11 17:27:41 -04:00
async def get_address(self, **constraints):
2020-06-05 00:35:22 -04:00
for address in await self.get_addresses(limit=1, **constraints):
return address
2020-04-11 17:27:41 -04:00
async def add_keys(self, account, chain, pubkeys):
2020-05-01 09:29:44 -04:00
return await self.run_in_executor(q.add_keys, account, chain, pubkeys)
2020-04-11 17:27:41 -04:00
2020-06-05 00:35:22 -04:00
async def get_transactions(self, **constraints) -> Result[Transaction]:
return await self.fetch_result(q.get_transactions, **constraints)
2020-04-11 17:27:41 -04:00
2020-05-01 09:29:44 -04:00
async def get_transaction(self, **constraints) -> Optional[Transaction]:
2020-06-05 00:35:22 -04:00
txs = await self.get_transactions(limit=1, **constraints)
2020-05-01 09:29:44 -04:00
if txs:
return txs[0]
2020-04-11 17:27:41 -04:00
2020-06-05 00:35:22 -04:00
async def get_purchases(self, **constraints) -> Result[Output]:
return await self.fetch_result(q.get_purchases, **constraints)
2020-04-11 17:27:41 -04:00
2020-06-05 00:35:22 -04:00
async def search_claims(self, **constraints) -> Result[Output]:
2020-06-19 14:28:34 -04:00
#assert set(constraints).issubset(SEARCH_PARAMS), \
# f"Search query contains invalid arguments: {set(constraints).difference(SEARCH_PARAMS)}"
claims, total, censor = await self.run_in_executor(q.search_claims, **constraints)
2020-06-05 00:35:22 -04:00
return Result(claims, total, censor)
2020-04-11 17:27:41 -04:00
2020-06-21 19:51:09 -04:00
async def search_supports(self, **constraints) -> Result[Output]:
return await self.fetch_result(q.search_supports, **constraints)
async def resolve(self, *urls) -> Dict[str, Output]:
return await self.run_in_executor(q.resolve, *urls)
2020-06-05 00:35:22 -04:00
async def get_txo_sum(self, **constraints) -> int:
2020-05-01 09:29:44 -04:00
return await self.run_in_executor(q.get_txo_sum, **constraints)
2020-04-11 17:27:41 -04:00
2020-06-05 00:35:22 -04:00
async def get_txo_plot(self, **constraints) -> List[dict]:
2020-05-01 09:29:44 -04:00
return await self.run_in_executor(q.get_txo_plot, **constraints)
2020-04-11 17:27:41 -04:00
2020-06-05 00:35:22 -04:00
async def get_txos(self, **constraints) -> Result[Output]:
txos = await self.fetch_result(q.get_txos, **constraints)
2020-05-01 09:29:44 -04:00
if 'wallet' in constraints:
await add_channel_keys_to_txo_results(constraints['wallet'].accounts, txos)
2020-06-05 00:35:22 -04:00
return txos
2020-04-11 17:27:41 -04:00
2020-06-05 00:35:22 -04:00
async def get_utxos(self, **constraints) -> Result[Output]:
2020-05-01 09:29:44 -04:00
return await self.get_txos(is_spent=False, **constraints)
2020-04-11 17:27:41 -04:00
2020-06-05 00:35:22 -04:00
async def get_supports(self, **constraints) -> Result[Output]:
2020-05-01 09:29:44 -04:00
return await self.get_utxos(txo_type=TXO_TYPES['support'], **constraints)
2020-04-11 17:27:41 -04:00
2020-06-05 00:35:22 -04:00
async def get_claims(self, **constraints) -> Result[Output]:
2020-06-19 14:28:34 -04:00
if 'txo_type' not in constraints:
2020-06-21 19:51:09 -04:00
constraints['txo_type__in'] = CLAIM_TYPE_CODES
2020-06-19 14:28:34 -04:00
txos = await self.fetch_result(q.get_txos, **constraints)
2020-05-01 09:29:44 -04:00
if 'wallet' in constraints:
await add_channel_keys_to_txo_results(constraints['wallet'].accounts, txos)
2020-06-05 00:35:22 -04:00
return txos
2020-04-11 17:27:41 -04:00
2020-06-05 00:35:22 -04:00
async def get_streams(self, **constraints) -> Result[Output]:
2020-05-01 09:29:44 -04:00
return await self.get_claims(txo_type=TXO_TYPES['stream'], **constraints)
2020-04-11 17:27:41 -04:00
2020-06-05 00:35:22 -04:00
async def get_channels(self, **constraints) -> Result[Output]:
2020-05-01 09:29:44 -04:00
return await self.get_claims(txo_type=TXO_TYPES['channel'], **constraints)
2020-04-11 17:27:41 -04:00
2020-06-05 00:35:22 -04:00
async def get_collections(self, **constraints) -> Result[Output]:
2020-05-01 09:29:44 -04:00
return await self.get_claims(txo_type=TXO_TYPES['collection'], **constraints)