lbry-sdk/lbrynet/extras/daemon/storage.py

860 lines
39 KiB
Python
Raw Normal View History

import os
2018-02-12 13:36:35 -05:00
import logging
2019-01-22 15:43:01 -05:00
import sqlite3
import typing
2019-01-22 15:43:01 -05:00
import asyncio
import binascii
import time
2019-01-22 15:43:01 -05:00
from torba.client.basedatabase import SQLiteMixin
2019-01-21 15:55:50 -05:00
from lbrynet.conf import Config
2019-03-20 01:46:23 -04:00
from lbrynet.wallet.dewies import dewies_to_lbc, lbc_to_dewies
from lbrynet.wallet.transaction import Transaction
2019-03-20 01:46:23 -04:00
from lbrynet.schema.claim import Claim
2019-01-22 15:43:01 -05:00
from lbrynet.dht.constants import data_expiration
2019-01-22 17:44:25 -05:00
from lbrynet.blob.blob_info import BlobInfo
2019-01-22 15:43:01 -05:00
if typing.TYPE_CHECKING:
from lbrynet.blob.blob_file import BlobFile
from lbrynet.stream.descriptor import StreamDescriptor
2018-02-12 13:36:35 -05:00
# module-level logger, named after this module
log = logging.getLogger(__name__)
2019-01-22 15:43:01 -05:00
# shorthand annotations for nullable text / integer values
opt_str = typing.Optional[str]
opt_int = typing.Optional[int]
2018-02-12 13:36:35 -05:00
def calculate_effective_amount(amount: str, supports: typing.Optional[typing.List[typing.Dict]] = None) -> str:
    """
    Add the amounts of all supports to a claim amount.

    :param amount: the claim amount, in the format accepted by lbc_to_dewies
    :param supports: support dicts, each with an 'amount' key; None or an empty list means no supports
    :return: the summed amount, converted back with dewies_to_lbc
    """
    # `supports` defaults to None, which must be treated as "no supports" rather than iterated
    return dewies_to_lbc(
        lbc_to_dewies(amount) + sum(lbc_to_dewies(support['amount']) for support in supports or ())
    )
2019-01-22 15:43:01 -05:00
class StoredStreamClaim:
    """
    A claim as stored in the database, together with the hash of the stream it is attached to.

    The positional order of the constructor arguments after `stream_hash` follows the column order
    of the `claim` table, followed by the channel name, so that query rows can be splatted into it.
    """

    def __init__(self, stream_hash: str, outpoint: opt_str = None, claim_id: opt_str = None, name: opt_str = None,
                 amount: opt_int = None, height: opt_int = None, serialized: opt_str = None,
                 channel_claim_id: opt_str = None, address: opt_str = None, claim_sequence: opt_int = None,
                 channel_name: opt_str = None):
        self.stream_hash = stream_hash
        self.outpoint = outpoint
        self.claim_id = claim_id
        self.claim_name = name
        self.claim_address = address
        self.claim_sequence = claim_sequence
        self.amount = amount
        self.height = height
        self.channel_claim_id = channel_claim_id
        self.channel_name = channel_name
        # the metadata is stored hex encoded; it is only parsed when there is something to parse
        self.claim: typing.Optional[Claim] = None
        if serialized:
            self.claim = Claim.from_bytes(binascii.unhexlify(serialized))

    @property
    def txid(self) -> typing.Optional[str]:
        """
        The part of the outpoint before the first ':', or None when there is no outpoint
        """
        if not self.outpoint:
            return None
        return self.outpoint.split(":")[0]

    @property
    def nout(self) -> typing.Optional[int]:
        """
        The part of the outpoint after the first ':' as an integer, or None when there is no outpoint
        """
        if not self.outpoint:
            return None
        return int(self.outpoint.split(":")[1])

    def as_dict(self) -> typing.Dict:
        """
        Return the claim as a dictionary, with the amount converted by dewies_to_lbc
        """
        fields = (
            ("name", self.claim_name),
            ("claim_id", self.claim_id),
            ("address", self.claim_address),
            ("claim_sequence", self.claim_sequence),
            ("value", self.claim),
            ("height", self.height),
            ("amount", dewies_to_lbc(self.amount)),
            ("nout", self.nout),
            ("txid", self.txid),
            ("channel_claim_id", self.channel_claim_id),
            ("channel_name", self.channel_name),
        )
        return dict(fields)
def get_claims_from_stream_hashes(transaction: sqlite3.Connection,
                                  stream_hashes: typing.List[str]) -> typing.Dict[str, StoredStreamClaim]:
    """
    Load the claims associated to the given stream hashes.

    :param transaction: sqlite connection to run the queries on
    :param stream_hashes: stream hashes to look up, queried in batches
    :return: a dictionary of stream hash -> StoredStreamClaim, streams without a content claim are absent
    """
    query = (
        "select content_claim.stream_hash, c.*, case when c.channel_claim_id is not null then "
        "   (select claim_name from claim where claim_id==c.channel_claim_id) "
        "   else null end as channel_name "
        " from content_claim "
        " inner join claim c on c.claim_outpoint=content_claim.claim_outpoint and content_claim.stream_hash in {}"
        " order by c.rowid desc"
    )
    stored_claims = [
        StoredStreamClaim(*row) if row else None
        for row in _batched_select(transaction, query, stream_hashes)
    ]
    claims_by_stream_hash = {}
    for stored_claim in stored_claims:
        claims_by_stream_hash[stored_claim.stream_hash] = stored_claim
    return claims_by_stream_hash
2018-02-12 13:36:35 -05:00
2019-01-22 15:43:01 -05:00
def get_content_claim_from_outpoint(transaction: sqlite3.Connection,
                                    outpoint: str) -> typing.Optional[StoredStreamClaim]:
    """
    Load the content claim stored for a claim outpoint.

    :param transaction: sqlite connection to run the query on
    :param outpoint: claim outpoint to look up
    :return: the StoredStreamClaim for the first matching row, or None if no row matches
    """
    query = (
        "select content_claim.stream_hash, c.*, case when c.channel_claim_id is not null then "
        "   (select claim_name from claim where claim_id==c.channel_claim_id) "
        "   else null end as channel_name "
        " from content_claim "
        " inner join claim c on c.claim_outpoint=content_claim.claim_outpoint and content_claim.claim_outpoint=?"
    )
    row = transaction.execute(query, (outpoint, )).fetchone()
    if not row:
        return None
    return StoredStreamClaim(*row)
2018-02-12 13:36:35 -05:00
2019-02-08 19:51:13 -05:00
def _batched_select(transaction, query, parameters, batch_size=900):
for start_index in range(0, len(parameters), batch_size):
current_batch = parameters[start_index:start_index+batch_size]
2019-01-22 15:43:01 -05:00
bind = "({})".format(','.join(['?'] * len(current_batch)))
for result in transaction.execute(query.format(bind), current_batch):
yield result
2018-02-12 13:36:35 -05:00
def get_all_lbry_files(transaction: sqlite3.Connection) -> typing.List[typing.Dict]:
    """
    Load every file that has a stream and a content claim, along with that claim.

    :param transaction: sqlite connection to run the queries on
    :return: a list of dictionaries, one per file row, each holding a StoredStreamClaim under "claim"
    """
    file_query = (
        "select file.rowid, file.*, stream.*, c.* "
        "from file inner join stream on file.stream_hash=stream.stream_hash "
        "inner join content_claim cc on file.stream_hash=cc.stream_hash "
        "inner join claim c on cc.claim_outpoint=c.claim_outpoint "
        "where file.stream_hash in {} "
        "order by c.rowid desc"
    )
    known_stream_hashes = [row[0] for row in transaction.execute("select stream_hash from file")]

    files = []
    claims_by_channel = {}
    for row in _batched_select(transaction, file_query, known_stream_hashes):
        # the ignored column is the stream table's own copy of the stream hash
        (rowid, stream_hash, file_name, download_dir, data_rate, status, saved_file, raw_content_fee,
         _, sd_hash, stream_key, stream_name, suggested_file_name, *claim_args) = row
        claim = StoredStreamClaim(stream_hash, *claim_args)
        if claim.channel_claim_id:
            claims_by_channel.setdefault(claim.channel_claim_id, []).append(claim)
        content_fee = None
        if raw_content_fee:
            content_fee = Transaction(binascii.unhexlify(raw_content_fee))
        files.append(
            {
                "rowid": rowid,
                "stream_hash": stream_hash,
                "file_name": file_name,  # hex
                "download_directory": download_dir,  # hex
                "blob_data_rate": data_rate,
                "status": status,
                "sd_hash": sd_hash,
                "key": stream_key,
                "stream_name": stream_name,  # hex
                "suggested_file_name": suggested_file_name,  # hex
                "claim": claim,
                "saved_file": bool(saved_file),
                "content_fee": content_fee
            }
        )

    # fill in the channel names with one batched lookup rather than a query per claim
    channel_query = "select c.claim_name, c.claim_id from claim c where c.claim_id in {}"
    for channel_name, channel_claim_id in _batched_select(transaction, channel_query, list(claims_by_channel)):
        for signed_claim in claims_by_channel[channel_claim_id]:
            signed_claim.channel_name = channel_name
    return files
def store_stream(transaction: sqlite3.Connection, sd_blob: 'BlobFile', descriptor: 'StreamDescriptor'):
    """
    Insert a stream, its blobs and the blob positions, leaving rows that already exist untouched.

    :param transaction: sqlite connection to run the statements on
    :param sd_blob: the stream descriptor blob, its blob_hash and length are read
    :param descriptor: the stream descriptor, its blobs, stream_hash, key, stream_name and
        suggested_file_name are read
    """
    stream_blobs = descriptor.blobs
    # add all blobs, except the last one, which is empty (a single-blob list is kept whole)
    content_blobs = stream_blobs[:-1] if len(stream_blobs) > 1 else stream_blobs
    blob_rows = [
        (blob.blob_hash, blob.length, 0, 0, "pending", 0, 0)
        for blob in content_blobs + [sd_blob]
    ]
    transaction.executemany("insert or ignore into blob values (?, ?, ?, ?, ?, ?, ?)", blob_rows)

    # add the stream, the names are stored hex encoded
    encoded_stream_name = binascii.hexlify(descriptor.stream_name.encode()).decode()
    encoded_suggested_name = binascii.hexlify(descriptor.suggested_file_name.encode()).decode()
    transaction.execute(
        "insert or ignore into stream values (?, ?, ?, ?, ?)",
        (descriptor.stream_hash, sd_blob.blob_hash, descriptor.key, encoded_stream_name, encoded_suggested_name)
    )

    # associate the blobs to the stream
    position_rows = [
        (descriptor.stream_hash, blob.blob_hash, blob.blob_num, blob.iv)
        for blob in descriptor.blobs
    ]
    transaction.executemany("insert or ignore into stream_blob values (?, ?, ?, ?)", position_rows)

    # ensure should_announce is set regardless if insert was ignored
    transaction.execute(
        "update blob set should_announce=1 where blob_hash in (?, ?)",
        (sd_blob.blob_hash, descriptor.blobs[0].blob_hash,)
    )
2019-02-14 12:33:48 -05:00
def delete_stream(transaction: sqlite3.Connection, descriptor: 'StreamDescriptor'):
    """
    Delete a stream along with its content claim association, file, blob positions and blobs.

    :param transaction: sqlite connection to run the statements on
    :param descriptor: the stream descriptor, its stream_hash, sd_hash and blobs are read
    """
    # every blob but the last one in the descriptor, plus the sd blob
    blob_params = [(blob.blob_hash, ) for blob in descriptor.blobs[:-1]] + [(descriptor.sd_hash, )]
    stream_param = (descriptor.stream_hash,)
    per_stream_deletes = (
        "delete from content_claim where stream_hash=? ",
        "delete from file where stream_hash=? ",
        "delete from stream_blob where stream_hash=?",
        "delete from stream where stream_hash=? ",
    )
    for statement in per_stream_deletes:
        transaction.execute(statement, stream_param)
    transaction.executemany("delete from blob where blob_hash=?", blob_params)
2019-02-14 12:33:48 -05:00
def store_file(transaction: sqlite3.Connection, stream_hash: str, file_name: typing.Optional[str],
               download_directory: typing.Optional[str], data_payment_rate: float, status: str,
               content_fee: typing.Optional['Transaction']) -> int:
    """
    Insert or replace the file row of a stream.

    :param transaction: sqlite connection to run the statements on
    :param stream_hash: hash of the stream the file belongs to
    :param file_name: name of the file on disk, or None
    :param download_directory: directory holding the file, or None
    :param data_payment_rate: value stored in the blob_data_rate column
    :param status: value stored in the status column
    :param content_fee: transaction whose raw bytes are stored hex encoded, or None
    :return: the rowid of the stored file row
    """
    # a path needs both parts; if either is missing store neither instead of failing on None.encode(),
    # the same rule change_file_download_dir_and_file_name applies
    if not file_name or not download_directory:
        encoded_file_name, encoded_download_dir = None, None
        saved_file = 0
    else:
        encoded_file_name = binascii.hexlify(file_name.encode()).decode()
        encoded_download_dir = binascii.hexlify(download_directory.encode()).decode()
        saved_file = 1 if os.path.isfile(os.path.join(download_directory, file_name)) else 0
    encoded_content_fee = None if not content_fee else binascii.hexlify(content_fee.raw).decode()
    transaction.execute(
        "insert or replace into file values (?, ?, ?, ?, ?, ?, ?)",
        (stream_hash, encoded_file_name, encoded_download_dir, data_payment_rate, status, saved_file,
         encoded_content_fee)
    )
    return transaction.execute("select rowid from file where stream_hash=?", (stream_hash, )).fetchone()[0]
2018-12-15 15:31:02 -05:00
class SQLiteStorage(SQLiteMixin):
2018-02-12 13:36:35 -05:00
# schema script: every statement is idempotent ("if not exists"), so it can be run against an existing database
CREATE_TABLES_QUERY = """
    pragma foreign_keys=on;
    pragma journal_mode=WAL;

    create table if not exists blob (
        blob_hash char(96) primary key not null,
        blob_length integer not null,
        next_announce_time integer not null,
        should_announce integer not null default 0,
        status text not null,
        last_announced_time integer,
        single_announce integer
    );

    create table if not exists stream (
        stream_hash char(96) not null primary key,
        sd_hash char(96) not null references blob,
        stream_key text not null,
        stream_name text not null,
        suggested_filename text not null
    );

    create table if not exists stream_blob (
        stream_hash char(96) not null references stream,
        blob_hash char(96) references blob,
        position integer not null,
        iv char(32) not null,
        primary key (stream_hash, blob_hash)
    );

    create table if not exists claim (
        claim_outpoint text not null primary key,
        claim_id char(40) not null,
        claim_name text not null,
        amount integer not null,
        height integer not null,
        serialized_metadata blob not null,
        channel_claim_id text,
        address text not null,
        claim_sequence integer not null
    );

    create table if not exists file (
        stream_hash text primary key not null references stream,
        file_name text,
        download_directory text,
        blob_data_rate real not null,
        status text not null,
        saved_file integer not null,
        content_fee text
    );

    create table if not exists content_claim (
        stream_hash text unique not null references file,
        claim_outpoint text not null references claim,
        primary key (stream_hash, claim_outpoint)
    );

    create table if not exists support (
        support_outpoint text not null primary key,
        claim_id text not null,
        amount integer not null,
        address text not null
    );

    create table if not exists reflected_stream (
        sd_hash text not null,
        reflector_address text not null,
        timestamp integer,
        primary key (sd_hash, reflector_address)
    );
"""
2018-02-12 13:36:35 -05:00
def __init__(self, conf: Config, path, loop=None, time_getter: typing.Optional[typing.Callable[[], float]] = None):
    """
    :param conf: configuration object, kept as self.conf
    :param path: passed on to the parent class initializer
    :param loop: event loop to keep, asyncio.get_event_loop() is used when none is given
    :param time_getter: callable returning the current time, time.time is used when none is given
    """
    super().__init__(path)
    self.conf = conf
    # stream hash -> callable, called and awaited after the content claim of that stream is saved
    self.content_claim_callbacks = {}
    self.loop = loop if loop else asyncio.get_event_loop()
    self.time_getter = time_getter if time_getter else time.time
2018-12-15 15:31:02 -05:00
async def run_and_return_one_or_none(self, query, *args):
    """
    Run a query and return its first row, unwrapping the row when it has a single column.

    :return: the single value or the row tuple of the first row, None when the query returns no rows
    """
    fetched = await self.db.execute_fetchall(query, args)
    for first_row in fetched:
        # only the first row is ever looked at
        return first_row[0] if len(first_row) == 1 else first_row
    return None
async def run_and_return_list(self, query, *args):
    """
    Run a query and return the first column of every row as a list (empty when there are no rows).
    """
    fetched = await self.db.execute_fetchall(query, args)
    return [row[0] for row in fetched]
2018-02-12 13:36:35 -05:00
# # # # # # # # # blob functions # # # # # # # # #
async def add_blobs(self, *blob_hashes_and_lengths: typing.Tuple[str, int], finished=False):
    """
    Add blobs to the blob table, optionally marking them (and already known ones) as finished.

    :param blob_hashes_and_lengths: (blob hash, length) pairs
    :param finished: store the blobs with status 'finished' instead of 'pending'
    """
    initial_status = "finished" if finished else "pending"

    def _add_blobs(transaction: sqlite3.Connection):
        new_rows = [
            (blob_hash, length, 0, 0, initial_status, 0, 0)
            for blob_hash, length in blob_hashes_and_lengths
        ]
        transaction.executemany("insert or ignore into blob values (?, ?, ?, ?, ?, ?, ?)", new_rows)
        if not finished:
            return
        # rows that already existed were skipped by the insert, so their status is set explicitly
        known_hashes = [(blob_hash, ) for blob_hash, _ in blob_hashes_and_lengths]
        transaction.executemany("update blob set status='finished' where blob.blob_hash=?", known_hashes)

    return await self.db.run(_add_blobs)
2018-02-12 13:36:35 -05:00
2019-01-22 15:43:01 -05:00
def get_blob_status(self, blob_hash: str):
    """
    Look up the status column of a blob, the lookup gives None when the blob is unknown
    """
    status_query = "select status from blob where blob_hash=?"
    return self.run_and_return_one_or_none(status_query, blob_hash)
2019-01-22 15:43:01 -05:00
def should_announce(self, blob_hash: str):
    """
    Look up the should_announce column of a blob, the lookup gives None when the blob is unknown
    """
    announce_query = "select should_announce from blob where blob_hash=?"
    return self.run_and_return_one_or_none(announce_query, blob_hash)
def count_should_announce_blobs(self):
    """
    Count the finished blobs that are flagged with should_announce
    """
    count_query = "select count(*) from blob where should_announce=1 and status='finished'"
    return self.run_and_return_one_or_none(count_query)
def get_all_should_announce_blobs(self):
    """
    List the hashes of the finished blobs that are flagged with should_announce
    """
    hashes_query = "select blob_hash from blob where should_announce=1 and status='finished'"
    return self.run_and_return_list(hashes_query)
2019-01-22 15:43:01 -05:00
def get_all_finished_blobs(self):
    """
    List the hashes of all blobs with status 'finished'
    """
    hashes_query = "select blob_hash from blob where status='finished'"
    return self.run_and_return_list(hashes_query)
2018-08-02 17:33:56 -04:00
def count_finished_blobs(self):
    """
    Count the blobs with status 'finished'
    """
    count_query = "select count(*) from blob where status='finished'"
    return self.run_and_return_one_or_none(count_query)
def update_last_announced_blobs(self, blob_hashes: typing.List[str]):
    """
    Record that the given blobs were just announced and schedule their next announcement.

    The next announce time is set half of `data_expiration` after the current time, and the
    single_announce flag is cleared.
    """
    def _update_last_announced_blobs(transaction: sqlite3.Connection):
        announced_at = self.time_getter()
        updates = [
            (int(announced_at + (data_expiration / 2)), int(announced_at), blob_hash)
            for blob_hash in blob_hashes
        ]
        statement = (
            "update blob set next_announce_time=?, last_announced_time=?, single_announce=0 "
            "where blob_hash=?"
        )
        return transaction.executemany(statement, updates)

    return self.db.run(_update_last_announced_blobs)
def should_single_announce_blobs(self, blob_hashes, immediate=False):
    """
    Flag finished blobs for a single announcement.

    :param blob_hashes: hashes of the blobs to flag, blobs that are not finished are left untouched
    :param immediate: also set the next announce time of the blobs to the current time
    """
    def set_single_announce(transaction):
        now = int(self.time_getter())
        if immediate:
            statement = (
                "update blob set single_announce=1, next_announce_time=? "
                "where blob_hash=? and status='finished'"
            )
        else:
            statement = "update blob set single_announce=1 where blob_hash=? and status='finished'"
        for blob_hash in blob_hashes:
            bound = (now, blob_hash) if immediate else (blob_hash,)
            transaction.execute(statement, bound)

    return self.db.run(set_single_announce)
def get_blobs_to_announce(self):
    """
    List the hashes of finished blobs whose next announce time has passed, oldest first.

    When `conf.announce_head_and_sd_only` is set only blobs flagged with should_announce or
    single_announce are considered. At most ten times `conf.concurrent_blob_announcers` hashes
    are returned.
    """
    def get_and_update(transaction):
        timestamp = int(self.time_getter())
        if self.conf.announce_head_and_sd_only:
            query = (
                "select blob_hash from blob "
                "where blob_hash is not null and "
                "(should_announce=1 or single_announce=1) and next_announce_time<? and status='finished' "
                "order by next_announce_time asc limit ?"
            )
        else:
            query = (
                "select blob_hash from blob where blob_hash is not null "
                "and next_announce_time<? and status='finished' "
                "order by next_announce_time asc limit ?"
            )
        limit = int(self.conf.concurrent_blob_announcers * 10)
        due_rows = transaction.execute(query, (timestamp, limit)).fetchall()
        return [row[0] for row in due_rows]

    return self.db.run(get_and_update)
2018-02-12 13:36:35 -05:00
def delete_blobs_from_db(self, blob_hashes):
    """
    Delete the rows of the given blob hashes from the blob table, with foreign keys disabled
    """
    def delete_blobs(transaction):
        doomed = [(blob_hash,) for blob_hash in blob_hashes]
        transaction.executemany("delete from blob where blob_hash=?;", doomed)

    return self.db.run_with_foreign_keys_disabled(delete_blobs)
2018-02-12 13:36:35 -05:00
def get_all_blob_hashes(self):
    """
    List the hash of every row in the blob table
    """
    hashes_query = "select blob_hash from blob"
    return self.run_and_return_list(hashes_query)
def sync_missing_blobs(self, blob_files: typing.Set[str]) -> typing.Awaitable[typing.Set[str]]:
    """
    Reconcile the blob table with the set of blob hashes given by the caller.

    Blobs stored as finished that are not in `blob_files` are set back to 'pending'.

    :param blob_files: blob hashes to reconcile against
    :return: the hashes from `blob_files` that are stored with status 'finished'
    """
    def _sync_blobs(transaction: sqlite3.Connection) -> typing.Set[str]:
        finished_rows = transaction.execute("select blob_hash from blob where status='finished'")
        missing = [(blob_hash, ) for (blob_hash, ) in finished_rows if blob_hash not in blob_files]
        transaction.executemany("update blob set status='pending' where blob_hash=?", missing)

        still_finished = set()
        verified_rows = _batched_select(
            transaction, "select blob_hash from blob where status='finished' and blob_hash in {}",
            list(blob_files)
        )
        for (blob_hash, ) in verified_rows:
            still_finished.add(blob_hash)
        return still_finished

    return self.db.run(_sync_blobs)
2019-03-31 13:42:27 -04:00
def sync_files_to_blobs(self):
    """
    Set the status of every file whose stream has at least one pending blob to 'stopped'
    """
    def _sync_blobs(transaction: sqlite3.Connection):
        incomplete_streams = transaction.execute(
            "select distinct sb.stream_hash from stream_blob sb "
            "inner join blob b on b.blob_hash=sb.blob_hash and b.status=='pending'"
        ).fetchall()
        # the fetched rows are already 1-tuples, usable as bind parameters as they are
        transaction.executemany("update file set status='stopped' where stream_hash=?", incomplete_streams)

    return self.db.run(_sync_blobs)
def set_files_as_streaming(self, stream_hashes: typing.List[str]):
    """
    Clear the file name and download directory of the files of the given streams
    """
    def _set_streaming(transaction: sqlite3.Connection):
        targets = [(stream_hash, ) for stream_hash in stream_hashes]
        transaction.executemany(
            "update file set file_name=null, download_directory=null where stream_hash=?", targets
        )

    return self.db.run(_set_streaming)
2019-01-22 15:43:01 -05:00
# # # # # # # # # stream functions # # # # # # # # #
2018-03-08 16:46:39 -05:00
2019-01-22 15:43:01 -05:00
async def stream_exists(self, sd_hash: str) -> bool:
    """
    Check whether a stream with the given sd hash is stored
    """
    found = await self.run_and_return_one_or_none("select stream_hash from stream where sd_hash=?", sd_hash)
    if found is None:
        return False
    return True
2018-03-08 16:46:39 -05:00
2019-01-22 15:43:01 -05:00
async def file_exists(self, sd_hash: str) -> bool:
    """
    Check whether a file is stored for the stream with the given sd hash
    """
    query = (
        "select f.stream_hash from file f "
        "inner join stream s on "
        "s.stream_hash=f.stream_hash and s.sd_hash=?"
    )
    found = await self.run_and_return_one_or_none(query, sd_hash)
    if found is None:
        return False
    return True
2018-02-12 13:36:35 -05:00
2019-02-15 16:44:31 -05:00
def rowid_for_stream(self, stream_hash: str) -> typing.Awaitable[typing.Optional[int]]:
    """
    Look up the rowid of the file row of a stream, the lookup gives None when there is no such file
    """
    rowid_query = "select rowid from file where stream_hash=?"
    return self.run_and_return_one_or_none(rowid_query, stream_hash)
2019-01-22 15:43:01 -05:00
def store_stream(self, sd_blob: 'BlobFile', descriptor: 'StreamDescriptor'):
    """
    Run the module level store_stream function on the database with the given sd blob and descriptor
    """
    run_on_database = self.db.run
    return run_on_database(store_stream, sd_blob, descriptor)
2018-02-12 13:36:35 -05:00
2019-02-14 18:16:16 -05:00
def get_blobs_for_stream(self, stream_hash, only_completed=False) -> typing.Awaitable[typing.List[BlobInfo]]:
    """
    Load the blob infos of a stream, ordered by position.

    :param stream_hash: hash of the stream
    :param only_completed: only look up the lengths of finished blobs, other blobs get a length of 0
    :return: BlobInfo objects up to and including the first blob without a hash
    """
    def _get_blobs_for_stream(transaction):
        stream_blobs = transaction.execute(
            "select blob_hash, position, iv from stream_blob where stream_hash=? "
            "order by position asc", (stream_hash, )
        ).fetchall()
        if only_completed:
            length_query = (
                "select b.blob_hash, b.blob_length from blob b "
                "inner join stream_blob s ON b.blob_hash=s.blob_hash and b.status='finished' and s.stream_hash=?"
            )
        else:
            length_query = (
                "select b.blob_hash, b.blob_length from blob b "
                "inner join stream_blob s ON b.blob_hash=s.blob_hash and s.stream_hash=?"
            )
        length_by_hash = dict(transaction.execute(length_query, (stream_hash, )).fetchall())

        blob_infos = []
        for blob_hash, position, iv in stream_blobs:
            blob_infos.append(BlobInfo(position, length_by_hash.get(blob_hash, 0), iv, blob_hash))
            # a blob without a hash ends the list, it is still included
            if not blob_hash:
                break
        return blob_infos

    return self.db.run(_get_blobs_for_stream)
def get_sd_blob_hash_for_stream(self, stream_hash):
    """
    Look up the sd hash of a stream, the lookup gives None when the stream is unknown
    """
    sd_hash_query = "select sd_hash from stream where stream_hash=?"
    return self.run_and_return_one_or_none(sd_hash_query, stream_hash)
def get_stream_hash_for_sd_hash(self, sd_blob_hash):
    """
    Look up the stream hash for an sd hash, the lookup gives None when no stream has that sd hash
    """
    stream_hash_query = "select stream_hash from stream where sd_hash = ?"
    return self.run_and_return_one_or_none(stream_hash_query, sd_blob_hash)
def get_stream_info_for_sd_hash(self, sd_blob_hash):
    """
    Look up the (stream_hash, stream_name, suggested_filename, stream_key) row for an sd hash
    """
    info_query = "select stream_hash, stream_name, suggested_filename, stream_key from stream where sd_hash = ?"
    return self.run_and_return_one_or_none(info_query, sd_blob_hash)
2019-01-22 15:43:01 -05:00
def delete_stream(self, descriptor: 'StreamDescriptor'):
    """
    Run the module level delete_stream function on the database, with foreign keys disabled
    """
    run_without_foreign_keys = self.db.run_with_foreign_keys_disabled
    return run_without_foreign_keys(delete_stream, descriptor)
2018-02-12 13:36:35 -05:00
# # # # # # # # # file stuff # # # # # # # # #
def save_downloaded_file(self, stream_hash: str, file_name: typing.Optional[str],
                         download_directory: typing.Optional[str], data_payment_rate: float,
                         content_fee: typing.Optional[Transaction] = None) -> typing.Awaitable[int]:
    """
    Store a file row with status "running", see save_published_file for the arguments
    """
    running_status = "running"
    return self.save_published_file(
        stream_hash, file_name, download_directory, data_payment_rate,
        status=running_status, content_fee=content_fee
    )
def save_published_file(self, stream_hash: str, file_name: typing.Optional[str],
                        download_directory: typing.Optional[str], data_payment_rate: float,
                        status: str = "finished",
                        content_fee: typing.Optional[Transaction] = None) -> typing.Awaitable[int]:
    """
    Store a file row by running the module level store_file function on the database.

    :return: awaitable for the result of store_file
    """
    store_file_args = (stream_hash, file_name, download_directory, data_payment_rate, status, content_fee)
    return self.db.run(store_file, *store_file_args)
async def update_manually_removed_files_since_last_run(self):
    """
    Update files that have been removed from the downloads directory since the last run
    """
    def _still_on_disk(encoded_directory, encoded_file_name) -> bool:
        # both parts are stored hex encoded, a row lacking either cannot point at a file
        if not (encoded_directory and encoded_file_name):
            return False
        directory = binascii.unhexlify(encoded_directory).decode()
        name = binascii.unhexlify(encoded_file_name).decode()
        return os.path.isfile(os.path.join(directory, name))

    def update_manually_removed_files(transaction: sqlite3.Connection):
        saved_rows = transaction.execute(
            "select stream_hash, download_directory, file_name from file where saved_file=1"
        ).fetchall()
        removed = [
            (stream_hash,)
            for (stream_hash, download_directory, file_name) in saved_rows
            if not _still_on_disk(download_directory, file_name)
        ]
        if removed:
            transaction.executemany(
                "update file set file_name=null, download_directory=null, saved_file=0 where stream_hash=?",
                removed
            )

    return await self.db.run(update_manually_removed_files)
2018-02-12 13:36:35 -05:00
2019-02-08 19:51:13 -05:00
def get_all_lbry_files(self) -> typing.Awaitable[typing.List[typing.Dict]]:
    """
    Run the module level get_all_lbry_files function on the database
    """
    run_on_database = self.db.run
    return run_on_database(get_all_lbry_files)
2018-02-12 13:36:35 -05:00
2019-01-22 15:43:01 -05:00
def change_file_status(self, stream_hash: str, new_status: str):
    """
    Set the status column of the file of a stream
    """
    log.debug("update file status %s -> %s", stream_hash, new_status)
    statement = "update file set status=? where stream_hash=?"
    return self.db.execute(statement, (new_status, stream_hash))
2018-02-12 13:36:35 -05:00
async def change_file_download_dir_and_file_name(self, stream_hash: str, download_dir: typing.Optional[str],
                                                 file_name: typing.Optional[str]):
    """
    Set the download directory and file name of the file of a stream.

    Both values are stored hex encoded. If either of them is missing, both columns are set to null.
    """
    encoded_download_dir = encoded_file_name = None
    if file_name and download_dir:
        encoded_file_name = binascii.hexlify(file_name.encode()).decode()
        encoded_download_dir = binascii.hexlify(download_dir.encode()).decode()
    bound = (encoded_download_dir, encoded_file_name, stream_hash,)
    return await self.db.execute("update file set download_directory=?, file_name=? where stream_hash=?", bound)
async def save_content_fee(self, stream_hash: str, content_fee: 'Transaction'):
    """
    Store the content fee transaction of the file of a stream.

    :param stream_hash: hash of the stream whose file row is updated
    :param content_fee: transaction whose raw bytes are stored hex encoded
    """
    # decode the hex digest so the text column gets a str, the same way store_file writes it
    encoded_content_fee = binascii.hexlify(content_fee.raw).decode()
    return await self.db.execute("update file set content_fee=? where stream_hash=?", (
        encoded_content_fee, stream_hash,
    ))
async def set_saved_file(self, stream_hash: str):
    """
    Set the saved_file flag of the file of a stream
    """
    statement = "update file set saved_file=1 where stream_hash=?"
    return await self.db.execute(statement, (stream_hash,))
async def clear_saved_file(self, stream_hash: str):
    """
    Clear the saved_file flag of the file of a stream
    """
    statement = "update file set saved_file=0 where stream_hash=?"
    return await self.db.execute(statement, (stream_hash,))
async def recover_streams(self, descriptors_and_sds: typing.List[typing.Tuple['StreamDescriptor', 'BlobFile',
                                                                              typing.Optional[Transaction]]],
                          download_directory: str):
    """
    Re-create the stream, blob and file rows of the given streams, keeping their content claim association.

    :param descriptors_and_sds: (stream descriptor, sd blob, content fee or None) tuples
    :param download_directory: directory handed to store_file; note that the download_directory column
        of every recovered file is afterwards overwritten with the hex encoded `conf.download_dir`
    """
    def _recover(transaction: sqlite3.Connection):
        recovered_hashes = [entry[0].stream_hash for entry in descriptors_and_sds]
        for descriptor, sd_blob, content_fee in descriptors_and_sds:
            # remember the association before deleting, so it can be put back afterwards
            content_claim = transaction.execute(
                "select * from content_claim where stream_hash=?", (descriptor.stream_hash, )
            ).fetchone()
            delete_stream(transaction, descriptor)  # this will also delete the content claim
            store_stream(transaction, sd_blob, descriptor)
            recovered_file_name = os.path.basename(descriptor.suggested_file_name)
            store_file(transaction, descriptor.stream_hash, recovered_file_name,
                       download_directory, 0.0, 'stopped', content_fee=content_fee)
            if content_claim:
                transaction.execute("insert or ignore into content_claim values (?, ?)", content_claim)

        transaction.executemany(
            "update file set status='stopped' where stream_hash=?",
            [(stream_hash, ) for stream_hash in recovered_hashes]
        )
        encoded_conf_dir = binascii.hexlify(self.conf.download_dir.encode()).decode()
        transaction.executemany(
            "update file set download_directory=? where stream_hash=?",
            [(encoded_conf_dir, stream_hash) for stream_hash in recovered_hashes]
        )

    await self.db.run_with_foreign_keys_disabled(_recover)
2019-01-22 15:43:01 -05:00
def get_all_stream_hashes(self):
    """
    List the hash of every row in the stream table
    """
    hashes_query = "select stream_hash from stream"
    return self.run_and_return_list(hashes_query)
2018-02-12 13:36:35 -05:00
# # # # # # # # # support functions # # # # # # # # #
2019-04-19 20:42:35 -03:00
def save_supports(self, claim_id_to_supports: dict):
    """
    Replace the stored supports of the given claims.

    :param claim_id_to_supports: claim id -> list of support dicts with 'txid', 'nout', 'amount' and
        optionally 'address' keys; all stored supports of each claim id are deleted before the given
        ones are inserted, so an empty list clears the supports of that claim
    """
    # TODO: add 'address' to support items returned for a claim from lbrycrdd and lbryum-server
    def _save_support(transaction):
        claim_ids = list(claim_id_to_supports.keys())
        # delete in slices so that a large number of claims cannot exceed the limit sqlite puts on
        # the number of bound variables in one statement
        batch_size = 900
        for start_index in range(0, len(claim_ids), batch_size):
            current_batch = claim_ids[start_index:start_index + batch_size]
            bind = "({})".format(','.join(['?'] * len(current_batch)))
            transaction.execute(f"delete from support where claim_id in {bind}", current_batch)
        for claim_id, supports in claim_id_to_supports.items():
            for support in supports:
                transaction.execute(
                    "insert into support values (?, ?, ?, ?)",
                    ("%s:%i" % (support['txid'], support['nout']), claim_id, lbc_to_dewies(support['amount']),
                     support.get('address', ""))
                )

    return self.db.run(_save_support)
2018-02-12 13:36:35 -05:00
def get_supports(self, *claim_ids):
    """
    Load the stored supports of the given claim ids.

    :return: awaitable for a list of support dictionaries with "txid", "nout", "claim_id",
        "amount" (converted by dewies_to_lbc) and "address" keys
    """
    def _format_support(outpoint, supported_id, amount, address):
        outpoint_parts = outpoint.split(":")
        return {
            "txid": outpoint_parts[0],
            "nout": int(outpoint_parts[1]),
            "claim_id": supported_id,
            "amount": dewies_to_lbc(amount),
            "address": address,
        }

    def _get_supports(transaction):
        support_rows = _batched_select(
            transaction,
            "select * from support where claim_id in {}",
            tuple(claim_ids)
        )
        formatted = []
        for support_row in support_rows:
            formatted.append(_format_support(*support_row))
        return formatted

    return self.db.run(_get_supports)
2018-02-12 13:36:35 -05:00
# # # # # # # # # claim functions # # # # # # # # #
2018-12-15 15:31:02 -05:00
async def save_claims(self, claim_infos):
    """
    Store claims and, for claims whose stream has a file, update the content claim of that file.

    :param claim_infos: iterable of claim dictionaries with 'txid', 'nout', 'claim_id', 'name', 'amount',
        'height', 'address', 'claim_sequence' and 'value' keys, and optionally a 'supports' key

    After the claims are stored, the content claim callbacks of the updated streams are awaited and the
    supports of the claims that came with support info are saved.
    """
    claim_id_to_supports = {}
    update_file_callbacks = []

    def _save_claims(transaction):
        content_claims_to_update = []
        for claim_info in claim_infos:
            outpoint = "%s:%i" % (claim_info['txid'], claim_info['nout'])
            claim_id = claim_info['claim_id']
            name = claim_info['name']
            amount = lbc_to_dewies(claim_info['amount'])
            height = claim_info['height']
            address = claim_info['address']
            sequence = claim_info['claim_sequence']
            certificate_id = claim_info['value'].signing_channel_id
            try:
                source_hash = claim_info['value'].stream.source.sd_hash
            except (AttributeError, ValueError):
                source_hash = None
            serialized = binascii.hexlify(claim_info['value'].to_bytes())
            transaction.execute(
                "insert or replace into claim values (?, ?, ?, ?, ?, ?, ?, ?, ?)",
                (outpoint, claim_id, name, amount, height, serialized, certificate_id, address, sequence)
            )
            # if this response doesn't have support info don't overwrite the existing
            # support info
            if 'supports' in claim_info:
                claim_id_to_supports[claim_id] = claim_info['supports']
            if not source_hash:
                continue
            stream_hash = transaction.execute(
                "select file.stream_hash from stream "
                "inner join file on file.stream_hash=stream.stream_hash where sd_hash=?", (source_hash,)
            ).fetchone()
            if not stream_hash:
                continue
            stream_hash = stream_hash[0]
            known_outpoint = transaction.execute(
                "select claim_outpoint from content_claim where stream_hash=?", (stream_hash,)
            ).fetchone()
            known_claim_id = transaction.execute(
                "select claim_id from claim "
                "inner join content_claim c3 ON claim.claim_outpoint=c3.claim_outpoint "
                "where c3.stream_hash=?", (stream_hash,)
            ).fetchone()
            # fetchone() gives a 1-tuple (or None), so the stored outpoint has to be unwrapped
            # before it can be compared to the outpoint string
            if not known_claim_id or not known_outpoint or known_outpoint[0] != outpoint:
                content_claims_to_update.append((stream_hash, outpoint))
        for stream_hash, outpoint in content_claims_to_update:
            self._save_content_claim(transaction, outpoint, stream_hash)
            if stream_hash in self.content_claim_callbacks:
                update_file_callbacks.append(self.content_claim_callbacks[stream_hash]())

    await self.db.run(_save_claims)
    if update_file_callbacks:
        # asyncio.wait no longer accepts bare coroutines, so wrap each callback in a future first
        await asyncio.wait([asyncio.ensure_future(callback) for callback in update_file_callbacks])
    if claim_id_to_supports:
        await self.save_supports(claim_id_to_supports)
2018-08-15 19:23:06 -04:00
def save_claims_for_resolve(self, claim_infos):
    """
    Pick the claims with a value out of resolve results and save them with save_claims.

    An item with a 'value' key is taken as a claim itself, otherwise the claims under its
    'certificate' and 'claim' keys are considered. Claims are de-duplicated by claim id.
    """
    to_save = {}
    for info in claim_infos:
        if 'value' in info:
            candidates = (info,)
        else:
            candidates = (info.get(key, {}) for key in ('certificate', 'claim'))
        for candidate in candidates:
            if candidate.get('value'):
                to_save[candidate['claim_id']] = candidate
    return self.save_claims(to_save.values())
2018-08-15 19:23:06 -04:00
2018-06-20 11:41:43 -04:00
@staticmethod
def _save_content_claim(transaction, claim_outpoint, stream_hash):
    """
    Associate a stored claim to a stream after checking that the two belong together.

    :param transaction: sqlite connection to run the statements on
    :param claim_outpoint: outpoint of a claim that is already in the claim table
    :param stream_hash: hash of a stream that is already in the stream table
    :raises Exception: if the claim or the stream is not stored, the claim is not a stream claim, its
        sd hash differs from the one of the stream, or the stream is currently associated to a claim
        with a different claim id
    """
    # get the claim id and serialized metadata
    claim_row = transaction.execute(
        "select claim_id, serialized_metadata from claim where claim_outpoint=?", (claim_outpoint,)
    ).fetchone()
    if not claim_row:
        raise Exception("claim not found")
    new_claim_id = claim_row[0]
    claim = Claim.from_bytes(binascii.unhexlify(claim_row[1]))

    # certificate claims should not be in the content_claim table
    if not claim.is_stream:
        raise Exception("claim does not contain a stream")

    # get the known sd hash for this stream
    stream_row = transaction.execute(
        "select sd_hash from stream where stream_hash=?", (stream_hash,)
    ).fetchone()
    if not stream_row:
        raise Exception("stream not found")
    # check the claim contains the same sd hash
    if stream_row[0] != claim.stream.source.sd_hash:
        raise Exception("stream mismatch")

    # if there is a current claim associated to the file, check that the new claim is an update to it
    associated_row = transaction.execute(
        "select claim_outpoint from content_claim where stream_hash=?", (stream_hash,)
    ).fetchone()
    if associated_row:
        # the fetched 1-tuple is used directly as the bind parameters
        associated_claim_id = transaction.execute(
            "select claim_id from claim where claim_outpoint=?", associated_row
        ).fetchone()[0]
        if associated_claim_id != new_claim_id:
            raise Exception(
                f"mismatching claim ids when updating stream {associated_claim_id} vs {new_claim_id}"
            )

    # update the claim associated to the file
    transaction.execute("insert or replace into content_claim values (?, ?)", (stream_hash, claim_outpoint))
2018-12-15 15:31:02 -05:00
async def save_content_claim(self, stream_hash, claim_outpoint):
    """
    Store the stream -> claim association, then fire the callback registered for the stream.

    ``self._save_content_claim`` is run through ``self.db.run`` with ``claim_outpoint`` and
    ``stream_hash`` (in that order). Afterwards, if ``self.content_claim_callbacks`` has an
    entry for ``stream_hash``, that entry is called and its result awaited.

    :param stream_hash: hash of the stream being associated
    :param claim_outpoint: outpoint of the claim to associate with the stream
    """
    await self.db.run(self._save_content_claim, claim_outpoint, stream_hash)
    callbacks = self.content_claim_callbacks
    if stream_hash not in callbacks:
        # nobody asked to be notified about this stream
        return
    await callbacks[stream_hash]()
2018-02-12 13:36:35 -05:00
2019-01-22 15:43:01 -05:00
async def get_content_claim(self, stream_hash: str, include_supports: typing.Optional[bool] = True) -> typing.Dict:
    """
    Return the claim associated with a stream as a dictionary.

    :param stream_hash: hash of the stream whose claim is wanted
    :param include_supports: when truthy, the result of ``self.get_supports`` for the claim id is
        stored under ``'supports'`` and ``calculate_effective_amount`` of the claim amount and
        those supports under ``'effective_amount'``
    :return: the claim dictionary, or None when the lookup yields nothing for the stream
    """
    found = await self.db.run(get_claims_from_stream_hashes, [stream_hash])
    if not found:
        return None
    claim = found[stream_hash].as_dict()
    if include_supports:
        claim_supports = await self.get_supports(claim['claim_id'])
        claim['supports'] = claim_supports
        claim['effective_amount'] = calculate_effective_amount(claim['amount'], claim_supports)
    return claim
async def get_claims_from_stream_hashes(self, stream_hashes: typing.List[str],
                                        include_supports: typing.Optional[bool] = True):
    """
    Look up the claims for several streams and return them as plain dictionaries.

    :param stream_hashes: hashes of the streams to look up
    :param include_supports: accepted but not used by this method; no support information is
        added to the returned dictionaries regardless of its value
    :return: dict mapping each stream hash returned by the lookup to ``claim_info.as_dict()``
    """
    stored_claims = await self.db.run(get_claims_from_stream_hashes, stream_hashes)
    claim_dicts = {}
    for stream_hash, claim_info in stored_claims.items():
        claim_dicts[stream_hash] = claim_info.as_dict()
    return claim_dicts
2018-05-09 10:50:44 -03:00
2018-12-15 15:31:02 -05:00
async def get_claim(self, claim_outpoint, include_supports=True):
    """
    Return the stored claim for ``claim_outpoint`` as a dictionary.

    :param claim_outpoint: outpoint of the claim to look up
    :param include_supports: when truthy, the result of ``self.get_supports`` for the claim id is
        stored under ``'supports'`` and ``calculate_effective_amount`` of the claim amount and
        those supports under ``'effective_amount'``
    :return: the claim dictionary, or None when nothing is found for the outpoint
    """
    claim_info = await self.db.run(get_content_claim_from_outpoint, claim_outpoint)
    if claim_info:
        claim_dict = claim_info.as_dict()
        if include_supports:
            claim_supports = await self.get_supports(claim_dict['claim_id'])
            claim_dict['supports'] = claim_supports
            claim_dict['effective_amount'] = calculate_effective_amount(claim_dict['amount'], claim_supports)
        return claim_dict
    return None
2018-02-12 13:36:35 -05:00
def get_unknown_certificate_ids(self):
    """
    List channel claim ids that claims refer to but that have no row of their own.

    Selects the distinct non-empty ``channel_claim_id`` values of the ``claim`` table that do
    not appear as a ``claim_id`` in that same table.

    :return: whatever ``self.db.run`` returns for the query function; the function itself
        produces a list of claim id values
    """
    def _get_unknown_certificate_claim_ids(transaction):
        rows = transaction.execute(
            "select distinct c1.channel_claim_id from claim as c1 "
            "where c1.channel_claim_id!='' "
            "and c1.channel_claim_id not in "
            "(select c2.claim_id from claim as c2)"
        ).fetchall()
        unknown_ids = []
        for (claim_id,) in rows:
            unknown_ids.append(claim_id)
        return unknown_ids

    return self.db.run(_get_unknown_certificate_claim_ids)
2018-02-28 14:59:12 -05:00
2018-12-15 15:31:02 -05:00
async def get_pending_claim_outpoints(self):
    """
    Group the outpoints of claims stored with ``height=-1`` by transaction id.

    Every outpoint string returned by the query is split on ``":"`` into a txid and an output
    index, and the index is converted to ``int``.

    :return: dict of the form ``{txid: [nout, ...]}``; empty when no claim has ``height=-1``
    :raises ValueError: if an outpoint does not split into exactly two parts or the output
        index is not an integer
    """
    claim_outpoints = await self.run_and_return_list("select claim_outpoint from claim where height=-1")
    results = {}  # {txid: [nout, ...]}
    for outpoint_str in claim_outpoints:
        txid, nout = outpoint_str.split(":")
        results.setdefault(txid, []).append(int(nout))
    if results:
        # several pending claims can share one txid, so count outputs rather than dict keys
        pending_claims = sum(len(nouts) for nouts in results.values())
        log.debug("missing transaction heights for %i claims", pending_claims)
    return results
2018-02-28 14:59:12 -05:00
def save_claim_tx_heights(self, claim_tx_heights):
    """
    Fill in heights for claims that are still stored with ``height=-1``.

    One update is issued per entry; rows whose height is not -1 are left alone by the
    ``where`` clause.

    :param claim_tx_heights: dict mapping claim outpoint -> height
    :return: whatever ``self.db.run`` returns for the update function
    """
    update_sql = "update claim set height=? where claim_outpoint=? and height=-1"

    def _save_claim_heights(transaction):
        for claim_outpoint, tx_height in claim_tx_heights.items():
            transaction.execute(update_sql, (tx_height, claim_outpoint))

    return self.db.run(_save_claim_heights)
# # # # # # # # # reflector functions # # # # # # # # #
def update_reflected_stream(self, sd_hash, reflector_address, success=True):
    """
    Record or forget that a stream was reflected to a given reflector address.

    :param sd_hash: sd hash of the stream
    :param reflector_address: address of the reflector the stream was sent to
    :param success: when truthy, insert or replace a ``reflected_stream`` row stamped with
        ``self.time_getter()``; otherwise delete the row for this sd hash and address
    :return: whatever ``self.db.execute`` returns for the statement
    """
    if not success:
        return self.db.execute(
            "delete from reflected_stream where sd_hash=? and reflector_address=?",
            (sd_hash, reflector_address)
        )
    reflected_at = self.time_getter()
    return self.db.execute(
        "insert or replace into reflected_stream values (?, ?, ?)",
        (sd_hash, reflector_address, reflected_at)
    )
def get_streams_to_re_reflect(self):
    """
    List sd hashes of streams that have no reflected_stream timestamp or only an old one.

    A stream is selected when the left outer join finds no ``reflected_stream`` row for it
    (timestamp is null) or a row whose timestamp is below ``int(self.time_getter()) - 86400``.

    :return: whatever ``self.run_and_return_list`` returns for the query
    """
    # 86400 is presumably one day in seconds - depends on the unit of time_getter(), TODO confirm
    cutoff = int(self.time_getter()) - 86400
    query = (
        "select s.sd_hash from stream s "
        "left outer join reflected_stream r on s.sd_hash=r.sd_hash "
        "where r.timestamp is null or r.timestamp < ?"
    )
    return self.run_and_return_list(query, cutoff)