2019-01-22 12:54:17 -05:00
|
|
|
import os
|
|
|
|
import binascii
|
|
|
|
import logging
|
|
|
|
import typing
|
|
|
|
import asyncio
|
|
|
|
from lbrynet.blob import MAX_BLOB_SIZE
|
|
|
|
from lbrynet.stream.descriptor import StreamDescriptor
|
|
|
|
if typing.TYPE_CHECKING:
|
|
|
|
from lbrynet.blob.blob_manager import BlobFileManager
|
|
|
|
from lbrynet.blob.blob_info import BlobInfo
|
|
|
|
from lbrynet.blob.blob_file import BlobFile
|
|
|
|
|
|
|
|
|
|
|
|
# Module-level logger, named after this module via __name__.
log = logging.getLogger(__name__)
|
|
|
|
|
|
|
|
|
|
|
|
def _get_next_available_file_name(download_directory: str, file_name: str) -> str:
    """
    Return a file name that does not yet exist as a regular file in ``download_directory``.

    ``file_name`` itself is tried first, exactly as given. If it is taken, candidates of the form
    ``<stem>_<n><ext>`` are tried with n = 1, 2, 3, ... where stem and extension come from the
    base name of ``file_name``.

    :param download_directory: directory in which the candidates are checked
    :param file_name: preferred file name
    :return: the first candidate for which no regular file exists
    """
    stem, suffix = os.path.splitext(os.path.basename(file_name))
    candidate = file_name
    attempt = 0
    while True:
        if not os.path.isfile(os.path.join(download_directory, candidate)):
            return candidate
        # the candidate is taken: move on to the next numbered variant
        attempt += 1
        candidate = "%s_%i%s" % (stem, attempt, suffix)
|
2019-01-22 12:54:17 -05:00
|
|
|
|
|
|
|
|
|
|
|
async def get_next_available_file_name(loop: asyncio.BaseEventLoop, download_directory: str, file_name: str) -> str:
    """
    Find an unused file name without blocking the event loop.

    The file system checks done by ``_get_next_available_file_name`` are handed to the loop's
    default executor (``run_in_executor`` is called with ``None`` as the executor).

    :param loop: event loop whose executor runs the lookup
    :param download_directory: directory in which the candidates are checked
    :param file_name: preferred file name
    :return: the file name chosen by ``_get_next_available_file_name``
    """
    lookup = loop.run_in_executor(None, _get_next_available_file_name, download_directory, file_name)
    available_name = await lookup
    return available_name
|
|
|
|
|
|
|
|
|
|
|
|
class StreamAssembler:
    """
    Decrypt the blobs listed in a stream descriptor and write them into a single output file.

    The hooks ``setup``, ``after_got_descriptor`` and ``after_finished`` do nothing here, and
    ``get_blob`` simply asks the blob manager; they are the points at which a subclass can change
    how blobs are obtained and what happens around assembly.
    """

    def __init__(self, loop: asyncio.BaseEventLoop, blob_manager: 'BlobFileManager', sd_hash: str,
                 output_file_name: typing.Optional[str] = None):
        """
        :param loop: event loop used for the events and for executor calls
        :param blob_manager: manager used to look up, complete, store and delete blobs
        :param sd_hash: hash of the stream descriptor blob
        :param output_file_name: optional initial value for ``output_file_name``
        """
        # collaborators and stream identity
        self.loop = loop
        self.blob_manager = blob_manager
        self.sd_hash = sd_hash

        # filled in by assemble_decrypted_stream()
        self.sd_blob: 'BlobFile' = None
        self.descriptor: StreamDescriptor = None

        # output destination and write progress
        self.output_file_name = output_file_name
        self.output_path = ''
        self.stream_handle = None
        self.written_bytes: int = 0

        # progress signals for observers
        self.got_descriptor = asyncio.Event(loop=self.loop)
        self.wrote_bytes_event = asyncio.Event(loop=self.loop)
        self.stream_finished_event = asyncio.Event(loop=self.loop)

    async def _decrypt_blob(self, blob: 'BlobFile', blob_info: 'BlobInfo', key: str):
        """
        Decrypt one blob and write its plaintext into the open output file.

        :param blob: blob to decrypt; a falsy value makes this a no-op
        :param blob_info: descriptor entry providing ``blob_num`` and the hex encoded ``iv``
        :param key: hex encoded decryption key
        :return: False when there is no blob or no open output handle, True after the write
        """
        if not (blob and self.stream_handle and not self.stream_handle.closed):
            return False

        def _write_plaintext():
            # position of this blob's plaintext within the output file
            position = blob_info.blob_num * (MAX_BLOB_SIZE - 1)
            self.stream_handle.seek(position)
            raw_key = binascii.unhexlify(key)
            raw_iv = binascii.unhexlify(blob_info.iv.encode())
            plaintext = blob.decrypt(raw_key, raw_iv)
            self.stream_handle.write(plaintext)
            self.stream_handle.flush()
            self.written_bytes += len(plaintext)
            log.debug("decrypted %s", blob.blob_hash[:8])

        # decryption and file I/O are blocking, so they run in the default executor
        await self.loop.run_in_executor(None, _write_plaintext)
        return True

    async def setup(self):
        """Hook awaited at the start of assembly, before the descriptor blob is fetched; no-op here."""

    async def after_got_descriptor(self):
        """Hook awaited right after the stream descriptor has been loaded; no-op here."""

    async def after_finished(self):
        """Hook awaited once every blob has been written, before the finished event is set; no-op here."""

    async def assemble_decrypted_stream(self, output_dir: str, output_file_name: typing.Optional[str] = None):
        """
        Fetch the descriptor, then decrypt every blob but the last descriptor entry into one file.

        On completion ``stream_finished_event`` is set. If assembly stops early for any reason,
        the partially written output file is removed.

        :param output_dir: existing directory to write the output file into
        :param output_file_name: preferred file name; defaults to the descriptor's suggested name
        :raises OSError: if ``output_dir`` is not a directory
        """
        if not os.path.isdir(output_dir):
            raise OSError(f"output directory does not exist: '{output_dir}' '{output_file_name}'")

        await self.setup()
        self.sd_blob = await self.get_blob(self.sd_hash)
        self.descriptor = await StreamDescriptor.from_stream_descriptor_blob(
            self.loop, self.blob_manager.blob_dir, self.sd_blob
        )
        await self.after_got_descriptor()

        # settle on an output name that does not clash with an existing file
        self.output_file_name = output_file_name or self.descriptor.suggested_file_name
        self.output_file_name = await get_next_available_file_name(self.loop, output_dir, self.output_file_name)
        self.output_path = os.path.join(output_dir, self.output_file_name)

        if not self.got_descriptor.is_set():
            self.got_descriptor.set()
        await self.blob_manager.storage.store_stream(self.sd_blob, self.descriptor)
        await self.blob_manager.blob_completed(self.sd_blob)

        last_written = None  # index of the most recently written blob, None until the first write
        completion_tasks = []
        try:
            with open(self.output_path, 'wb') as handle:
                self.stream_handle = handle
                # the last descriptor entry is skipped -- presumably a stream terminator, TODO confirm
                for blob_index, info in enumerate(self.descriptor.blobs[:-1]):
                    if info.blob_num != blob_index:
                        log.error("sd blob %s is invalid, cannot assemble stream", self.descriptor.sd_hash)
                        return
                    # retry this blob for as long as the output file stays open
                    while self.stream_handle and not self.stream_handle.closed:
                        try:
                            blob = await self.get_blob(info.blob_hash, info.length)
                            if blob and blob.length != info.length:
                                log.warning("Found incomplete, deleting: %s", info.blob_hash)
                                await self.blob_manager.delete_blobs([info.blob_hash])
                                continue
                            if await self._decrypt_blob(blob, info, self.descriptor.key):
                                completion_tasks.append(
                                    asyncio.ensure_future(self.blob_manager.blob_completed(blob))
                                )
                                last_written = blob_index
                                if not self.wrote_bytes_event.is_set():
                                    self.wrote_bytes_event.set()
                                log.debug("written %i/%i", last_written, len(self.descriptor.blobs) - 2)
                            # NOTE(review): the text this was rebuilt from had lost its indentation, so
                            # whether this break sits here or inside the `if` above could not be read
                            # off the source -- confirm against the canonical file.
                            break
                        except FileNotFoundError:
                            log.debug("stream assembler stopped")
                            return
                        except (ValueError, IOError, OSError):
                            log.warning("failed to decrypt blob %s for stream %s", info.blob_hash,
                                        self.descriptor.sd_hash)
                            continue
        finally:
            # index of the last entry of descriptor.blobs[:-1]
            final_index = len(self.descriptor.blobs) - 2
            if last_written != final_index:
                log.debug("stream decryption and assembly did not finish (%i/%i blobs are done)", last_written or 0,
                          final_index)
                if self.output_path and os.path.isfile(self.output_path):
                    log.debug("erasing incomplete file assembly: %s", self.output_path)
                    os.unlink(self.output_path)
            else:
                log.debug("finished decrypting and assembling stream")
                if completion_tasks:
                    await asyncio.wait(completion_tasks)
                await self.after_finished()
                self.stream_finished_event.set()

    async def get_blob(self, blob_hash: str, length: typing.Optional[int] = None) -> 'BlobFile':
        """
        Return the blob for ``blob_hash`` as provided by the blob manager.

        :param blob_hash: hash of the wanted blob
        :param length: optional length, passed through to the blob manager
        """
        found = self.blob_manager.get_blob(blob_hash, length)
        return found
|