Skip to content

Commit

Permalink
move more logic out of the downloader component
Browse files: browse the repository at this point in the history
  • Loading branch information
shyba committed Oct 25, 2021
1 parent cc9f184 commit 94f9377
Show file tree
Hide file tree
Showing 7 changed files with 51 additions and 76 deletions.
20 changes: 11 additions & 9 deletions lbry/blob/disk_space_manager.py
Expand Up @@ -15,8 +15,12 @@ def __init__(self, config, db, blob_manager, cleaning_interval=30 * 60, analytic
self.task = None
self.analytics = analytics

async def get_free_space_bytes(self, is_network_blob=False):
    """Return the number of bytes still available under the configured storage limit.

    The limit is read from ``self.config.network_storage_limit`` when
    ``is_network_blob`` is true, otherwise from ``self.config.blob_storage_limit``.
    Both settings are expressed in megabytes and are converted to bytes here.

    The result is clamped at zero, so a limit of 0 or usage at/above the limit
    both yield 0.
    """
    limit_mb = self.config.network_storage_limit if is_network_blob else self.config.blob_storage_limit
    limit_bytes = limit_mb * 1024 * 1024
    # Subtract bytes from bytes: using get_space_used_mb() here would mix units
    # and report almost the whole limit as free regardless of real usage.
    used_bytes = await self.get_space_used_bytes(is_network_blob)
    return max(0, limit_bytes - used_bytes)

async def get_space_used_bytes(self, is_network_blob=False):
return await self.db.get_stored_blob_disk_usage(is_orphan_blob=is_network_blob)
return await self.db.get_stored_blob_disk_usage(is_network_blob=is_network_blob)

async def get_space_used_mb(self, is_network_blob=False):
    """Return the space reported by ``get_space_used_bytes`` in whole megabytes.

    ``is_network_blob`` is forwarded unchanged to ``get_space_used_bytes``.
    The byte count is divided by 1024 twice and truncated with ``int``.
    """
    used_bytes = await self.get_space_used_bytes(is_network_blob)
    megabytes = used_bytes / 1024.0 / 1024.0
    return int(megabytes)
Expand All @@ -25,23 +29,21 @@ async def clean(self):
await self._clean(False)
await self._clean(True)

async def _clean(self, from_network_storage=False):
space_used_bytes = await self.get_space_used_bytes(from_network_storage)
if from_network_storage:
storage_limit = self.config.network_storage_limit*1024*1024 if self.config.network_storage_limit else None
else:
storage_limit = self.config.blob_storage_limit*1024*1024 if self.config.blob_storage_limit else None
async def _clean(self, is_network_blob=False):
space_used_bytes = await self.get_space_used_bytes(is_network_blob)
storage_limit_mb = self.config.network_storage_limit if is_network_blob else self.config.blob_storage_limit
storage_limit = storage_limit_mb*1024*1024 if storage_limit_mb else None
if self.analytics:
asyncio.create_task(
self.analytics.send_disk_space_used(space_used_bytes, storage_limit, from_network_storage)
self.analytics.send_disk_space_used(space_used_bytes, storage_limit, is_network_blob)
)
if not storage_limit:
return 0
delete = []
available = storage_limit - space_used_bytes
if available > 0:
return 0
for blob_hash, file_size, _ in await self.db.get_stored_blobs(is_mine=False, orphans=from_network_storage):
for blob_hash, file_size, _ in await self.db.get_stored_blobs(is_mine=False, is_network_blob=is_network_blob):
delete.append(blob_hash)
available += file_size
if available > 0:
Expand Down
5 changes: 5 additions & 0 deletions lbry/dht/node.py
Expand Up @@ -31,6 +31,11 @@ def __init__(self, loop: asyncio.AbstractEventLoop, peer_manager: 'PeerManager',
self._refresh_task: asyncio.Task = None
self._storage = storage

@property
def last_requested_blob_hash(self):
    """Return the last entry of ``protocol.data_store.requested_blobs``.

    Returns ``None`` when that collection is empty. The entry is only read,
    never removed.
    """
    requested_blobs = self.protocol.data_store.requested_blobs
    if not requested_blobs:
        return None
    return requested_blobs[-1]

async def refresh_node(self, force_once=False):
while True:
# remove peers with expired blob announcements from the datastore
Expand Down
60 changes: 24 additions & 36 deletions lbry/extras/daemon/components.py
Expand Up @@ -4,7 +4,6 @@
import logging
import binascii
import typing
from collections import deque

import base58

Expand All @@ -19,7 +18,7 @@
from lbry.blob.blob_manager import BlobManager
from lbry.blob.disk_space_manager import DiskSpaceManager
from lbry.blob_exchange.server import BlobServer
from lbry.stream.downloader import StreamDownloader
from lbry.stream.background_downloader import BackgroundDownloader
from lbry.stream.stream_manager import StreamManager
from lbry.file.file_manager import FileManager
from lbry.extras.daemon.component import Component
Expand Down Expand Up @@ -381,65 +380,54 @@ async def stop(self):
self.file_manager.stop()


class BackgroundDownloader(Component):
class BackgroundDownloaderComponent(Component):
component_name = BACKGROUND_DOWNLOADER_COMPONENT
depends_on = [DATABASE_COMPONENT, BLOB_COMPONENT, DISK_SPACE_COMPONENT]

def __init__(self, component_manager):
super().__init__(component_manager)
self.task: typing.Optional[asyncio.Task] = None
self.download_loop_delay_seconds = 60
self.finished_iteration = asyncio.Event()
self.requested_blobs = deque(maxlen=10)
self.ongoing_download: typing.Optional[asyncio.Task] = None
self.space_manager: typing.Optional[DiskSpaceManager] = None
self.background_downloader: typing.Optional[BackgroundDownloader] = None
self.dht_node: typing.Optional[Node] = None

@property
def is_busy(self):
return bool(self.ongoing_download and not self.ongoing_download.done())

@property
def component(self) -> 'BackgroundDownloader':
def component(self) -> 'BackgroundDownloaderComponent':
return self

async def get_status(self):
return {'running': self.task is not None and not self.task.done(), 'enqueued': len(self.requested_blobs)}
return {'running': self.task is not None and not self.task.done(),
'ongoing_download': self.is_busy}

async def loop(self):
while True:
if self.component_manager.has_component(DHT_COMPONENT):
node = self.component_manager.get_component(DHT_COMPONENT)
self.requested_blobs = node.protocol.data_store.requested_blobs
if self.requested_blobs and (not self.ongoing_download or self.ongoing_download.done()):
blob_hash = self.requested_blobs.pop()
self.ongoing_download = asyncio.create_task(self.download_blobs(blob_hash))
self.ongoing_download.add_done_callback(lambda _: self.finished_iteration.set())
self.finished_iteration.clear()
if not self.is_busy and await self.space_manager.get_free_space_bytes(True) > 0:
blob_hash = self.dht_node.last_requested_blob_hash
if blob_hash:
self.ongoing_download = asyncio.create_task(self.background_downloader.download_blobs(blob_hash))
await asyncio.sleep(self.download_loop_delay_seconds)

async def download_blobs(self, sd_hash):
if self.conf.network_storage_limit <= 0:
return
space_manager: DiskSpaceManager = self.component_manager.get_component(DISK_SPACE_COMPONENT)
if (await space_manager.get_space_used_mb(True)) >= self.conf.network_storage_limit:
log.info("Allocated space for proactive downloader is full. Background download aborted.")
async def start(self):
self.space_manager: DiskSpaceManager = self.component_manager.get_component(DISK_SPACE_COMPONENT)
if not self.component_manager.has_component(DHT_COMPONENT):
return
self.dht_node = self.component_manager.get_component(DHT_COMPONENT)
blob_manager = self.component_manager.get_component(BLOB_COMPONENT)
downloader = StreamDownloader(asyncio.get_running_loop(), self.conf, blob_manager, sd_hash)
storage = blob_manager.storage
node = None
if self.component_manager.has_component(DHT_COMPONENT):
node = self.component_manager.get_component(DHT_COMPONENT)
try:
await downloader.start(node, save_stream=False)
except ValueError:
return
for blob_info in downloader.descriptor.blobs[:-1]:
await downloader.download_stream_blob(blob_info)
await storage.set_announce(sd_hash, downloader.descriptor.blobs[0].blob_hash)

async def start(self):
storage = self.component_manager.get_component(DATABASE_COMPONENT)
self.background_downloader = BackgroundDownloader(self.conf, storage, blob_manager, self.dht_node)
self.task = asyncio.create_task(self.loop())

async def stop(self):
if self.ongoing_download and not self.ongoing_download.done():
self.ongoing_download.cancel()
self.task.cancel()
if self.task:
self.task.cancel()


class DiskSpaceComponent(Component):
Expand Down
10 changes: 5 additions & 5 deletions lbry/extras/daemon/storage.py
Expand Up @@ -442,9 +442,9 @@ def delete_blobs(transaction):
def get_all_blob_hashes(self):
    """Return the result of selecting every ``blob_hash`` from the ``blob`` table.

    The query is passed to ``self.run_and_return_list`` and its return value
    is handed back unchanged.
    """
    query = "select blob_hash from blob"
    return self.run_and_return_list(query)

async def get_stored_blobs(self, is_mine: bool, orphans=False):
async def get_stored_blobs(self, is_mine: bool, is_network_blob=False):
is_mine = 1 if is_mine else 0
if orphans:
if is_network_blob:
return await self.db.execute_fetchall(
"select blob.blob_hash, blob.blob_length, blob.added_on "
"from blob left join stream_blob using (blob_hash) "
Expand All @@ -466,14 +466,14 @@ async def get_stored_blobs(self, is_mine: bool, orphans=False):
)
return normal_blobs + sd_blobs

async def get_stored_blob_disk_usage(self, is_mine: Optional[bool] = None, is_orphan_blob: bool = False):
async def get_stored_blob_disk_usage(self, is_mine: Optional[bool] = None, is_network_blob: bool = False):
sql = "select coalesce(sum(blob_length), 0) "
if is_orphan_blob:
if is_network_blob:
sql += "from blob left join stream_blob using (blob_hash) where stream_blob.stream_hash is null"
else:
sql += "from blob join stream_blob using (blob_hash)"
if is_mine is not None:
sql += f'{(" and " if is_orphan_blob else " where ")} is_mine=?'
sql += f'{(" and " if is_network_blob else " where ")} is_mine=?'
args = (1 if is_mine else 0,) if is_mine is not None else ()
return (await self.db.execute_fetchone(sql, args))[0]

Expand Down
4 changes: 2 additions & 2 deletions lbry/stream/background_downloader.py
Expand Up @@ -4,7 +4,7 @@


class BackgroundDownloader:
def __init__(self, conf, storage, blob_manager, dht_node):
def __init__(self, conf, storage, blob_manager, dht_node=None):
self.storage = storage
self.blob_manager = blob_manager
self.node = dht_node
Expand All @@ -18,4 +18,4 @@ async def download_blobs(self, sd_hash):
return
for blob_info in downloader.descriptor.blobs[:-1]:
await downloader.download_stream_blob(blob_info)
await self.storage.set_announce(sd_hash, downloader.descriptor.blobs[0].blob_hash)
await self.storage.set_announce(sd_hash, downloader.descriptor.blobs[0].blob_hash)
26 changes: 3 additions & 23 deletions tests/integration/datanetwork/test_file_commands.py
Expand Up @@ -4,6 +4,7 @@
from binascii import hexlify

from lbry.schema import Claim
from lbry.stream.background_downloader import BackgroundDownloader
from lbry.stream.descriptor import StreamDescriptor
from lbry.testcase import CommandTestCase
from lbry.extras.daemon.components import TorrentSession, BACKGROUND_DOWNLOADER_COMPONENT
Expand Down Expand Up @@ -611,8 +612,7 @@ async def test_ensure_download(self):
content2 = content2['outputs'][0]['value']['source']['sd_hash']
self.assertEqual('48', (await self.status())['disk_space']['space_used'])

proactive_downloader = self.daemon.component_manager.get_component(BACKGROUND_DOWNLOADER_COMPONENT)
self.daemon.conf.network_storage_limit = 100
proactive_downloader = BackgroundDownloader(self.daemon.conf, self.daemon.storage, self.daemon.blob_manager)
await self.clear()
self.assertEqual('0', (await self.status())['disk_space']['space_used'])
self.assertEqual('0', (await self.status())['disk_space']['network_seeding_space_used'])
Expand All @@ -636,34 +636,14 @@ async def test_ensure_download(self):
await proactive_downloader.download_blobs(blobs[0].blob_hash)
self.assertEqual({blobs[0].blob_hash}, self.daemon.blob_manager.completed_blob_hashes)

# trigger from requested blobs
await self.clear()
await proactive_downloader.stop()
proactive_downloader.requested_blobs.append(content1)
finished = proactive_downloader.finished_iteration.wait()
await proactive_downloader.start()
await finished
await self.assertBlobs(content1)
await self.clear()
# test that disk space manager doesn't delete orphan network blobs
await proactive_downloader.download_blobs(content1)
await self.daemon.storage.db.execute_fetchall("update blob set added_on=0") # so it is preferred for cleaning
await self.daemon.jsonrpc_get("content2", save_file=False)
while (await self.file_list())[0]['status'] == 'running':
while (await self.file_list())[0]['status'] != 'stopped':
await asyncio.sleep(0.5)
await self.assertBlobs(content1, no_files=False)

self.daemon.conf.blob_storage_limit = 1
await self.blob_clean()
await self.assertBlobs(content1, no_files=False)

# downloading above limit triggers cleanup
self.daemon.conf.network_storage_limit = 6
with self.assertLogs() as log:
await proactive_downloader.download_blobs(content2)
self.assertIn('Allocated space for proactive downloader is full.', log.output[0])
await self.assertBlobs(content1, no_files=False)
self.assertEqual('32', (await self.status())['disk_space']['network_seeding_space_used'])
await self.blob_clean()
self.assertLessEqual(int((await self.status())['disk_space']['network_seeding_space_used']),
self.daemon.conf.network_storage_limit)
2 changes: 1 addition & 1 deletion tests/unit/components/test_component_manager.py
Expand Up @@ -33,7 +33,7 @@ def setUp(self):
components.WalletServerPaymentsComponent
],
[
components.BackgroundDownloader,
components.BackgroundDownloaderComponent,
]
]
self.component_manager = ComponentManager(Config())
Expand Down

0 comments on commit 94f9377

Please sign in to comment.