Make cache update background task

This commit is contained in:
2022-01-08 20:51:31 +03:00
parent 272a54a6fe
commit d7620f07ad
3 changed files with 28 additions and 16 deletions

View File

@@ -1,4 +1,5 @@
import asyncio
import logging
from typing import Optional
from app.models import CachedFile
@@ -8,7 +9,15 @@ from app.services.files_uploader import upload_file
from app.services.library_client import get_books, get_book, Book
PAGE_SIZE = 50
logger = logging.getLogger("telegram_channel_files_manager")
PAGE_SIZE = 100
class FileTypeNotAllowed(Exception):
def __init__(self, message: str) -> None:
super().__init__(message)
class CacheUpdater:
@@ -18,21 +27,17 @@ class CacheUpdater:
async def _check_book(self, book: Book):
for file_type in book.available_types:
cached_file = await CachedFile.objects.get_or_none(
exists = await CachedFile.objects.filter(
object_id=book.id, object_type=file_type
)
).exists()
if cached_file is None:
if not exists:
await self.queue.put((book, file_type))
async def _start_producer(self):
books_page = await get_books(1, 1)
books_page = await get_books(1, PAGE_SIZE)
page_count = books_page.total // PAGE_SIZE
if books_page.total % PAGE_SIZE != 0:
page_count += 1
for page_number in range(1, page_count + 1):
for page_number in range(1, books_page.total_pages + 1):
page = await get_books(page_number, PAGE_SIZE)
for book in page.items:
@@ -42,6 +47,7 @@ class CacheUpdater:
@classmethod
async def _cache_file(cls, book: Book, file_type) -> Optional[CachedFile]:
logger.info(f"Cache {book.id} {file_type}...")
data = await download(book.source.id, book.remote_id, file_type)
if data is None:
@@ -70,9 +76,12 @@ class CacheUpdater:
await self._cache_file(book, file_type)
async def _update(self):
logger.info("Start update...")
await asyncio.gather(
self._start_producer(), self._start_worker(), self._start_worker()
self._start_producer(),
*[self._start_worker() for _ in range(2)],
)
logger.info("Update complete!")
@classmethod
async def update(cls):
@@ -84,6 +93,6 @@ class CacheUpdater:
book = await get_book(book_id)
if file_type not in book.available_types:
return None # ToDO: raise HTTPException
raise FileTypeNotAllowed(f"{file_type} not in {book.available_types}!")
return await cls._cache_file(book, file_type)