mirror of
https://github.com/flibusta-apps/telegram_files_cache_server.git
synced 2025-12-06 06:35:38 +01:00
151 lines
4.1 KiB
Python
151 lines
4.1 KiB
Python
import collections
|
|
import logging
|
|
import random
|
|
from datetime import timedelta
|
|
from tempfile import SpooledTemporaryFile
|
|
from typing import Optional, cast
|
|
|
|
import httpx
|
|
from arq.connections import ArqRedis
|
|
from arq.worker import Retry
|
|
from fastapi import UploadFile
|
|
from redis import asyncio as aioredis
|
|
from redis.exceptions import LockError
|
|
|
|
from app.models import CachedFile
|
|
from app.services.caption_getter import get_caption
|
|
from app.services.downloader import download
|
|
from app.services.files_client import upload_file
|
|
from app.services.library_client import Book, get_book, get_books
|
|
|
|
logger = logging.getLogger("telegram_channel_files_manager")
|
|
|
|
|
|
PAGE_SIZE = 100
|
|
|
|
|
|
class FileTypeNotAllowed(Exception):
|
|
def __init__(self, message: str) -> None:
|
|
super().__init__(message)
|
|
|
|
|
|
async def check_books_page(ctx, page_number: int) -> None:
|
|
arq_pool: ArqRedis = ctx["arc_pool"]
|
|
|
|
page = await get_books(page_number, PAGE_SIZE)
|
|
|
|
object_ids = [book.id for book in page.items]
|
|
|
|
cached_files = await CachedFile.objects.filter(object_id__in=object_ids).all()
|
|
|
|
cached_files_map = collections.defaultdict(set)
|
|
for cached_file in cached_files:
|
|
cached_files_map[cached_file.object_id].add(cached_file.object_type)
|
|
|
|
for book in page.items:
|
|
for file_type in book.available_types:
|
|
if file_type not in cached_files_map[book.id]:
|
|
await arq_pool.enqueue_job(
|
|
"cache_file_by_book_id",
|
|
book.id,
|
|
file_type,
|
|
by_request=False,
|
|
_job_id=f"cache_file_by_book_id_{book.id}_{file_type}",
|
|
)
|
|
|
|
|
|
async def check_books(ctx: dict, *args, **kwargs) -> None: # NOSONAR
|
|
arq_pool: ArqRedis = ctx["arc_pool"]
|
|
try:
|
|
books_page = await get_books(1, PAGE_SIZE)
|
|
except httpx.ConnectError:
|
|
raise Retry(defer=15) # noqa: B904
|
|
|
|
for i, page_number in enumerate(range(books_page.total_pages, 0, -1)):
|
|
await arq_pool.enqueue_job(
|
|
"check_books_page",
|
|
page_number,
|
|
_defer_by=2 * i,
|
|
_job_id=f"check_books_page_{page_number}",
|
|
)
|
|
|
|
|
|
async def cache_file(book: Book, file_type: str) -> Optional[CachedFile]:
|
|
if await CachedFile.objects.filter(
|
|
object_id=book.id, object_type=file_type
|
|
).exists():
|
|
return
|
|
|
|
retry_exc = Retry(defer=timedelta(minutes=15).seconds * random.random())
|
|
|
|
try:
|
|
data = await download(book.source.id, book.remote_id, file_type)
|
|
except httpx.HTTPError:
|
|
raise retry_exc
|
|
|
|
if data is None:
|
|
raise retry_exc
|
|
|
|
response, client, filename = data
|
|
caption = get_caption(book)
|
|
|
|
temp_file = UploadFile(filename)
|
|
async for chunk in response.aiter_bytes(2048):
|
|
await temp_file.write(chunk)
|
|
await temp_file.seek(0)
|
|
|
|
await response.aclose()
|
|
await client.aclose()
|
|
|
|
upload_data = await upload_file(
|
|
cast(SpooledTemporaryFile, temp_file.file), filename, caption
|
|
)
|
|
|
|
if upload_data is None:
|
|
return None
|
|
|
|
return await CachedFile.objects.create(
|
|
object_id=book.id,
|
|
object_type=file_type,
|
|
message_id=upload_data.data["message_id"],
|
|
chat_id=upload_data.data["chat_id"],
|
|
)
|
|
|
|
|
|
async def cache_file_by_book_id(
|
|
ctx: dict, # NOSONAR
|
|
book_id: int,
|
|
file_type: str,
|
|
by_request: bool = True,
|
|
) -> Optional[CachedFile]:
|
|
r_client: aioredis.Redis = ctx["redis"]
|
|
|
|
get_book_retry = 3 if by_request else 1
|
|
book = await get_book(book_id, get_book_retry)
|
|
|
|
if book is None:
|
|
if by_request:
|
|
return None
|
|
raise Retry(defer=15)
|
|
|
|
if file_type not in book.available_types:
|
|
return None
|
|
|
|
lock = r_client.lock(f"{book_id}_{file_type}", blocking_timeout=5)
|
|
|
|
try:
|
|
try:
|
|
async with lock:
|
|
result = await cache_file(book, file_type)
|
|
|
|
if by_request:
|
|
return result
|
|
except LockError:
|
|
raise Retry( # noqa: B904
|
|
defer=timedelta(minutes=15).seconds * random.random()
|
|
)
|
|
except Retry as e:
|
|
if by_request:
|
|
return None
|
|
raise e
|