video_downloader_service/src/core/master_service.py

94 lines
3.3 KiB
Python
Raw Normal View History

import asyncio
import concurrent.futures as pool
import os.path
import subprocess
2023-08-24 03:28:55 +03:00
from functools import partial
from fastapi import HTTPException
from src.core.async_queue import AsyncQueue
2023-08-24 16:45:55 +03:00
from src.core.rabbitmq import get_messages
from src.core.redis_client import RedisClient
2023-08-24 16:45:55 +03:00
from src.core.result import Result, ResultTypeEnum
from src.core.ydl import VideoDownloader
from src.exceptions.download_exceptions import SiteNotImplementedException
2023-08-24 03:28:55 +03:00
class MasterService:
def __init__(self):
2023-08-24 16:45:55 +03:00
self.loop = asyncio.get_event_loop()
2023-08-24 03:28:55 +03:00
self.MAX_EXECUTOR_WORKERS = 8
2023-08-24 16:45:55 +03:00
self.executor = pool.ProcessPoolExecutor(max_workers=self.MAX_EXECUTOR_WORKERS,
initializer=executor_initializer)
self.queue = AsyncQueue()
2023-08-24 03:28:55 +03:00
self.rabbit_consumer = get_messages
2023-08-24 16:45:55 +03:00
self.currently_underway = {} # contains currently in progress videos
2023-08-24 03:28:55 +03:00
async def run(self):
subprocess.run(
"for pid in $(ps -ef | grep video_downloader_executor_process | awk '{print $2}'); do kill -9 $pid; done",
shell=True, capture_output=True
)
2023-08-24 16:45:55 +03:00
tasks = [self.loop.create_task(self.create_workers()) for i in range(self.MAX_EXECUTOR_WORKERS + 1)]
2023-08-24 03:28:55 +03:00
await asyncio.gather(self.rabbit_consumer(self.queue), *tasks)
2023-08-24 16:45:55 +03:00
async def create_workers(self):
while True:
video_params = await self.queue.get()
redis = RedisClient()
await redis.del_task_from_queue_and_add_to_tasks(task=video_params)
2023-08-24 16:45:55 +03:00
self.currently_underway[video_params['link']] = video_params
download_task = self.loop.run_in_executor(self.executor, partial(
MasterService.video_processing_executor, video_params=video_params
)
2023-08-24 16:45:55 +03:00
)
result = await download_task
await redis.del_task_from_tasks_and_add_to_task_done(task=video_params)
# TODO process result
2023-08-24 16:45:55 +03:00
self.queue.task_done()
@staticmethod
def video_download(video_params: dict):
ydl_opts = {
"format": video_params["format"],
"merge_output_format": video_params["merge_output_format"],
'outtmpl': video_params["outtmpl"],
"quiet": True
2023-08-24 16:45:55 +03:00
}
downloader = VideoDownloader(link=video_params["link"], ydl_opts=ydl_opts)
video_info = downloader.get_info()
if os.path.exists(
os.path.join(os.getcwd() + f"Youtube/{video_info['id']}_{video_info['width']}.{video_info['ext']}")
):
return Result(result_type=ResultTypeEnum.EXIST)
2023-08-24 16:45:55 +03:00
try:
downloader.ydl_opts["quiet"] = False
2023-08-24 16:45:55 +03:00
result = downloader.download()
return result
except SiteNotImplementedException as ex:
raise HTTPException(
status_code=400,
detail=ex.message
)
@staticmethod
def video_processing_executor(video_params: dict):
try:
MasterService.video_download(video_params=video_params)
return Result(result_type=ResultTypeEnum.DONE)
except Exception as ex:
return Result(result_type=ResultTypeEnum.EXCEPTION, value=ex)
# TODO upload to server
def executor_initializer():
import setproctitle
setproctitle.setproctitle(f'video_downloader_executor_process')
return True