2024-09-10 07:04:39 +00:00
|
|
|
# Explicitly pin the package name; Python consults __package__ when resolving
# the relative imports used in this module (e.g. `from .supervisor_util ...`).
__package__ = 'archivebox.queues'
|
|
|
|
|
|
|
|
from django_huey import db_task, task
|
|
|
|
|
|
|
|
from huey_monitor.models import TaskModel
|
|
|
|
from huey_monitor.tqdm import ProcessInfo
|
|
|
|
|
2024-09-25 04:17:51 +00:00
|
|
|
from .supervisor_util import get_or_create_supervisord_process
|
|
|
|
|
|
|
|
|
2024-09-10 07:04:39 +00:00
|
|
|
@db_task(queue="system_tasks", context=True)
def bg_add(add_kwargs, task=None, parent_task_id=None):
    """Run ``add(**add_kwargs)`` as a background task on the ``system_tasks`` queue.

    Args:
        add_kwargs: Keyword arguments forwarded verbatim to ``add``. Must be
            truthy and contain a truthy ``"urls"`` entry.
        task: Task object supplied to the function (the decorator is declared
            with ``context=True``).
        parent_task_id: Optional id of a parent task; when given together with
            ``task``, this task is registered as its sub-task.

    Returns:
        Whatever ``add(**add_kwargs)`` returns.

    Raises:
        AssertionError: If ``add_kwargs`` is empty or has no truthy ``"urls"``.
    """
    get_or_create_supervisord_process(daemonize=True)

    # Imported after the supervisord call, inside the function rather than at
    # module import time.
    from ..main import add

    if task and parent_task_id:
        TaskModel.objects.set_parent_task(
            main_task_id=parent_task_id,
            sub_task_id=task.id,
        )

    assert add_kwargs
    assert add_kwargs.get("urls")

    # Rough estimate only: counts "://" occurrences in the urls value.
    estimated_urls = add_kwargs["urls"].count("://")

    progress = ProcessInfo(
        task,
        desc="add",
        parent_task_id=parent_task_id,
        total=estimated_urls,
    )

    outcome = add(**add_kwargs)

    # Progress is reported in one step once ``add`` has returned.
    progress.update(n=estimated_urls)
    return outcome
|
|
|
|
|
|
|
|
|
|
|
|
@task(queue="system_tasks", context=True)
def bg_archive_links(args, kwargs=None, task=None, parent_task_id=None):
    """Run ``archive_links(*args, **kwargs)`` as a background task.

    Args:
        args: Positional arguments forwarded to ``archive_links``. Must be
            non-empty with a truthy first item; ``len(args[0])`` is used as the
            progress total.
        kwargs: Optional keyword arguments forwarded to ``archive_links``;
            a falsy value is treated as an empty dict.
        task: Task object supplied to the function (the decorator is declared
            with ``context=True``).
        parent_task_id: Optional id of a parent task; when given together with
            ``task``, this task is registered as its sub-task.

    Returns:
        Whatever ``archive_links`` returns.

    Raises:
        AssertionError: If ``args`` is empty or its first item is falsy.
    """
    get_or_create_supervisord_process(daemonize=True)

    # Imported after the supervisord call, inside the function rather than at
    # module import time.
    from ..extractors import archive_links

    if task and parent_task_id:
        TaskModel.objects.set_parent_task(
            main_task_id=parent_task_id,
            sub_task_id=task.id,
        )

    assert args
    assert args[0]

    call_kwargs = kwargs if kwargs else {}
    expected_total = len(args[0])

    progress = ProcessInfo(
        task,
        desc="archive_links",
        parent_task_id=parent_task_id,
        total=expected_total,
    )

    outcome = archive_links(*args, **call_kwargs)

    # Progress is reported in one step once ``archive_links`` has returned.
    progress.update(n=expected_total)
    return outcome
|
2024-09-25 04:17:51 +00:00
|
|
|
|
|
|
|
|
|
|
|
@task(queue="system_tasks", context=True)
def bg_archive_link(args, kwargs=None, task=None, parent_task_id=None):
    """Run ``archive_link(*args, **kwargs)`` as a background task.

    Args:
        args: Positional arguments forwarded to ``archive_link``. Must be
            non-empty with a truthy first item.
        kwargs: Optional keyword arguments forwarded to ``archive_link``;
            a falsy value is treated as an empty dict.
        task: Task object supplied to the function (the decorator is declared
            with ``context=True``).
        parent_task_id: Optional id of a parent task; when given together with
            ``task``, this task is registered as its sub-task.

    Returns:
        Whatever ``archive_link`` returns.

    Raises:
        AssertionError: If ``args`` is empty or its first item is falsy.
    """
    get_or_create_supervisord_process(daemonize=True)

    # Imported after the supervisord call, inside the function rather than at
    # module import time.
    from ..extractors import archive_link

    if task and parent_task_id:
        TaskModel.objects.set_parent_task(main_task_id=parent_task_id, sub_task_id=task.id)

    assert args and args[0]
    kwargs = kwargs or {}

    # The first argument is a single link here, not a collection as in
    # bg_archive_links, so it may not support len(). Keep the original total
    # for sized inputs and otherwise count the link as one unit of work
    # (the same total bg_archive_snapshot uses for archive_link).
    try:
        rough_count = len(args[0])
    except TypeError:
        rough_count = 1

    process_info = ProcessInfo(task, desc="archive_link", parent_task_id=parent_task_id, total=rough_count)

    result = archive_link(*args, **kwargs)

    # Progress is reported in one step once ``archive_link`` has returned.
    process_info.update(n=rough_count)
    return result
|
|
|
|
|
|
|
|
|
|
|
|
@task(queue="system_tasks", context=True)
def bg_archive_snapshot(snapshot, overwrite=False, methods=None, task=None, parent_task_id=None):
    """Archive one snapshot in the background via ``archive_link``.

    Args:
        snapshot: Object providing ``as_link_with_details()``; the link it
            returns is what gets archived.
        overwrite: Forwarded to ``archive_link`` as ``overwrite``.
        methods: Forwarded to ``archive_link`` as ``methods``.
        task: Task object supplied to the function (the decorator is declared
            with ``context=True``).
        parent_task_id: Optional id of a parent task; when given together with
            ``task``, this task is registered as its sub-task.

    Returns:
        Whatever ``archive_link`` returns.
    """
    # NOTE: unlike the sibling tasks, the supervisord call is disabled here:
    # get_or_create_supervisord_process(daemonize=True)

    # Imported inside the function rather than at module import time.
    from ..extractors import archive_link

    if task and parent_task_id:
        TaskModel.objects.set_parent_task(
            main_task_id=parent_task_id,
            sub_task_id=task.id,
        )

    # A single snapshot is one unit of work.
    progress = ProcessInfo(
        task,
        desc="archive_link",
        parent_task_id=parent_task_id,
        total=1,
    )

    outcome = archive_link(
        snapshot.as_link_with_details(),
        overwrite=overwrite,
        methods=methods,
    )

    progress.update(n=1)
    return outcome
|
|
|
|
|