mirror of
https://github.com/paperless-ngx/paperless-ngx.git
synced 2026-03-19 07:25:58 +00:00
35 lines
1.2 KiB
Python
35 lines
1.2 KiB
Python
import os
|
|
|
|
from celery import Celery
|
|
from celery.signals import worker_process_init
|
|
|
|
# Set the default Django settings module for the 'celery' program.
|
|
os.environ.setdefault("DJANGO_SETTINGS_MODULE", "paperless.settings")
|
|
|
|
app = Celery("paperless")
|
|
|
|
# Using a string here means the worker doesn't have to serialize
|
|
# the configuration object to child processes.
|
|
# - namespace='CELERY' means all celery-related configuration keys
|
|
# should have a `CELERY_` prefix.
|
|
app.config_from_object("django.conf:settings", namespace="CELERY")
|
|
|
|
# Load task modules from all registered Django apps.
|
|
app.autodiscover_tasks()
|
|
|
|
|
|
@worker_process_init.connect
|
|
def on_worker_process_init(**kwargs) -> None: # pragma: no cover
|
|
"""
|
|
Register built-in parsers eagerly in each Celery worker process.
|
|
|
|
This registers only the built-in parsers (no entrypoint discovery) so
|
|
that workers can begin consuming documents immediately. Entrypoint
|
|
discovery for third-party parsers is deferred to the first call of
|
|
get_parser_registry() inside a task, keeping worker_process_init
|
|
well within its 4-second timeout budget.
|
|
"""
|
|
from paperless.parsers.registry import init_builtin_parsers
|
|
|
|
init_builtin_parsers()
|