85 lines
3.2 KiB
Python
85 lines
3.2 KiB
Python
from __future__ import absolute_import
|
|
|
|
import logging
|
|
|
|
from django.db import transaction
|
|
from django.utils.translation import ugettext_lazy as _
|
|
from django.utils.translation import ugettext
|
|
from django.db.models.signals import post_save, post_syncdb
|
|
from django.dispatch import receiver
|
|
from django.db.utils import DatabaseError
|
|
|
|
from navigation.api import (bind_links, register_multi_item_links,
|
|
register_multi_item_links)
|
|
from documents.models import Document, DocumentVersion
|
|
from maintenance.api import register_maintenance_links
|
|
from project_tools.api import register_tool
|
|
from acls.api import class_permissions
|
|
from scheduler.api import register_interval_job
|
|
from statistics.api import register_statistics
|
|
from job_processor.models import JobQueue, JobType
|
|
|
|
from .conf.settings import (AUTOMATIC_OCR, QUEUE_PROCESSING_INTERVAL)
|
|
from .models import OCRProcessingSingleton
|
|
from .api import do_document_ocr
|
|
from .permissions import PERMISSION_OCR_DOCUMENT
|
|
from .exceptions import AlreadyQueued
|
|
from . import models as ocr_models
|
|
from .statistics import get_statistics
|
|
from .literals import OCR_QUEUE_NAME
|
|
|
|
logger = logging.getLogger(__name__)
|
|
ocr_job_queue = None
|
|
|
|
from .links import (submit_document, re_queue_multiple_document,
|
|
queue_document_multiple_delete, ocr_disable,
|
|
ocr_enable, all_document_ocr_cleanup, ocr_log,
|
|
ocr_tool_link, submit_document_multiple)
|
|
|
|
bind_links([Document], [submit_document])
|
|
bind_links([OCRProcessingSingleton], [ocr_disable, ocr_enable])
|
|
#register_multi_item_links(['queue_document_list'], [re_queue_multiple_document, queue_document_multiple_delete])
|
|
|
|
register_maintenance_links([all_document_ocr_cleanup], namespace='ocr', title=_(u'OCR'))
|
|
register_multi_item_links(['folder_view', 'search', 'results', 'index_instance_node_view', 'document_find_duplicates', 'document_type_document_list', 'document_group_view', 'document_list', 'document_list_recent'], [submit_document_multiple])
|
|
|
|
|
|
@transaction.commit_on_success
|
|
def create_ocr_job_queue():
|
|
global ocr_job_queue
|
|
try:
|
|
ocr_job_queue, created = JobQueue.objects.get_or_create(name=OCR_QUEUE_NAME, defaults={'label': _('OCR'), 'unique_jobs': True})
|
|
except DatabaseError:
|
|
transaction.rollback()
|
|
|
|
|
|
@receiver(post_save, dispatch_uid='document_post_save', sender=DocumentVersion)
|
|
def document_post_save(sender, instance, **kwargs):
|
|
logger.debug('received post save signal')
|
|
logger.debug('instance: %s' % instance)
|
|
if kwargs.get('created', False):
|
|
if AUTOMATIC_OCR:
|
|
try:
|
|
DocumentQueue.objects.queue_document(instance.document)
|
|
except AlreadyQueued:
|
|
pass
|
|
|
|
# Disabled because it appears Django execute signals using the same
|
|
# process of the signal emiter effectively blocking the view until
|
|
# the OCR process completes which could take several minutes :/
|
|
#@receiver(post_save, dispatch_uid='call_queue', sender=QueueDocument)
|
|
#def call_queue(sender, **kwargs):
|
|
# if kwargs.get('created', False):
|
|
# logger.debug('got call_queue signal: %s' % kwargs)
|
|
# task_process_document_queues()
|
|
|
|
register_tool(ocr_tool_link)
|
|
|
|
class_permissions(Document, [
|
|
PERMISSION_OCR_DOCUMENT,
|
|
])
|
|
|
|
#register_statistics(get_statistics)
|
|
create_ocr_job_queue()
|
|
ocr_job_type = JobType('ocr', _(u'OCR'), do_document_ocr)
|