Initial changes for the new queue-based OCR processing

This commit is contained in:
Roberto Rosario
2012-07-29 05:33:04 -04:00
parent d97b3f344d
commit d2e6df4dde
14 changed files with 280 additions and 180 deletions

View File

@@ -87,7 +87,7 @@ def do_document_ocr(queue_document):
parser, if the parser fails or if there is no parser registered for
the document mimetype do a visual OCR by calling tesseract
"""
for document_page in queue_document.document.pages.all():
for document_page in queue_document.document_version.pages.all():
try:
# Try to extract text by means of a parser
parse_document_page(document_page)