The conditional_escape call caused downloaded OCR text to contain HTML entities like &quot;.

Signed-off-by: Roberto Rosario <roberto.rosario.gonzalez@gmail.com>
This commit is contained in:
Roberto Rosario
2018-06-28 02:04:49 -04:00
parent c4c73666aa
commit 85926ae8f8

View File

@@ -2,7 +2,6 @@ from __future__ import unicode_literals
from django.apps import apps
from django.utils.encoding import force_text
from django.utils.html import conditional_escape
def get_document_ocr_content(document):
@@ -16,4 +15,4 @@ def get_document_ocr_content(document):
except DocumentPageOCRContent.DoesNotExist:
pass
else:
yield conditional_escape(force_text(page_content))
yield force_text(page_content)