The feature can now work on emails with nested parts. Also the metadata.yaml attachment no longer needs to be the first attachment. Signed-off-by: Roberto Rosario <roberto.rosario@mayan-edms.com>
470 lines
15 KiB
Python
470 lines
15 KiB
Python
from __future__ import unicode_literals
|
|
|
|
import fcntl
|
|
from multiprocessing import Process
|
|
import shutil
|
|
|
|
import mock
|
|
from pathlib2 import Path
|
|
import yaml
|
|
try:
|
|
from yaml import CSafeDumper as SafeDumper
|
|
except ImportError:
|
|
from yaml import SafeDumper
|
|
|
|
from django.core import mail
|
|
from django.utils.encoding import force_text
|
|
|
|
from mayan.apps.documents.models import Document
|
|
from mayan.apps.documents.tests import (
|
|
GenericDocumentTestCase, TEST_COMPRESSED_DOCUMENT_PATH,
|
|
TEST_NON_ASCII_DOCUMENT_FILENAME, TEST_NON_ASCII_DOCUMENT_PATH,
|
|
TEST_NON_ASCII_COMPRESSED_DOCUMENT_PATH, TEST_SMALL_DOCUMENT_FILENAME,
|
|
TEST_SMALL_DOCUMENT_PATH
|
|
)
|
|
from mayan.apps.metadata.models import MetadataType
|
|
from mayan.apps.storage.utils import mkdtemp
|
|
|
|
from ..literals import SOURCE_UNCOMPRESS_CHOICE_Y
|
|
from ..models.email_sources import EmailBaseModel, IMAPEmail, POP3Email
|
|
from ..models.watch_folder_sources import WatchFolderSource
|
|
from ..models.webform_sources import WebFormSource
|
|
|
|
from .literals import (
|
|
TEST_EMAIL_ATTACHMENT_AND_INLINE, TEST_EMAIL_BASE64_FILENAME,
|
|
TEST_EMAIL_BASE64_FILENAME_FROM, TEST_EMAIL_BASE64_FILENAME_SUBJECT,
|
|
TEST_EMAIL_INLINE_IMAGE, TEST_EMAIL_NO_CONTENT_TYPE,
|
|
TEST_EMAIL_NO_CONTENT_TYPE_STRING, TEST_EMAIL_ZERO_LENGTH_ATTACHMENT,
|
|
TEST_WATCHFOLDER_SUBFOLDER
|
|
)
|
|
|
|
|
|
class CompressedUploadsTestCase(GenericDocumentTestCase):
|
|
auto_upload_document = False
|
|
|
|
def test_upload_compressed_file(self):
|
|
source = WebFormSource(
|
|
label='test source', uncompress=SOURCE_UNCOMPRESS_CHOICE_Y
|
|
)
|
|
|
|
with open(TEST_COMPRESSED_DOCUMENT_PATH, mode='rb') as file_object:
|
|
source.handle_upload(
|
|
document_type=self.test_document_type,
|
|
file_object=file_object,
|
|
expand=(source.uncompress == SOURCE_UNCOMPRESS_CHOICE_Y)
|
|
)
|
|
|
|
self.assertEqual(Document.objects.count(), 2)
|
|
self.assertTrue(
|
|
'first document.pdf' in Document.objects.values_list(
|
|
'label', flat=True
|
|
)
|
|
)
|
|
self.assertTrue(
|
|
'second document.pdf' in Document.objects.values_list(
|
|
'label', flat=True
|
|
)
|
|
)
|
|
|
|
|
|
class EmailBaseTestCase(GenericDocumentTestCase):
|
|
auto_upload_document = False
|
|
|
|
def _create_email_source(self):
|
|
self.source = EmailBaseModel(
|
|
document_type=self.test_document_type,
|
|
host='', username='', password='', store_body=True
|
|
)
|
|
|
|
def test_decode_email_base64_encoded_filename(self):
|
|
"""
|
|
Test decoding of base64 encoded e-mail attachment filename.
|
|
"""
|
|
self._create_email_source()
|
|
EmailBaseModel.process_message(
|
|
source=self.source, message_text=TEST_EMAIL_BASE64_FILENAME
|
|
)
|
|
|
|
self.assertEqual(
|
|
Document.objects.first().label, 'Ampelm\xe4nnchen.txt'
|
|
)
|
|
|
|
def test_decode_email_no_content_type(self):
|
|
self._create_email_source()
|
|
EmailBaseModel.process_message(
|
|
source=self.source, message_text=TEST_EMAIL_NO_CONTENT_TYPE
|
|
)
|
|
self.assertTrue(
|
|
TEST_EMAIL_NO_CONTENT_TYPE_STRING in Document.objects.first().open().read()
|
|
)
|
|
|
|
def test_decode_email_zero_length_attachment(self):
|
|
self._create_email_source()
|
|
self.source.store_body = False
|
|
self.source.save()
|
|
|
|
EmailBaseModel.process_message(
|
|
source=self.source, message_text=TEST_EMAIL_ZERO_LENGTH_ATTACHMENT
|
|
)
|
|
|
|
self.assertEqual(Document.objects.count(), 0)
|
|
|
|
def test_decode_email_with_inline_image(self):
|
|
# Silence expected errors in other apps
|
|
self._silence_logger(name='mayan.apps.converter.backends')
|
|
|
|
self._create_email_source()
|
|
EmailBaseModel.process_message(
|
|
source=self.source, message_text=TEST_EMAIL_INLINE_IMAGE
|
|
)
|
|
self.assertTrue(Document.objects.count(), 2)
|
|
self.assertQuerysetEqual(
|
|
ordered=False, qs=Document.objects.all(), values=(
|
|
'<Document: test-01.png>', '<Document: email_body.html>'
|
|
),
|
|
)
|
|
|
|
def test_decode_email_with_attachment_and_inline_image(self):
|
|
# Silence expected errors in other apps
|
|
self._silence_logger(name='mayan.apps.converter.backends')
|
|
|
|
self._create_email_source()
|
|
EmailBaseModel.process_message(
|
|
source=self.source, message_text=TEST_EMAIL_ATTACHMENT_AND_INLINE
|
|
)
|
|
self.assertTrue(Document.objects.count(), 2)
|
|
self.assertQuerysetEqual(
|
|
ordered=False, qs=Document.objects.all(), values=(
|
|
'<Document: test-01.png>', '<Document: email_body.html>',
|
|
),
|
|
)
|
|
|
|
def test_decode_email_and_store_from_and_subject_as_metadata(self):
|
|
metadata_from = MetadataType.objects.create(name='from')
|
|
metadata_subject = MetadataType.objects.create(name='subject')
|
|
self.test_document_type.metadata.create(metadata_type=metadata_from)
|
|
self.test_document_type.metadata.create(metadata_type=metadata_subject)
|
|
|
|
self._create_email_source()
|
|
self.source.from_metadata_type = metadata_from
|
|
self.source.subject_metadata_type = metadata_subject
|
|
self.source.save()
|
|
|
|
EmailBaseModel.process_message(
|
|
source=self.source, message_text=TEST_EMAIL_BASE64_FILENAME
|
|
)
|
|
|
|
document = Document.objects.first()
|
|
|
|
self.assertEqual(
|
|
document.label, 'Ampelm\xe4nnchen.txt'
|
|
)
|
|
self.assertEqual(
|
|
document.metadata.get(metadata_type=metadata_from).value,
|
|
TEST_EMAIL_BASE64_FILENAME_FROM
|
|
)
|
|
self.assertEqual(
|
|
document.metadata.get(metadata_type=metadata_subject).value,
|
|
TEST_EMAIL_BASE64_FILENAME_SUBJECT
|
|
)
|
|
|
|
def test_document_upload_no_body(self):
|
|
# Silence expected errors in other apps
|
|
self._silence_logger(name='mayan.apps.converter.backends')
|
|
|
|
self._create_email_source()
|
|
self.source.store_body = False
|
|
self.source.save()
|
|
|
|
EmailBaseModel.process_message(
|
|
source=self.source, message_text=TEST_EMAIL_ATTACHMENT_AND_INLINE
|
|
)
|
|
|
|
# Only two attachments, no body document
|
|
self.assertEqual(1, Document.objects.count())
|
|
|
|
def test_document_upload_with_body(self):
|
|
# Silence expected errors in other apps
|
|
self._silence_logger(name='mayan.apps.converter.backends')
|
|
|
|
self._create_email_source()
|
|
|
|
EmailBaseModel.process_message(
|
|
source=self.source, message_text=TEST_EMAIL_ATTACHMENT_AND_INLINE
|
|
)
|
|
|
|
# Only two attachments and a body document
|
|
self.assertEqual(2, Document.objects.count())
|
|
|
|
def test_metadata_yaml_attachment(self):
|
|
TEST_METADATA_VALUE_1 = 'test value 1'
|
|
TEST_METADATA_VALUE_2 = 'test value 2'
|
|
|
|
test_metadata_type_1 = MetadataType.objects.create(
|
|
name='test_metadata_type_1'
|
|
)
|
|
test_metadata_type_2 = MetadataType.objects.create(
|
|
name='test_metadata_type_2'
|
|
)
|
|
self.test_document_type.metadata.create(
|
|
metadata_type=test_metadata_type_1
|
|
)
|
|
self.test_document_type.metadata.create(
|
|
metadata_type=test_metadata_type_2
|
|
)
|
|
|
|
test_metadata_yaml = yaml.dump(
|
|
Dumper=SafeDumper, data={
|
|
test_metadata_type_1.name: TEST_METADATA_VALUE_1,
|
|
test_metadata_type_2.name: TEST_METADATA_VALUE_2,
|
|
}
|
|
)
|
|
|
|
# Create email with a test attachment first, then the metadata.yaml
|
|
# attachment
|
|
with mail.get_connection(
|
|
backend='django.core.mail.backends.locmem.EmailBackend'
|
|
) as connection:
|
|
email_message = mail.EmailMultiAlternatives(
|
|
body='test email body', connection=connection,
|
|
subject='test email subject', to=['test@example.com'],
|
|
)
|
|
|
|
email_message.attach(
|
|
filename='test_attachment',
|
|
content='test_content',
|
|
)
|
|
|
|
email_message.attach(
|
|
filename='metadata.yaml',
|
|
content=test_metadata_yaml,
|
|
)
|
|
|
|
email_message.send()
|
|
|
|
self._create_email_source()
|
|
self.source.store_body = True
|
|
self.source.save()
|
|
|
|
EmailBaseModel.process_message(
|
|
source=self.source, message_text=mail.outbox[0].message()
|
|
)
|
|
|
|
self.assertEqual(Document.objects.count(), 2)
|
|
|
|
for document in Document.objects.all():
|
|
self.assertEqual(
|
|
document.metadata.get(metadata_type=test_metadata_type_1).value,
|
|
TEST_METADATA_VALUE_1
|
|
)
|
|
self.assertEqual(
|
|
document.metadata.get(metadata_type=test_metadata_type_2).value,
|
|
TEST_METADATA_VALUE_2
|
|
)
|
|
|
|
|
|
class IMAPSourceTestCase(GenericDocumentTestCase):
|
|
auto_upload_document = False
|
|
|
|
class MockIMAPServer(object):
|
|
def login(self, user, password):
|
|
return ('OK', ['{} authenticated (Success)'.format(user)])
|
|
|
|
def select(self, mailbox='INBOX', readonly=False):
|
|
return ('OK', ['1'])
|
|
|
|
def search(self, charset, *criteria):
|
|
return ('OK', ['1'])
|
|
|
|
def fetch(self, message_set, message_parts):
|
|
return (
|
|
'OK', [
|
|
(
|
|
'1 (RFC822 {4800}',
|
|
TEST_EMAIL_BASE64_FILENAME
|
|
), ' FLAGS (\\Seen))'
|
|
]
|
|
)
|
|
|
|
def store(self, message_set, command, flags):
|
|
return ('OK', ['1 (FLAGS (\\Seen \\Deleted))'])
|
|
|
|
def expunge(self):
|
|
return ('OK', ['1'])
|
|
|
|
def close(self):
|
|
return ('OK', ['Returned to authenticated state. (Success)'])
|
|
|
|
def logout(self):
|
|
return ('BYE', ['LOGOUT Requested'])
|
|
|
|
@mock.patch('imaplib.IMAP4_SSL', autospec=True)
|
|
def test_download_document(self, mock_imaplib):
|
|
mock_imaplib.return_value = IMAPSourceTestCase.MockIMAPServer()
|
|
self.source = IMAPEmail.objects.create(
|
|
document_type=self.test_document_type, label='', host='',
|
|
password='', username=''
|
|
)
|
|
|
|
self.source.check_source()
|
|
self.assertEqual(
|
|
Document.objects.first().label, 'Ampelm\xe4nnchen.txt'
|
|
)
|
|
|
|
|
|
class POP3SourceTestCase(GenericDocumentTestCase):
|
|
auto_upload_document = False
|
|
|
|
class MockMailbox(object):
|
|
def dele(self, which):
|
|
return
|
|
|
|
def getwelcome(self):
|
|
return
|
|
|
|
def list(self, which=None):
|
|
return (None, ['1 test'])
|
|
|
|
def user(self, user):
|
|
return
|
|
|
|
def pass_(self, pswd):
|
|
return
|
|
|
|
def quit(self):
|
|
return
|
|
|
|
def retr(self, which=None):
|
|
return (
|
|
1, [TEST_EMAIL_BASE64_FILENAME]
|
|
)
|
|
|
|
@mock.patch('poplib.POP3_SSL', autospec=True)
|
|
def test_download_document(self, mock_poplib):
|
|
mock_poplib.return_value = POP3SourceTestCase.MockMailbox()
|
|
self.source = POP3Email.objects.create(
|
|
document_type=self.test_document_type, label='', host='', password='',
|
|
username=''
|
|
)
|
|
|
|
self.source.check_source()
|
|
self.assertEqual(
|
|
Document.objects.first().label, 'Ampelm\xe4nnchen.txt'
|
|
)
|
|
|
|
|
|
class WatchFolderTestCase(GenericDocumentTestCase):
|
|
auto_upload_document = False
|
|
|
|
def _create_test_watchfolder(self):
|
|
return WatchFolderSource.objects.create(
|
|
document_type=self.test_document_type,
|
|
folder_path=self.temporary_directory,
|
|
include_subdirectories=False,
|
|
uncompress=SOURCE_UNCOMPRESS_CHOICE_Y
|
|
)
|
|
|
|
def setUp(self):
|
|
super(WatchFolderTestCase, self).setUp()
|
|
self.temporary_directory = mkdtemp()
|
|
|
|
def tearDown(self):
|
|
shutil.rmtree(self.temporary_directory)
|
|
super(WatchFolderTestCase, self).tearDown()
|
|
|
|
def test_subfolder_support_disabled(self):
|
|
watch_folder = self._create_test_watchfolder()
|
|
|
|
test_path = Path(self.temporary_directory)
|
|
test_subfolder = test_path.joinpath(TEST_WATCHFOLDER_SUBFOLDER)
|
|
test_subfolder.mkdir()
|
|
|
|
shutil.copy(TEST_SMALL_DOCUMENT_PATH, force_text(test_subfolder))
|
|
watch_folder.check_source()
|
|
self.assertEqual(Document.objects.count(), 0)
|
|
|
|
def test_subfolder_support_enabled(self):
|
|
watch_folder = self._create_test_watchfolder()
|
|
watch_folder.include_subdirectories = True
|
|
watch_folder.save()
|
|
|
|
test_path = Path(self.temporary_directory)
|
|
test_subfolder = test_path.joinpath(TEST_WATCHFOLDER_SUBFOLDER)
|
|
test_subfolder.mkdir()
|
|
|
|
shutil.copy(TEST_SMALL_DOCUMENT_PATH, force_text(test_subfolder))
|
|
watch_folder.check_source()
|
|
self.assertEqual(Document.objects.count(), 1)
|
|
|
|
document = Document.objects.first()
|
|
|
|
self.assertEqual(document.exists(), True)
|
|
self.assertEqual(document.size, 17436)
|
|
|
|
self.assertEqual(document.file_mimetype, 'image/png')
|
|
self.assertEqual(document.file_mime_encoding, 'binary')
|
|
self.assertEqual(document.label, TEST_SMALL_DOCUMENT_FILENAME)
|
|
self.assertEqual(document.page_count, 1)
|
|
|
|
def test_issue_gh_163(self):
|
|
"""
|
|
Non-ASCII chars in document name failing in upload via watch folder
|
|
gh-issue #163 https://github.com/mayan-edms/mayan-edms/issues/163
|
|
"""
|
|
watch_folder = self._create_test_watchfolder()
|
|
|
|
shutil.copy(TEST_NON_ASCII_DOCUMENT_PATH, self.temporary_directory)
|
|
watch_folder.check_source()
|
|
self.assertEqual(Document.objects.count(), 1)
|
|
|
|
document = Document.objects.first()
|
|
|
|
self.assertEqual(document.exists(), True)
|
|
self.assertEqual(document.size, 17436)
|
|
|
|
self.assertEqual(document.file_mimetype, 'image/png')
|
|
self.assertEqual(document.file_mime_encoding, 'binary')
|
|
self.assertEqual(document.label, TEST_NON_ASCII_DOCUMENT_FILENAME)
|
|
self.assertEqual(document.page_count, 1)
|
|
|
|
def test_issue_gh_163_expanded(self):
|
|
"""
|
|
Test Non-ASCII named documents inside Non-ASCII named compressed file
|
|
"""
|
|
watch_folder = self._create_test_watchfolder()
|
|
|
|
shutil.copy(
|
|
TEST_NON_ASCII_COMPRESSED_DOCUMENT_PATH, self.temporary_directory
|
|
)
|
|
watch_folder.check_source()
|
|
self.assertEqual(Document.objects.count(), 1)
|
|
|
|
document = Document.objects.first()
|
|
|
|
self.assertEqual(document.exists(), True)
|
|
self.assertEqual(document.size, 17436)
|
|
|
|
self.assertEqual(document.file_mimetype, 'image/png')
|
|
self.assertEqual(document.file_mime_encoding, 'binary')
|
|
self.assertEqual(document.label, TEST_NON_ASCII_DOCUMENT_FILENAME)
|
|
self.assertEqual(document.page_count, 1)
|
|
|
|
def test_locking_support(self):
|
|
watch_folder = self._create_test_watchfolder()
|
|
|
|
shutil.copy(
|
|
TEST_SMALL_DOCUMENT_PATH, self.temporary_directory
|
|
)
|
|
|
|
path_test_file = Path(
|
|
self.temporary_directory, TEST_SMALL_DOCUMENT_FILENAME
|
|
)
|
|
|
|
with path_test_file.open(mode='rb+') as file_object:
|
|
fcntl.lockf(file_object, fcntl.LOCK_EX | fcntl.LOCK_NB)
|
|
process = Process(target=watch_folder.check_source)
|
|
process.start()
|
|
process.join()
|
|
|
|
self.assertEqual(Document.objects.count(), 0)
|