mirror of
https://github.com/paperless-ngx/paperless-ngx.git
synced 2025-04-02 13:45:10 -05:00
196 lines
5.7 KiB
Python
196 lines
5.7 KiB
Python
import filecmp
|
|
import os
|
|
import shutil
|
|
from threading import Thread
|
|
from time import sleep
|
|
from unittest import mock
|
|
|
|
from django.conf import settings
|
|
from django.test import TestCase, override_settings
|
|
|
|
from documents.consumer import ConsumerError
|
|
from documents.management.commands import document_consumer
|
|
from documents.tests.utils import setup_directories, remove_dirs
|
|
|
|
|
|
class ConsumerThread(Thread):
|
|
|
|
def __init__(self):
|
|
super().__init__()
|
|
self.cmd = document_consumer.Command()
|
|
|
|
def run(self) -> None:
|
|
self.cmd.handle(directory=settings.CONSUMPTION_DIR, oneshot=False)
|
|
|
|
def stop(self):
|
|
# Consumer checks this every second.
|
|
self.cmd.stop_flag = True
|
|
|
|
|
|
def chunked(size, source):
|
|
for i in range(0, len(source), size):
|
|
yield source[i:i+size]
|
|
|
|
|
|
class TestConsumer(TestCase):
|
|
|
|
sample_file = os.path.join(os.path.dirname(__file__), "samples", "simple.pdf")
|
|
|
|
def setUp(self) -> None:
|
|
patcher = mock.patch("documents.management.commands.document_consumer.async_task")
|
|
self.task_mock = patcher.start()
|
|
self.addCleanup(patcher.stop)
|
|
|
|
self.dirs = setup_directories()
|
|
self.addCleanup(remove_dirs, self.dirs)
|
|
|
|
def t_start(self):
|
|
self.t = ConsumerThread()
|
|
self.t.start()
|
|
# give the consumer some time to do initial work
|
|
sleep(1)
|
|
|
|
def tearDown(self) -> None:
|
|
if self.t:
|
|
self.t.stop()
|
|
|
|
def wait_for_task_mock_call(self):
|
|
n = 0
|
|
while n < 100:
|
|
if self.task_mock.call_count > 0:
|
|
# give task_mock some time to finish and raise errors
|
|
sleep(1)
|
|
return
|
|
n += 1
|
|
sleep(0.1)
|
|
self.fail("async_task was never called")
|
|
|
|
# A bogus async_task that will simply check the file for
|
|
# completeness and raise an exception otherwise.
|
|
def bogus_task(self, func, filename, **kwargs):
|
|
eq = filecmp.cmp(filename, self.sample_file, shallow=False)
|
|
if not eq:
|
|
print("Consumed an INVALID file.")
|
|
raise ConsumerError("Incomplete File READ FAILED")
|
|
else:
|
|
print("Consumed a perfectly valid file.")
|
|
|
|
def slow_write_file(self, target, incomplete=False):
|
|
with open(self.sample_file, 'rb') as f:
|
|
pdf_bytes = f.read()
|
|
|
|
if incomplete:
|
|
pdf_bytes = pdf_bytes[:len(pdf_bytes) - 100]
|
|
|
|
with open(target, 'wb') as f:
|
|
# this will take 2 seconds, since the file is about 20k.
|
|
print("Start writing file.")
|
|
for b in chunked(1000, pdf_bytes):
|
|
f.write(b)
|
|
sleep(0.1)
|
|
print("file completed.")
|
|
|
|
def test_consume_file(self):
|
|
self.t_start()
|
|
|
|
f = os.path.join(self.dirs.consumption_dir, "my_file.pdf")
|
|
shutil.copy(self.sample_file, f)
|
|
|
|
self.wait_for_task_mock_call()
|
|
|
|
self.task_mock.assert_called_once()
|
|
|
|
args, kwargs = self.task_mock.call_args
|
|
self.assertEqual(args[1], f)
|
|
|
|
@override_settings(CONSUMER_POLLING=1)
|
|
def test_consume_file_polling(self):
|
|
self.test_consume_file()
|
|
|
|
def test_consume_existing_file(self):
|
|
f = os.path.join(self.dirs.consumption_dir, "my_file.pdf")
|
|
shutil.copy(self.sample_file, f)
|
|
|
|
self.t_start()
|
|
self.task_mock.assert_called_once()
|
|
|
|
args, kwargs = self.task_mock.call_args
|
|
self.assertEqual(args[1], f)
|
|
|
|
@override_settings(CONSUMER_POLLING=1)
|
|
def test_consume_existing_file_polling(self):
|
|
self.test_consume_existing_file()
|
|
|
|
@mock.patch("documents.management.commands.document_consumer.logger.error")
|
|
def test_slow_write_pdf(self, error_logger):
|
|
|
|
self.task_mock.side_effect = self.bogus_task
|
|
|
|
self.t_start()
|
|
|
|
fname = os.path.join(self.dirs.consumption_dir, "my_file.pdf")
|
|
|
|
self.slow_write_file(fname)
|
|
|
|
self.wait_for_task_mock_call()
|
|
|
|
error_logger.assert_not_called()
|
|
|
|
self.task_mock.assert_called_once()
|
|
|
|
args, kwargs = self.task_mock.call_args
|
|
self.assertEqual(args[1], fname)
|
|
|
|
@override_settings(CONSUMER_POLLING=1)
|
|
def test_slow_write_pdf_polling(self):
|
|
self.test_slow_write_pdf()
|
|
|
|
@mock.patch("documents.management.commands.document_consumer.logger.error")
|
|
def test_slow_write_and_move(self, error_logger):
|
|
|
|
self.task_mock.side_effect = self.bogus_task
|
|
|
|
self.t_start()
|
|
|
|
fname = os.path.join(self.dirs.consumption_dir, "my_file.~df")
|
|
fname2 = os.path.join(self.dirs.consumption_dir, "my_file.pdf")
|
|
|
|
self.slow_write_file(fname)
|
|
shutil.move(fname, fname2)
|
|
|
|
self.wait_for_task_mock_call()
|
|
|
|
self.task_mock.assert_called_once()
|
|
|
|
args, kwargs = self.task_mock.call_args
|
|
self.assertEqual(args[1], fname2)
|
|
|
|
error_logger.assert_not_called()
|
|
|
|
@override_settings(CONSUMER_POLLING=1)
|
|
def test_slow_write_and_move_polling(self):
|
|
self.test_slow_write_and_move()
|
|
|
|
@mock.patch("documents.management.commands.document_consumer.logger.error")
|
|
def test_slow_write_incomplete(self, error_logger):
|
|
|
|
self.task_mock.side_effect = self.bogus_task
|
|
|
|
self.t_start()
|
|
|
|
fname = os.path.join(self.dirs.consumption_dir, "my_file.pdf")
|
|
self.slow_write_file(fname, incomplete=True)
|
|
|
|
self.wait_for_task_mock_call()
|
|
|
|
self.task_mock.assert_called_once()
|
|
args, kwargs = self.task_mock.call_args
|
|
self.assertEqual(args[1], fname)
|
|
|
|
# assert that we have an error logged with this invalid file.
|
|
error_logger.assert_called_once()
|
|
|
|
@override_settings(CONSUMER_POLLING=1)
|
|
def test_slow_write_incomplete_polling(self):
|
|
self.test_slow_write_incomplete()
|