mirror of
https://github.com/paperless-ngx/paperless-ngx.git
synced 2025-08-20 00:56:26 +00:00
Merge pull request #2302 from paperless-ngx/feature-fix-display-rtl-content
This commit is contained in:
@@ -670,28 +670,14 @@ class TestParser(DirectoriesMixin, TestCase):
|
||||
- Text from the document is extracted
|
||||
"""
|
||||
parser = RasterisedDocumentParser(None)
|
||||
with mock.patch.object(
|
||||
parser,
|
||||
"construct_ocrmypdf_parameters",
|
||||
wraps=parser.construct_ocrmypdf_parameters,
|
||||
) as wrapped:
|
||||
|
||||
parser.parse(
|
||||
os.path.join(self.SAMPLE_FILES, "rtl-test.pdf"),
|
||||
"application/pdf",
|
||||
)
|
||||
parser.parse(
|
||||
os.path.join(self.SAMPLE_FILES, "rtl-test.pdf"),
|
||||
"application/pdf",
|
||||
)
|
||||
|
||||
# There isn't a good way to actually check this working, with RTL correctly return
|
||||
# as it would require tesseract-ocr-ara installed for everyone running the
|
||||
# test suite. This test does provide the coverage though and attempts to ensure
|
||||
# the force OCR happens
|
||||
self.assertIsNotNone(parser.get_text())
|
||||
|
||||
self.assertEqual(parser.construct_ocrmypdf_parameters.call_count, 2)
|
||||
# Check the last call kwargs
|
||||
self.assertTrue(
|
||||
parser.construct_ocrmypdf_parameters.call_args.kwargs["safe_fallback"],
|
||||
)
|
||||
# Copied from the PDF to here. Don't even look at it
|
||||
self.assertIn("ةﯾﻠﺧﺎدﻻ ةرازو", parser.get_text())
|
||||
|
||||
|
||||
class TestParserFileTypes(DirectoriesMixin, TestCase):
|
||||
|
Reference in New Issue
Block a user