diff --git a/src/paperless_tesseract/parsers.py b/src/paperless_tesseract/parsers.py index a8be899f5..ecdafde98 100644 --- a/src/paperless_tesseract/parsers.py +++ b/src/paperless_tesseract/parsers.py @@ -378,13 +378,13 @@ class RasterisedDocumentParser(DocumentParser): sidecar_file, ) + if self.settings.skip_archive_file != ArchiveFileChoices.ALWAYS: + self.archive_path = archive_path + try: self.log.debug(f"Calling OCRmyPDF with args: {args}") ocrmypdf.ocr(**args) - if self.settings.skip_archive_file != ArchiveFileChoices.ALWAYS: - self.archive_path = archive_path - self.text = self.extract_text(sidecar_file, archive_path) if not self.text: