Chore: Upgrades OCRMyPDF to v16 (#7815)

2026-01-26 22:49:01 -06:00 · 2024-09-30 19:53:44 -07:00
parent 0b829cab32
commit 2ab71137b9
5 changed files with 91 additions and 38 deletions
--- a/src/paperless_mail/tests/test_parsers.py
+++ b/src/paperless_mail/tests/test_parsers.py
@@ -497,6 +497,7 @@ class TestParser:

        assert mail_parser.archive_path is not None

+    @pytest.mark.httpx_mock(can_send_already_matched_responses=True)
    def test_generate_pdf_html_email(
        self,
        httpx_mock: HTTPXMock,
@@ -575,6 +576,7 @@ class TestParser:
        with pytest.raises(ParseError):
            mail_parser.parse(html_email_file, "message/rfc822")

+    @pytest.mark.httpx_mock(can_send_already_matched_responses=True)
    def test_generate_pdf_html_email_merge_failure(
        self,
        httpx_mock: HTTPXMock,
--- a/src/paperless_tika/tests/test_tika_parser.py
+++ b/src/paperless_tika/tests/test_tika_parser.py
@@ -5,7 +5,6 @@ from pathlib import Path

 import pytest
 from httpx import codes
-from httpx._multipart import DataField
 from pytest_django.fixtures import SettingsWrapper
 from pytest_httpx import HTTPXMock

@@ -128,11 +127,22 @@ class TestTikaParser:
        tika_parser.convert_to_pdf(sample_odt_file, None)

        request = httpx_mock.get_request()
-        found = False
-        for field in request.stream.fields:
-            if isinstance(field, DataField) and field.name == "pdfa":
-                assert field.value == expected_form_value
-                found = True
-        assert found, "pdfFormat was not found"

-        httpx_mock.reset(assert_all_responses_were_requested=False)
+        expected_field_name = "pdfa"
+
+        content_type = request.headers["Content-Type"]
+        assert "multipart/form-data" in content_type
+
+        boundary = content_type.split("boundary=")[1]
+
+        parts = request.content.split(f"--{boundary}".encode())
+
+        form_field_found = any(
+            f'name="{expected_field_name}"'.encode() in part
+            and expected_form_value.encode() in part
+            for part in parts
+        )
+
+        assert form_field_found
+
+        httpx_mock.reset()