associate error messages with documents

This commit is contained in:
jonaswinkler 2021-02-22 11:38:16 +01:00
parent d64818b46c
commit aa3d91a338

View File

@ -4,7 +4,9 @@ import multiprocessing
import logging import logging
import os import os
import shutil import shutil
import sys
import uuid import uuid
from io import TextIOBase
import tqdm import tqdm
from django import db from django import db
@ -12,7 +14,6 @@ from django.conf import settings
from django.core.management.base import BaseCommand from django.core.management.base import BaseCommand
from django.db import transaction from django.db import transaction
from filelock import FileLock from filelock import FileLock
from whoosh.writing import AsyncWriter
from documents.models import Document from documents.models import Document
from ... import index from ... import index
@ -24,11 +25,28 @@ from ...parsers import get_parser_class_for_mime_type
logger = logging.getLogger("paperless.management.archiver") logger = logging.getLogger("paperless.management.archiver")
class LoggerWriter(TextIOBase):
def __init__(self, doc: Document):
self.doc = doc
def write(self, message):
# if statement reduces the amount of newlines that are
# printed to the logger
if message != '\n':
logger.error(
f"Document {self.doc} (ID: {self.doc.pk}): {message}"
)
def handle_document(document_id): def handle_document(document_id):
document = Document.objects.get(id=document_id) document = Document.objects.get(id=document_id)
mime_type = document.mime_type mime_type = document.mime_type
# redirect errors to the log and associate them with the current document
sys.stderr = LoggerWriter(document)
parser_class = get_parser_class_for_mime_type(mime_type) parser_class = get_parser_class_for_mime_type(mime_type)
if not parser_class: if not parser_class: