mirror of
https://github.com/paperless-ngx/paperless-ngx.git
synced 2025-04-02 13:45:10 -05:00
New logging appears to work
This commit is contained in:
parent
e149baec4e
commit
2fe9b0cbc1
@ -3,6 +3,7 @@ Changelog
|
|||||||
|
|
||||||
* 0.1.1 (master)
|
* 0.1.1 (master)
|
||||||
|
|
||||||
|
* `#60`_: Setup logging to actually use the Python native logging framework.
|
||||||
* `#53`_: Fixed an annoying bug that caused ``.jpeg`` and ``.JPG`` images
|
* `#53`_: Fixed an annoying bug that caused ``.jpeg`` and ``.JPG`` images
|
||||||
to be imported but made unavailable.
|
to be imported but made unavailable.
|
||||||
|
|
||||||
@ -73,3 +74,4 @@ Changelog
|
|||||||
.. _#53: https://github.com/danielquinn/paperless/issues/53
|
.. _#53: https://github.com/danielquinn/paperless/issues/53
|
||||||
.. _#54: https://github.com/danielquinn/paperless/issues/54
|
.. _#54: https://github.com/danielquinn/paperless/issues/54
|
||||||
.. _#57: https://github.com/danielquinn/paperless/issues/57
|
.. _#57: https://github.com/danielquinn/paperless/issues/57
|
||||||
|
.. _#60: https://github.com/danielquinn/paperless/issues/60
|
||||||
|
@ -3,7 +3,7 @@ from django.contrib.auth.models import User, Group
|
|||||||
from django.core.urlresolvers import reverse
|
from django.core.urlresolvers import reverse
|
||||||
from django.templatetags.static import static
|
from django.templatetags.static import static
|
||||||
|
|
||||||
from .models import Sender, Tag, Document
|
from .models import Sender, Tag, Document, Log
|
||||||
|
|
||||||
|
|
||||||
class MonthListFilter(admin.SimpleListFilter):
|
class MonthListFilter(admin.SimpleListFilter):
|
||||||
@ -57,7 +57,7 @@ class DocumentAdmin(admin.ModelAdmin):
|
|||||||
r = ""
|
r = ""
|
||||||
for tag in obj.tags.all():
|
for tag in obj.tags.all():
|
||||||
colour = tag.get_colour_display()
|
colour = tag.get_colour_display()
|
||||||
r += html_tag(
|
r += self._html_tag(
|
||||||
"a",
|
"a",
|
||||||
tag.slug,
|
tag.slug,
|
||||||
**{
|
**{
|
||||||
@ -73,9 +73,9 @@ class DocumentAdmin(admin.ModelAdmin):
|
|||||||
tags_.allow_tags = True
|
tags_.allow_tags = True
|
||||||
|
|
||||||
def document(self, obj):
|
def document(self, obj):
|
||||||
return html_tag(
|
return self._html_tag(
|
||||||
"a",
|
"a",
|
||||||
html_tag(
|
self._html_tag(
|
||||||
"img",
|
"img",
|
||||||
src=static("documents/img/{}.png".format(obj.file_type)),
|
src=static("documents/img/{}.png".format(obj.file_type)),
|
||||||
width=22,
|
width=22,
|
||||||
@ -87,23 +87,32 @@ class DocumentAdmin(admin.ModelAdmin):
|
|||||||
)
|
)
|
||||||
document.allow_tags = True
|
document.allow_tags = True
|
||||||
|
|
||||||
|
@staticmethod
|
||||||
|
def _html_tag(kind, inside=None, **kwargs):
|
||||||
|
|
||||||
|
attributes = []
|
||||||
|
for lft, rgt in kwargs.items():
|
||||||
|
attributes.append('{}="{}"'.format(lft, rgt))
|
||||||
|
|
||||||
|
if inside is not None:
|
||||||
|
return "<{kind} {attributes}>{inside}</{kind}>".format(
|
||||||
|
kind=kind, attributes=" ".join(attributes), inside=inside)
|
||||||
|
|
||||||
|
return "<{} {}/>".format(kind, " ".join(attributes))
|
||||||
|
|
||||||
|
|
||||||
|
class LogAdmin(admin.ModelAdmin):
|
||||||
|
|
||||||
|
list_display = ("message", "level", "component")
|
||||||
|
list_filter = ("level", "component",)
|
||||||
|
|
||||||
|
|
||||||
admin.site.register(Sender)
|
admin.site.register(Sender)
|
||||||
admin.site.register(Tag, TagAdmin)
|
admin.site.register(Tag, TagAdmin)
|
||||||
admin.site.register(Document, DocumentAdmin)
|
admin.site.register(Document, DocumentAdmin)
|
||||||
|
admin.site.register(Log, LogAdmin)
|
||||||
|
|
||||||
|
|
||||||
# Unless we implement multi-user, these default registrations don't make sense.
|
# Unless we implement multi-user, these default registrations don't make sense.
|
||||||
admin.site.unregister(Group)
|
admin.site.unregister(Group)
|
||||||
admin.site.unregister(User)
|
admin.site.unregister(User)
|
||||||
|
|
||||||
|
|
||||||
def html_tag(kind, inside=None, **kwargs):
|
|
||||||
|
|
||||||
attributes = []
|
|
||||||
for lft, rgt in kwargs.items():
|
|
||||||
attributes.append('{}="{}"'.format(lft, rgt))
|
|
||||||
|
|
||||||
if inside is not None:
|
|
||||||
return "<{kind} {attributes}>{inside}</{kind}>".format(
|
|
||||||
kind=kind, attributes=" ".join(attributes), inside=inside)
|
|
||||||
|
|
||||||
return "<{} {}/>".format(kind, " ".join(attributes))
|
|
||||||
|
@ -1,5 +1,8 @@
|
|||||||
import datetime
|
import datetime
|
||||||
|
import logging
|
||||||
import tempfile
|
import tempfile
|
||||||
|
import uuid
|
||||||
|
|
||||||
from multiprocessing.pool import Pool
|
from multiprocessing.pool import Pool
|
||||||
|
|
||||||
import itertools
|
import itertools
|
||||||
@ -19,10 +22,9 @@ from django.utils import timezone
|
|||||||
from django.template.defaultfilters import slugify
|
from django.template.defaultfilters import slugify
|
||||||
from pyocr.tesseract import TesseractError
|
from pyocr.tesseract import TesseractError
|
||||||
|
|
||||||
from logger.models import Log
|
|
||||||
from paperless.db import GnuPG
|
from paperless.db import GnuPG
|
||||||
|
|
||||||
from .models import Sender, Tag, Document
|
from .models import Sender, Tag, Document, Log
|
||||||
from .languages import ISO639
|
from .languages import ISO639
|
||||||
|
|
||||||
|
|
||||||
@ -67,6 +69,8 @@ class Consumer(object):
|
|||||||
def __init__(self, verbosity=1):
|
def __init__(self, verbosity=1):
|
||||||
|
|
||||||
self.verbosity = verbosity
|
self.verbosity = verbosity
|
||||||
|
self.logger = logging.getLogger(__name__)
|
||||||
|
self.logging_group = None
|
||||||
|
|
||||||
try:
|
try:
|
||||||
os.makedirs(self.SCRATCH)
|
os.makedirs(self.SCRATCH)
|
||||||
@ -86,6 +90,12 @@ class Consumer(object):
|
|||||||
raise ConsumerError(
|
raise ConsumerError(
|
||||||
"Consumption directory {} does not exist".format(self.CONSUME))
|
"Consumption directory {} does not exist".format(self.CONSUME))
|
||||||
|
|
||||||
|
def log(self, level, message):
|
||||||
|
getattr(self.logger, level)(message, extra={
|
||||||
|
"group": self.logging_group,
|
||||||
|
"component": Log.COMPONENT_CONSUMER
|
||||||
|
})
|
||||||
|
|
||||||
def consume(self):
|
def consume(self):
|
||||||
|
|
||||||
for doc in os.listdir(self.CONSUME):
|
for doc in os.listdir(self.CONSUME):
|
||||||
@ -104,7 +114,9 @@ class Consumer(object):
|
|||||||
if self._is_ready(doc):
|
if self._is_ready(doc):
|
||||||
continue
|
continue
|
||||||
|
|
||||||
Log.info("Consuming {}".format(doc), Log.COMPONENT_CONSUMER)
|
self.logging_group = uuid.uuid4()
|
||||||
|
|
||||||
|
self.log("info", "Consuming {}".format(doc))
|
||||||
|
|
||||||
tempdir = tempfile.mkdtemp(prefix="paperless", dir=self.SCRATCH)
|
tempdir = tempfile.mkdtemp(prefix="paperless", dir=self.SCRATCH)
|
||||||
pngs = self._get_greyscale(tempdir, doc)
|
pngs = self._get_greyscale(tempdir, doc)
|
||||||
@ -114,8 +126,7 @@ class Consumer(object):
|
|||||||
self._store(text, doc)
|
self._store(text, doc)
|
||||||
except OCRError:
|
except OCRError:
|
||||||
self._ignore.append(doc)
|
self._ignore.append(doc)
|
||||||
Log.error(
|
self.log("error", "OCR FAILURE: {}".format(doc))
|
||||||
"OCR FAILURE: {}".format(doc), Log.COMPONENT_CONSUMER)
|
|
||||||
self._cleanup_tempdir(tempdir)
|
self._cleanup_tempdir(tempdir)
|
||||||
continue
|
continue
|
||||||
else:
|
else:
|
||||||
@ -124,10 +135,7 @@ class Consumer(object):
|
|||||||
|
|
||||||
def _get_greyscale(self, tempdir, doc):
|
def _get_greyscale(self, tempdir, doc):
|
||||||
|
|
||||||
Log.debug(
|
self.log("info", "Generating greyscale image from {}".format(doc))
|
||||||
"Generating greyscale image from {}".format(doc),
|
|
||||||
Log.COMPONENT_CONSUMER
|
|
||||||
)
|
|
||||||
|
|
||||||
png = os.path.join(tempdir, "convert-%04d.jpg")
|
png = os.path.join(tempdir, "convert-%04d.jpg")
|
||||||
|
|
||||||
@ -143,18 +151,13 @@ class Consumer(object):
|
|||||||
|
|
||||||
return sorted(filter(lambda __: os.path.isfile(__), pngs))
|
return sorted(filter(lambda __: os.path.isfile(__), pngs))
|
||||||
|
|
||||||
@staticmethod
|
def _guess_language(self, text):
|
||||||
def _guess_language(text):
|
|
||||||
try:
|
try:
|
||||||
guess = langdetect.detect(text)
|
guess = langdetect.detect(text)
|
||||||
Log.debug(
|
self.log("debug", "Language detected: {}".format(guess))
|
||||||
"Language detected: {}".format(guess),
|
|
||||||
Log.COMPONENT_CONSUMER
|
|
||||||
)
|
|
||||||
return guess
|
return guess
|
||||||
except Exception as e:
|
except Exception as e:
|
||||||
Log.warning(
|
self.log("warning", "Language detection error: {}".format(e))
|
||||||
"Language detection error: {}".format(e), Log.COMPONENT_MAIL)
|
|
||||||
|
|
||||||
def _get_ocr(self, pngs):
|
def _get_ocr(self, pngs):
|
||||||
"""
|
"""
|
||||||
@ -165,7 +168,7 @@ class Consumer(object):
|
|||||||
if not pngs:
|
if not pngs:
|
||||||
raise OCRError
|
raise OCRError
|
||||||
|
|
||||||
Log.debug("OCRing the document", Log.COMPONENT_CONSUMER)
|
self.log("info", "OCRing the document")
|
||||||
|
|
||||||
# Since the division gets rounded down by int, this calculation works
|
# Since the division gets rounded down by int, this calculation works
|
||||||
# for every edge-case, i.e. 1
|
# for every edge-case, i.e. 1
|
||||||
@ -175,12 +178,12 @@ class Consumer(object):
|
|||||||
guessed_language = self._guess_language(raw_text)
|
guessed_language = self._guess_language(raw_text)
|
||||||
|
|
||||||
if not guessed_language or guessed_language not in ISO639:
|
if not guessed_language or guessed_language not in ISO639:
|
||||||
Log.warning("Language detection failed!", Log.COMPONENT_CONSUMER)
|
self.log("warning", "Language detection failed!")
|
||||||
if settings.FORGIVING_OCR:
|
if settings.FORGIVING_OCR:
|
||||||
Log.warning(
|
self.log(
|
||||||
|
"warning",
|
||||||
"As FORGIVING_OCR is enabled, we're going to make the "
|
"As FORGIVING_OCR is enabled, we're going to make the "
|
||||||
"best with what we have.",
|
"best with what we have."
|
||||||
Log.COMPONENT_CONSUMER
|
|
||||||
)
|
)
|
||||||
raw_text = self._assemble_ocr_sections(pngs, middle, raw_text)
|
raw_text = self._assemble_ocr_sections(pngs, middle, raw_text)
|
||||||
return raw_text
|
return raw_text
|
||||||
@ -194,12 +197,12 @@ class Consumer(object):
|
|||||||
return self._ocr(pngs, ISO639[guessed_language])
|
return self._ocr(pngs, ISO639[guessed_language])
|
||||||
except pyocr.pyocr.tesseract.TesseractError:
|
except pyocr.pyocr.tesseract.TesseractError:
|
||||||
if settings.FORGIVING_OCR:
|
if settings.FORGIVING_OCR:
|
||||||
Log.warning(
|
self.log(
|
||||||
|
"warning",
|
||||||
"OCR for {} failed, but we're going to stick with what "
|
"OCR for {} failed, but we're going to stick with what "
|
||||||
"we've got since FORGIVING_OCR is enabled.".format(
|
"we've got since FORGIVING_OCR is enabled.".format(
|
||||||
guessed_language
|
guessed_language
|
||||||
),
|
)
|
||||||
Log.COMPONENT_CONSUMER
|
|
||||||
)
|
)
|
||||||
raw_text = self._assemble_ocr_sections(pngs, middle, raw_text)
|
raw_text = self._assemble_ocr_sections(pngs, middle, raw_text)
|
||||||
return raw_text
|
return raw_text
|
||||||
@ -222,28 +225,15 @@ class Consumer(object):
|
|||||||
if not pngs:
|
if not pngs:
|
||||||
return ""
|
return ""
|
||||||
|
|
||||||
Log.debug("Parsing for {}".format(lang), Log.COMPONENT_CONSUMER)
|
self.log("info", "Parsing for {}".format(lang))
|
||||||
|
|
||||||
with Pool(processes=self.THREADS) as pool:
|
with Pool(processes=self.THREADS) as pool:
|
||||||
r = pool.map(
|
r = pool.map(image_to_string, itertools.product(pngs, [lang]))
|
||||||
self.image_to_string, itertools.product(pngs, [lang]))
|
|
||||||
r = " ".join(r)
|
r = " ".join(r)
|
||||||
|
|
||||||
# Strip out excess white space to allow matching to go smoother
|
# Strip out excess white space to allow matching to go smoother
|
||||||
return re.sub(r"\s+", " ", r)
|
return re.sub(r"\s+", " ", r)
|
||||||
|
|
||||||
def image_to_string(self, args):
|
|
||||||
png, lang = args
|
|
||||||
ocr = pyocr.get_available_tools()[0]
|
|
||||||
with Image.open(os.path.join(self.SCRATCH, png)) as f:
|
|
||||||
if ocr.can_detect_orientation():
|
|
||||||
try:
|
|
||||||
orientation = ocr.detect_orientation(f, lang=lang)
|
|
||||||
f = f.rotate(orientation["angle"], expand=1)
|
|
||||||
except TesseractError:
|
|
||||||
pass
|
|
||||||
return ocr.image_to_string(f, lang=lang)
|
|
||||||
|
|
||||||
def _guess_attributes_from_name(self, parseable):
|
def _guess_attributes_from_name(self, parseable):
|
||||||
"""
|
"""
|
||||||
We use a crude naming convention to make handling the sender, title,
|
We use a crude naming convention to make handling the sender, title,
|
||||||
@ -301,7 +291,7 @@ class Consumer(object):
|
|||||||
|
|
||||||
stats = os.stat(doc)
|
stats = os.stat(doc)
|
||||||
|
|
||||||
Log.debug("Saving record to database", Log.COMPONENT_CONSUMER)
|
self.log("debug", "Saving record to database")
|
||||||
|
|
||||||
document = Document.objects.create(
|
document = Document.objects.create(
|
||||||
sender=sender,
|
sender=sender,
|
||||||
@ -316,23 +306,22 @@ class Consumer(object):
|
|||||||
|
|
||||||
if relevant_tags:
|
if relevant_tags:
|
||||||
tag_names = ", ".join([t.slug for t in relevant_tags])
|
tag_names = ", ".join([t.slug for t in relevant_tags])
|
||||||
Log.debug(
|
self.log("debug", "Tagging with {}".format(tag_names))
|
||||||
"Tagging with {}".format(tag_names), Log.COMPONENT_CONSUMER)
|
|
||||||
document.tags.add(*relevant_tags)
|
document.tags.add(*relevant_tags)
|
||||||
|
|
||||||
with open(doc, "rb") as unencrypted:
|
with open(doc, "rb") as unencrypted:
|
||||||
with open(document.source_path, "wb") as encrypted:
|
with open(document.source_path, "wb") as encrypted:
|
||||||
Log.debug("Encrypting", Log.COMPONENT_CONSUMER)
|
self.log("debug", "Encrypting")
|
||||||
encrypted.write(GnuPG.encrypted(unencrypted))
|
encrypted.write(GnuPG.encrypted(unencrypted))
|
||||||
|
|
||||||
@staticmethod
|
self.log("info", "Completed")
|
||||||
def _cleanup_tempdir(d):
|
|
||||||
Log.debug("Deleting directory {}".format(d), Log.COMPONENT_CONSUMER)
|
def _cleanup_tempdir(self, d):
|
||||||
|
self.log("debug", "Deleting directory {}".format(d))
|
||||||
shutil.rmtree(d)
|
shutil.rmtree(d)
|
||||||
|
|
||||||
@staticmethod
|
def _cleanup_doc(self, doc):
|
||||||
def _cleanup_doc(doc):
|
self.log("debug", "Deleting document {}".format(doc))
|
||||||
Log.debug("Deleting document {}".format(doc), Log.COMPONENT_CONSUMER)
|
|
||||||
os.unlink(doc)
|
os.unlink(doc)
|
||||||
|
|
||||||
def _is_ready(self, doc):
|
def _is_ready(self, doc):
|
||||||
@ -350,3 +339,23 @@ class Consumer(object):
|
|||||||
self.stats[doc] = t
|
self.stats[doc] = t
|
||||||
|
|
||||||
return False
|
return False
|
||||||
|
|
||||||
|
|
||||||
|
def image_to_string(args):
|
||||||
|
"""
|
||||||
|
I have no idea why, but if this function were a method of Consumer, it
|
||||||
|
would explode with:
|
||||||
|
|
||||||
|
`TypeError: cannot serialize '_io.TextIOWrapper' object`.
|
||||||
|
"""
|
||||||
|
|
||||||
|
png, lang = args
|
||||||
|
ocr = pyocr.get_available_tools()[0]
|
||||||
|
with Image.open(os.path.join(Consumer.SCRATCH, png)) as f:
|
||||||
|
if ocr.can_detect_orientation():
|
||||||
|
try:
|
||||||
|
orientation = ocr.detect_orientation(f, lang=lang)
|
||||||
|
f = f.rotate(orientation["angle"], expand=1)
|
||||||
|
except TesseractError:
|
||||||
|
pass
|
||||||
|
return ocr.image_to_string(f, lang=lang)
|
||||||
|
30
src/documents/loggers.py
Normal file
30
src/documents/loggers.py
Normal file
@ -0,0 +1,30 @@
|
|||||||
|
import logging
|
||||||
|
|
||||||
|
|
||||||
|
class PaperlessLogger(logging.StreamHandler):
|
||||||
|
"""
|
||||||
|
A logger smart enough to know to log some kinds of messages to the database
|
||||||
|
for later retrieval in a pretty interface.
|
||||||
|
"""
|
||||||
|
|
||||||
|
def emit(self, record):
|
||||||
|
|
||||||
|
logging.StreamHandler.emit(self, record)
|
||||||
|
|
||||||
|
if not hasattr(record, "component"):
|
||||||
|
return
|
||||||
|
|
||||||
|
# We have to do the import here or Django will barf when it tries to
|
||||||
|
# load this because the apps aren't loaded at that point
|
||||||
|
from .models import Log
|
||||||
|
|
||||||
|
kwargs = {
|
||||||
|
"message": record.msg,
|
||||||
|
"component": record.component,
|
||||||
|
"level": record.levelno,
|
||||||
|
}
|
||||||
|
|
||||||
|
if hasattr(record, "group"):
|
||||||
|
kwargs["group"] = record.group
|
||||||
|
|
||||||
|
Log.objects.create(**kwargs)
|
@ -1,8 +1,10 @@
|
|||||||
import datetime
|
import datetime
|
||||||
import imaplib
|
import imaplib
|
||||||
|
import logging
|
||||||
import os
|
import os
|
||||||
import re
|
import re
|
||||||
import time
|
import time
|
||||||
|
import uuid
|
||||||
|
|
||||||
from base64 import b64decode
|
from base64 import b64decode
|
||||||
from email import policy
|
from email import policy
|
||||||
@ -11,10 +13,8 @@ from dateutil import parser
|
|||||||
|
|
||||||
from django.conf import settings
|
from django.conf import settings
|
||||||
|
|
||||||
from logger.models import Log
|
|
||||||
|
|
||||||
from .consumer import Consumer
|
from .consumer import Consumer
|
||||||
from .models import Sender
|
from .models import Sender, Log
|
||||||
|
|
||||||
|
|
||||||
class MailFetcherError(Exception):
|
class MailFetcherError(Exception):
|
||||||
@ -25,7 +25,20 @@ class InvalidMessageError(Exception):
|
|||||||
pass
|
pass
|
||||||
|
|
||||||
|
|
||||||
class Message(object):
|
class Loggable(object):
|
||||||
|
|
||||||
|
def __init__(self, group=None):
|
||||||
|
self.logger = logging.getLogger(__name__)
|
||||||
|
self.logging_group = group or uuid.uuid4()
|
||||||
|
|
||||||
|
def log(self, level, message):
|
||||||
|
getattr(self.logger, level)(message, extra={
|
||||||
|
"group": self.logging_group,
|
||||||
|
"component": Log.COMPONENT_MAIL
|
||||||
|
})
|
||||||
|
|
||||||
|
|
||||||
|
class Message(Loggable):
|
||||||
"""
|
"""
|
||||||
A crude, but simple email message class. We assume that there's a subject
|
A crude, but simple email message class. We assume that there's a subject
|
||||||
and n attachments, and that we don't care about the message body.
|
and n attachments, and that we don't care about the message body.
|
||||||
@ -33,13 +46,13 @@ class Message(object):
|
|||||||
|
|
||||||
SECRET = settings.UPLOAD_SHARED_SECRET
|
SECRET = settings.UPLOAD_SHARED_SECRET
|
||||||
|
|
||||||
def __init__(self, data, verbosity=1):
|
def __init__(self, data, group=None):
|
||||||
"""
|
"""
|
||||||
Cribbed heavily from
|
Cribbed heavily from
|
||||||
https://www.ianlewis.org/en/parsing-email-attachments-python
|
https://www.ianlewis.org/en/parsing-email-attachments-python
|
||||||
"""
|
"""
|
||||||
|
|
||||||
self.verbosity = verbosity
|
Loggable.__init__(self, group=group)
|
||||||
|
|
||||||
self.subject = None
|
self.subject = None
|
||||||
self.time = None
|
self.time = None
|
||||||
@ -54,8 +67,7 @@ class Message(object):
|
|||||||
|
|
||||||
self._set_time(message)
|
self._set_time(message)
|
||||||
|
|
||||||
Log.info(
|
self.log("info", 'Importing email: "{}"'.format(self.subject))
|
||||||
'Importing email: "{}"'.format(self.subject), Log.COMPONENT_MAIL)
|
|
||||||
|
|
||||||
attachments = []
|
attachments = []
|
||||||
for part in message.walk():
|
for part in message.walk():
|
||||||
@ -134,9 +146,11 @@ class Attachment(object):
|
|||||||
return self.data
|
return self.data
|
||||||
|
|
||||||
|
|
||||||
class MailFetcher(object):
|
class MailFetcher(Loggable):
|
||||||
|
|
||||||
def __init__(self, verbosity=1):
|
def __init__(self):
|
||||||
|
|
||||||
|
Loggable.__init__(self)
|
||||||
|
|
||||||
self._connection = None
|
self._connection = None
|
||||||
self._host = settings.MAIL_CONSUMPTION["HOST"]
|
self._host = settings.MAIL_CONSUMPTION["HOST"]
|
||||||
@ -148,7 +162,6 @@ class MailFetcher(object):
|
|||||||
self._enabled = bool(self._host)
|
self._enabled = bool(self._host)
|
||||||
|
|
||||||
self.last_checked = datetime.datetime.now()
|
self.last_checked = datetime.datetime.now()
|
||||||
self.verbosity = verbosity
|
|
||||||
|
|
||||||
def pull(self):
|
def pull(self):
|
||||||
"""
|
"""
|
||||||
@ -159,14 +172,11 @@ class MailFetcher(object):
|
|||||||
|
|
||||||
if self._enabled:
|
if self._enabled:
|
||||||
|
|
||||||
Log.info("Checking mail", Log.COMPONENT_MAIL)
|
self.log("info", "Checking mail")
|
||||||
|
|
||||||
for message in self._get_messages():
|
for message in self._get_messages():
|
||||||
|
|
||||||
Log.debug(
|
self.log("info", 'Storing email: "{}"'.format(message.subject))
|
||||||
'Storing email: "{}"'.format(message.subject),
|
|
||||||
Log.COMPONENT_MAIL
|
|
||||||
)
|
|
||||||
|
|
||||||
t = int(time.mktime(message.time.timetuple()))
|
t = int(time.mktime(message.time.timetuple()))
|
||||||
file_name = os.path.join(Consumer.CONSUME, message.file_name)
|
file_name = os.path.join(Consumer.CONSUME, message.file_name)
|
||||||
@ -193,7 +203,7 @@ class MailFetcher(object):
|
|||||||
self._connection.logout()
|
self._connection.logout()
|
||||||
|
|
||||||
except Exception as e:
|
except Exception as e:
|
||||||
Log.error(e, Log.COMPONENT_MAIL)
|
self.log("error", str(e))
|
||||||
|
|
||||||
return r
|
return r
|
||||||
|
|
||||||
@ -218,9 +228,9 @@ class MailFetcher(object):
|
|||||||
|
|
||||||
message = None
|
message = None
|
||||||
try:
|
try:
|
||||||
message = Message(data[0][1], self.verbosity)
|
message = Message(data[0][1], self.logging_group)
|
||||||
except InvalidMessageError as e:
|
except InvalidMessageError as e:
|
||||||
Log.error(e, Log.COMPONENT_MAIL)
|
self.log("error", str(e))
|
||||||
else:
|
else:
|
||||||
self._connection.store(num, "+FLAGS", "\\Deleted")
|
self._connection.store(num, "+FLAGS", "\\Deleted")
|
||||||
|
|
||||||
|
@ -1,5 +1,5 @@
|
|||||||
# -*- coding: utf-8 -*-
|
# -*- coding: utf-8 -*-
|
||||||
# Generated by Django 1.9 on 2016-02-14 16:08
|
# Generated by Django 1.9 on 2016-02-27 17:54
|
||||||
from __future__ import unicode_literals
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
from django.db import migrations, models
|
from django.db import migrations, models
|
||||||
@ -7,9 +7,8 @@ from django.db import migrations, models
|
|||||||
|
|
||||||
class Migration(migrations.Migration):
|
class Migration(migrations.Migration):
|
||||||
|
|
||||||
initial = True
|
|
||||||
|
|
||||||
dependencies = [
|
dependencies = [
|
||||||
|
('documents', '0009_auto_20160214_0040'),
|
||||||
]
|
]
|
||||||
|
|
||||||
operations = [
|
operations = [
|
||||||
@ -17,14 +16,15 @@ class Migration(migrations.Migration):
|
|||||||
name='Log',
|
name='Log',
|
||||||
fields=[
|
fields=[
|
||||||
('id', models.AutoField(auto_created=True, primary_key=True, serialize=False, verbose_name='ID')),
|
('id', models.AutoField(auto_created=True, primary_key=True, serialize=False, verbose_name='ID')),
|
||||||
('time', models.DateTimeField(auto_now_add=True)),
|
('group', models.UUIDField(blank=True)),
|
||||||
('message', models.TextField()),
|
('message', models.TextField()),
|
||||||
('level', models.PositiveIntegerField(choices=[(1, 'Error'), (2, 'Warning'), (3, 'Informational'), (4, 'Debugging')], default=3)),
|
('level', models.PositiveIntegerField(choices=[(10, 'Debugging'), (20, 'Informational'), (30, 'Warning'), (40, 'Error'), (50, 'Critical')], default=20)),
|
||||||
('component', models.PositiveIntegerField(choices=[(1, 'Consumer'), (2, 'Mail Fetcher')])),
|
('component', models.PositiveIntegerField(choices=[(1, 'Consumer'), (2, 'Mail Fetcher')])),
|
||||||
|
('created', models.DateTimeField(auto_now_add=True)),
|
||||||
|
('modified', models.DateTimeField(auto_now=True)),
|
||||||
],
|
],
|
||||||
),
|
options={
|
||||||
migrations.AlterModelOptions(
|
'ordering': ('-modified',),
|
||||||
name='log',
|
},
|
||||||
options={'ordering': ('-time',)},
|
|
||||||
),
|
),
|
||||||
]
|
]
|
@ -1,3 +1,4 @@
|
|||||||
|
import logging
|
||||||
import os
|
import os
|
||||||
import re
|
import re
|
||||||
|
|
||||||
@ -187,3 +188,34 @@ class Document(models.Model):
|
|||||||
@property
|
@property
|
||||||
def download_url(self):
|
def download_url(self):
|
||||||
return reverse("fetch", kwargs={"pk": self.pk})
|
return reverse("fetch", kwargs={"pk": self.pk})
|
||||||
|
|
||||||
|
|
||||||
|
class Log(models.Model):
|
||||||
|
|
||||||
|
LEVELS = (
|
||||||
|
(logging.DEBUG, "Debugging"),
|
||||||
|
(logging.INFO, "Informational"),
|
||||||
|
(logging.WARNING, "Warning"),
|
||||||
|
(logging.ERROR, "Error"),
|
||||||
|
(logging.CRITICAL, "Critical"),
|
||||||
|
)
|
||||||
|
|
||||||
|
COMPONENT_CONSUMER = 1
|
||||||
|
COMPONENT_MAIL = 2
|
||||||
|
COMPONENTS = (
|
||||||
|
(COMPONENT_CONSUMER, "Consumer"),
|
||||||
|
(COMPONENT_MAIL, "Mail Fetcher")
|
||||||
|
)
|
||||||
|
|
||||||
|
group = models.UUIDField(blank=True)
|
||||||
|
message = models.TextField()
|
||||||
|
level = models.PositiveIntegerField(choices=LEVELS, default=logging.INFO)
|
||||||
|
component = models.PositiveIntegerField(choices=COMPONENTS)
|
||||||
|
created = models.DateTimeField(auto_now_add=True)
|
||||||
|
modified = models.DateTimeField(auto_now=True)
|
||||||
|
|
||||||
|
class Meta(object):
|
||||||
|
ordering = ("-modified",)
|
||||||
|
|
||||||
|
def __str__(self):
|
||||||
|
return self.message
|
||||||
|
124
src/documents/tests/test_logger.py
Normal file
124
src/documents/tests/test_logger.py
Normal file
@ -0,0 +1,124 @@
|
|||||||
|
import logging
|
||||||
|
import uuid
|
||||||
|
|
||||||
|
from unittest import mock
|
||||||
|
|
||||||
|
from django.test import TestCase
|
||||||
|
|
||||||
|
from ..models import Log
|
||||||
|
|
||||||
|
|
||||||
|
class TestPaperlessLog(TestCase):
|
||||||
|
|
||||||
|
def __init__(self, *args, **kwargs):
|
||||||
|
TestCase.__init__(self, *args, **kwargs)
|
||||||
|
self.logger = logging.getLogger(
|
||||||
|
"documents.management.commands.document_consumer")
|
||||||
|
|
||||||
|
def test_ignored(self):
|
||||||
|
with mock.patch("logging.StreamHandler.emit") as __:
|
||||||
|
self.assertEqual(Log.objects.all().count(), 0)
|
||||||
|
self.logger.info("This is an informational message")
|
||||||
|
self.logger.warning("This is an informational message")
|
||||||
|
self.logger.error("This is an informational message")
|
||||||
|
self.logger.critical("This is an informational message")
|
||||||
|
self.assertEqual(Log.objects.all().count(), 0)
|
||||||
|
|
||||||
|
def test_that_it_saves_at_all(self):
|
||||||
|
|
||||||
|
kw = {
|
||||||
|
"group": uuid.uuid4(),
|
||||||
|
"component": Log.COMPONENT_MAIL
|
||||||
|
}
|
||||||
|
|
||||||
|
self.assertEqual(Log.objects.all().count(), 0)
|
||||||
|
|
||||||
|
with mock.patch("logging.StreamHandler.emit") as __:
|
||||||
|
|
||||||
|
# Debug messages are ignored by default
|
||||||
|
self.logger.debug("This is a debugging message", extra=kw)
|
||||||
|
self.assertEqual(Log.objects.all().count(), 0)
|
||||||
|
|
||||||
|
self.logger.info("This is an informational message", extra=kw)
|
||||||
|
self.assertEqual(Log.objects.all().count(), 1)
|
||||||
|
|
||||||
|
self.logger.warning("This is an warning message", extra=kw)
|
||||||
|
self.assertEqual(Log.objects.all().count(), 2)
|
||||||
|
|
||||||
|
self.logger.error("This is an error message", extra=kw)
|
||||||
|
self.assertEqual(Log.objects.all().count(), 3)
|
||||||
|
|
||||||
|
self.logger.critical("This is a critical message", extra=kw)
|
||||||
|
self.assertEqual(Log.objects.all().count(), 4)
|
||||||
|
|
||||||
|
def test_groups(self):
|
||||||
|
|
||||||
|
kw1 = {
|
||||||
|
"group": uuid.uuid4(),
|
||||||
|
"component": Log.COMPONENT_MAIL
|
||||||
|
}
|
||||||
|
kw2 = {
|
||||||
|
"group": uuid.uuid4(),
|
||||||
|
"component": Log.COMPONENT_MAIL
|
||||||
|
}
|
||||||
|
|
||||||
|
self.assertEqual(Log.objects.all().count(), 0)
|
||||||
|
|
||||||
|
with mock.patch("logging.StreamHandler.emit") as __:
|
||||||
|
|
||||||
|
# Debug messages are ignored by default
|
||||||
|
self.logger.debug("This is a debugging message", extra=kw1)
|
||||||
|
self.assertEqual(Log.objects.all().count(), 0)
|
||||||
|
|
||||||
|
self.logger.info("This is an informational message", extra=kw2)
|
||||||
|
self.assertEqual(Log.objects.all().count(), 1)
|
||||||
|
self.assertEqual(Log.objects.filter(group=kw2["group"]).count(), 1)
|
||||||
|
|
||||||
|
self.logger.warning("This is an warning message", extra=kw1)
|
||||||
|
self.assertEqual(Log.objects.all().count(), 2)
|
||||||
|
self.assertEqual(Log.objects.filter(group=kw1["group"]).count(), 1)
|
||||||
|
|
||||||
|
self.logger.error("This is an error message", extra=kw2)
|
||||||
|
self.assertEqual(Log.objects.all().count(), 3)
|
||||||
|
self.assertEqual(Log.objects.filter(group=kw2["group"]).count(), 2)
|
||||||
|
|
||||||
|
self.logger.critical("This is a critical message", extra=kw1)
|
||||||
|
self.assertEqual(Log.objects.all().count(), 4)
|
||||||
|
self.assertEqual(Log.objects.filter(group=kw1["group"]).count(), 2)
|
||||||
|
|
||||||
|
def test_components(self):
|
||||||
|
|
||||||
|
c1 = Log.COMPONENT_CONSUMER
|
||||||
|
c2 = Log.COMPONENT_MAIL
|
||||||
|
kw1 = {
|
||||||
|
"group": uuid.uuid4(),
|
||||||
|
"component": c1
|
||||||
|
}
|
||||||
|
kw2 = {
|
||||||
|
"group": kw1["group"],
|
||||||
|
"component": c2
|
||||||
|
}
|
||||||
|
|
||||||
|
self.assertEqual(Log.objects.all().count(), 0)
|
||||||
|
|
||||||
|
with mock.patch("logging.StreamHandler.emit") as __:
|
||||||
|
|
||||||
|
# Debug messages are ignored by default
|
||||||
|
self.logger.debug("This is a debugging message", extra=kw1)
|
||||||
|
self.assertEqual(Log.objects.all().count(), 0)
|
||||||
|
|
||||||
|
self.logger.info("This is an informational message", extra=kw2)
|
||||||
|
self.assertEqual(Log.objects.all().count(), 1)
|
||||||
|
self.assertEqual(Log.objects.filter(component=c2).count(), 1)
|
||||||
|
|
||||||
|
self.logger.warning("This is an warning message", extra=kw1)
|
||||||
|
self.assertEqual(Log.objects.all().count(), 2)
|
||||||
|
self.assertEqual(Log.objects.filter(component=c1).count(), 1)
|
||||||
|
|
||||||
|
self.logger.error("This is an error message", extra=kw2)
|
||||||
|
self.assertEqual(Log.objects.all().count(), 3)
|
||||||
|
self.assertEqual(Log.objects.filter(component=c2).count(), 2)
|
||||||
|
|
||||||
|
self.logger.critical("This is a critical message", extra=kw1)
|
||||||
|
self.assertEqual(Log.objects.all().count(), 4)
|
||||||
|
self.assertEqual(Log.objects.filter(component=c1).count(), 2)
|
@ -1,12 +0,0 @@
|
|||||||
from django.contrib import admin
|
|
||||||
|
|
||||||
from .models import Log
|
|
||||||
|
|
||||||
|
|
||||||
class LogAdmin(admin.ModelAdmin):
|
|
||||||
|
|
||||||
list_display = ("message", "level", "component")
|
|
||||||
list_filter = ("level", "component",)
|
|
||||||
|
|
||||||
|
|
||||||
admin.site.register(Log, LogAdmin)
|
|
@ -1,5 +0,0 @@
|
|||||||
from django.apps import AppConfig
|
|
||||||
|
|
||||||
|
|
||||||
class LoggerConfig(AppConfig):
|
|
||||||
name = 'logger'
|
|
@ -1,53 +0,0 @@
|
|||||||
from django.db import models
|
|
||||||
|
|
||||||
|
|
||||||
class Log(models.Model):
|
|
||||||
|
|
||||||
LEVEL_ERROR = 1
|
|
||||||
LEVEL_WARNING = 2
|
|
||||||
LEVEL_INFO = 3
|
|
||||||
LEVEL_DEBUG = 4
|
|
||||||
LEVELS = (
|
|
||||||
(LEVEL_ERROR, "Error"),
|
|
||||||
(LEVEL_WARNING, "Warning"),
|
|
||||||
(LEVEL_INFO, "Informational"),
|
|
||||||
(LEVEL_DEBUG, "Debugging"),
|
|
||||||
)
|
|
||||||
|
|
||||||
COMPONENT_CONSUMER = 1
|
|
||||||
COMPONENT_MAIL = 2
|
|
||||||
COMPONENTS = (
|
|
||||||
(COMPONENT_CONSUMER, "Consumer"),
|
|
||||||
(COMPONENT_MAIL, "Mail Fetcher")
|
|
||||||
)
|
|
||||||
|
|
||||||
time = models.DateTimeField(auto_now_add=True)
|
|
||||||
message = models.TextField()
|
|
||||||
level = models.PositiveIntegerField(choices=LEVELS, default=LEVEL_INFO)
|
|
||||||
component = models.PositiveIntegerField(choices=COMPONENTS)
|
|
||||||
|
|
||||||
class Meta(object):
|
|
||||||
ordering = ("-time",)
|
|
||||||
|
|
||||||
def __str__(self):
|
|
||||||
return self.message
|
|
||||||
|
|
||||||
@classmethod
|
|
||||||
def error(cls, message, component):
|
|
||||||
cls.objects.create(
|
|
||||||
message=message, level=cls.LEVEL_ERROR, component=component)
|
|
||||||
|
|
||||||
@classmethod
|
|
||||||
def warning(cls, message, component):
|
|
||||||
cls.objects.create(
|
|
||||||
message=message, level=cls.LEVEL_WARNING, component=component)
|
|
||||||
|
|
||||||
@classmethod
|
|
||||||
def info(cls, message, component):
|
|
||||||
cls.objects.create(
|
|
||||||
message=message, level=cls.LEVEL_INFO, component=component)
|
|
||||||
|
|
||||||
@classmethod
|
|
||||||
def debug(cls, message, component):
|
|
||||||
cls.objects.create(
|
|
||||||
message=message, level=cls.LEVEL_DEBUG, component=component)
|
|
@ -1,3 +0,0 @@
|
|||||||
from django.test import TestCase
|
|
||||||
|
|
||||||
# Create your tests here.
|
|
@ -1,3 +0,0 @@
|
|||||||
from django.shortcuts import render
|
|
||||||
|
|
||||||
# Create your views here.
|
|
@ -42,7 +42,6 @@ INSTALLED_APPS = [
|
|||||||
"django_extensions",
|
"django_extensions",
|
||||||
|
|
||||||
"documents",
|
"documents",
|
||||||
"logger",
|
|
||||||
|
|
||||||
"rest_framework",
|
"rest_framework",
|
||||||
|
|
||||||
@ -89,12 +88,12 @@ DATABASES = {
|
|||||||
"NAME": os.path.join(BASE_DIR, "..", "data", "db.sqlite3"),
|
"NAME": os.path.join(BASE_DIR, "..", "data", "db.sqlite3"),
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
if os.environ.get("PAPERLESS_DBUSER") and os.environ.get("PAPERLESS_DBPASS"):
|
if os.getenv("PAPERLESS_DBUSER") and os.getenv("PAPERLESS_DBPASS"):
|
||||||
DATABASES["default"] = {
|
DATABASES["default"] = {
|
||||||
"ENGINE": "django.db.backends.postgresql_psycopg2",
|
"ENGINE": "django.db.backends.postgresql_psycopg2",
|
||||||
"NAME": os.environ.get("PAPERLESS_DBNAME", "paperless"),
|
"NAME": os.getenv("PAPERLESS_DBNAME", "paperless"),
|
||||||
"USER": os.environ.get("PAPERLESS_DBUSER"),
|
"USER": os.getenv("PAPERLESS_DBUSER"),
|
||||||
"PASSWORD": os.environ.get("PAPERLESS_DBPASS")
|
"PASSWORD": os.getenv("PAPERLESS_DBPASS")
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
@ -141,6 +140,25 @@ STATIC_URL = '/static/'
|
|||||||
MEDIA_URL = "/media/"
|
MEDIA_URL = "/media/"
|
||||||
|
|
||||||
|
|
||||||
|
# Logging
|
||||||
|
|
||||||
|
LOGGING = {
|
||||||
|
"version": 1,
|
||||||
|
"disable_existing_loggers": False,
|
||||||
|
"handlers": {
|
||||||
|
"consumer": {
|
||||||
|
"class": "documents.loggers.PaperlessLogger",
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"loggers": {
|
||||||
|
"documents": {
|
||||||
|
"handlers": ["consumer"],
|
||||||
|
"level": os.getenv("PAPERLESS_CONSUMER_LOG_LEVEL", "INFO"),
|
||||||
|
},
|
||||||
|
},
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
# Paperless-specific stuffs
|
# Paperless-specific stuffs
|
||||||
# Change these paths if yours are different
|
# Change these paths if yours are different
|
||||||
# ----------------------------------------------------------------------------
|
# ----------------------------------------------------------------------------
|
||||||
@ -150,15 +168,15 @@ MEDIA_URL = "/media/"
|
|||||||
OCR_LANGUAGE = "eng"
|
OCR_LANGUAGE = "eng"
|
||||||
|
|
||||||
# The amount of threads to use for OCR
|
# The amount of threads to use for OCR
|
||||||
OCR_THREADS = os.environ.get("PAPERLESS_OCR_THREADS")
|
OCR_THREADS = os.getenv("PAPERLESS_OCR_THREADS")
|
||||||
|
|
||||||
# If this is true, any failed attempts to OCR a PDF will result in the PDF being
|
# If this is true, any failed attempts to OCR a PDF will result in the PDF
|
||||||
# indexed anyway, with whatever we could get. If it's False, the file will
|
# being indexed anyway, with whatever we could get. If it's False, the file
|
||||||
# simply be left in the CONSUMPTION_DIR.
|
# will simply be left in the CONSUMPTION_DIR.
|
||||||
FORGIVING_OCR = True
|
FORGIVING_OCR = True
|
||||||
|
|
||||||
# GNUPG needs a home directory for some reason
|
# GNUPG needs a home directory for some reason
|
||||||
GNUPG_HOME = os.environ.get("HOME", "/tmp")
|
GNUPG_HOME = os.getenv("HOME", "/tmp")
|
||||||
|
|
||||||
# Convert is part of the Imagemagick package
|
# Convert is part of the Imagemagick package
|
||||||
CONVERT_BINARY = "/usr/bin/convert"
|
CONVERT_BINARY = "/usr/bin/convert"
|
||||||
@ -167,16 +185,16 @@ CONVERT_BINARY = "/usr/bin/convert"
|
|||||||
SCRATCH_DIR = "/tmp/paperless"
|
SCRATCH_DIR = "/tmp/paperless"
|
||||||
|
|
||||||
# This is where Paperless will look for PDFs to index
|
# This is where Paperless will look for PDFs to index
|
||||||
CONSUMPTION_DIR = os.environ.get("PAPERLESS_CONSUME")
|
CONSUMPTION_DIR = os.getenv("PAPERLESS_CONSUME")
|
||||||
|
|
||||||
# If you want to use IMAP mail consumption, populate this with useful values.
|
# If you want to use IMAP mail consumption, populate this with useful values.
|
||||||
# If you leave HOST set to None, we assume you're not going to use this
|
# If you leave HOST set to None, we assume you're not going to use this
|
||||||
# feature.
|
# feature.
|
||||||
MAIL_CONSUMPTION = {
|
MAIL_CONSUMPTION = {
|
||||||
"HOST": os.environ.get("PAPERLESS_CONSUME_MAIL_HOST"),
|
"HOST": os.getenv("PAPERLESS_CONSUME_MAIL_HOST"),
|
||||||
"PORT": os.environ.get("PAPERLESS_CONSUME_MAIL_PORT"),
|
"PORT": os.getenv("PAPERLESS_CONSUME_MAIL_PORT"),
|
||||||
"USERNAME": os.environ.get("PAPERLESS_CONSUME_MAIL_USER"),
|
"USERNAME": os.getenv("PAPERLESS_CONSUME_MAIL_USER"),
|
||||||
"PASSWORD": os.environ.get("PAPERLESS_CONSUME_MAIL_PASS"),
|
"PASSWORD": os.getenv("PAPERLESS_CONSUME_MAIL_PASS"),
|
||||||
"USE_SSL": True, # If True, use SSL/TLS to connect
|
"USE_SSL": True, # If True, use SSL/TLS to connect
|
||||||
"INBOX": "INBOX" # The name of the inbox on the server
|
"INBOX": "INBOX" # The name of the inbox on the server
|
||||||
}
|
}
|
||||||
@ -188,9 +206,9 @@ MAIL_CONSUMPTION = {
|
|||||||
# DON'T FORGET TO SET THIS as leaving it blank may cause some strange things
|
# DON'T FORGET TO SET THIS as leaving it blank may cause some strange things
|
||||||
# with GPG, including an interesting case where it may "encrypt" zero-byte
|
# with GPG, including an interesting case where it may "encrypt" zero-byte
|
||||||
# files.
|
# files.
|
||||||
PASSPHRASE = os.environ.get("PAPERLESS_PASSPHRASE")
|
PASSPHRASE = os.getenv("PAPERLESS_PASSPHRASE")
|
||||||
|
|
||||||
# If you intend to use the "API" to push files into the consumer, you'll need
|
# If you intend to use the "API" to push files into the consumer, you'll need
|
||||||
# to provide a shared secret here. Leaving this as the default will disable
|
# to provide a shared secret here. Leaving this as the default will disable
|
||||||
# the API.
|
# the API.
|
||||||
UPLOAD_SHARED_SECRET = os.environ.get("PAPERLESS_SECRET", "")
|
UPLOAD_SHARED_SECRET = os.getenv("PAPERLESS_SECRET", "")
|
||||||
|
Loading…
x
Reference in New Issue
Block a user