Unified document matching: legacy matching and automatching now work alongside each other

This commit is contained in:
Jonas Winkler
2020-10-28 11:45:11 +01:00
parent 9e4147ac52
commit 11af74ba36
16 changed files with 629 additions and 225 deletions

View File

@@ -11,6 +11,7 @@ from operator import itemgetter
from django.conf import settings
from django.utils import timezone
from paperless.db import GnuPG
from .classifier import DocumentClassifier
from .models import Document, FileInfo, Tag
from .parsers import ParseError
@@ -49,6 +50,8 @@ class Consumer:
self.consume = consume
self.scratch = scratch
self.classifier = DocumentClassifier()
os.makedirs(self.scratch, exist_ok=True)
self.storage_type = Document.STORAGE_TYPE_UNENCRYPTED
@@ -175,10 +178,22 @@ class Consumer:
"Document {} consumption finished".format(document)
)
classifier = None
try:
self.classifier.reload()
self.classifier.update(document)
classifier = self.classifier
except FileNotFoundError:
logging.getLogger(__name__).warning("Cannot classify documents, "
"classifier model file was not "
"found.")
document_consumption_finished.send(
sender=self.__class__,
document=document,
logging_group=self.logging_group
logging_group=self.logging_group,
classifier=classifier
)
return True