From 32186e0de1328e8213edb265c3e1f98b06a6c019 Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Sun, 29 Nov 2020 16:33:33 +0100 Subject: [PATCH 001/522] added a menu for bulk edits. --- .../document-list.component.html | 26 +++++++++++++++++++ 1 file changed, 26 insertions(+) diff --git a/src-ui/src/app/components/document-list/document-list.component.html b/src-ui/src/app/components/document-list/document-list.component.html index cc682b8e3..d142fbb04 100644 --- a/src-ui/src/app/components/document-list/document-list.component.html +++ b/src-ui/src/app/components/document-list/document-list.component.html @@ -1,5 +1,31 @@ +
+ +
+ + + + + + + + + + + + + + + +
+
+
\ No newline at end of file diff --git a/src-ui/src/app/components/document-detail/document-detail.component.scss b/src-ui/src/app/components/document-detail/document-detail.component.scss index e69de29bb..630a31011 100644 --- a/src-ui/src/app/components/document-detail/document-detail.component.scss +++ b/src-ui/src/app/components/document-detail/document-detail.component.scss @@ -0,0 +1,4 @@ +.document-preview { + height: calc(100vh - 180px); + top: 70px +} \ No newline at end of file diff --git a/src-ui/src/app/components/manage/settings/settings.component.html b/src-ui/src/app/components/manage/settings/settings.component.html index 91eab807b..7a500e6eb 100644 --- a/src-ui/src/app/components/manage/settings/settings.component.html +++ b/src-ui/src/app/components/manage/settings/settings.component.html @@ -46,8 +46,8 @@ {{ config.title }} - {{ config.showInDashboard }} - {{ config.showInSideBar }} + {{ config.showInDashboard | yesno }} + {{ config.showInSideBar | yesno }} diff --git a/src-ui/src/app/pipes/yes-no.pipe.spec.ts b/src-ui/src/app/pipes/yes-no.pipe.spec.ts new file mode 100644 index 000000000..80acd8acd --- /dev/null +++ b/src-ui/src/app/pipes/yes-no.pipe.spec.ts @@ -0,0 +1,8 @@ +import { YesNoPipe } from './yes-no.pipe'; + +describe('YesNoPipe', () => { + it('create an instance', () => { + const pipe = new YesNoPipe(); + expect(pipe).toBeTruthy(); + }); +}); diff --git a/src-ui/src/app/pipes/yes-no.pipe.ts b/src-ui/src/app/pipes/yes-no.pipe.ts new file mode 100644 index 000000000..9a4ed56ef --- /dev/null +++ b/src-ui/src/app/pipes/yes-no.pipe.ts @@ -0,0 +1,12 @@ +import { Pipe, PipeTransform } from '@angular/core'; + +@Pipe({ + name: 'yesno' +}) +export class YesNoPipe implements PipeTransform { + + transform(value: boolean): unknown { + return value ? "Yes" : "No" + } + +} From c4a939dbcc363709323ce30785e007c85306bdc8 Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Tue, 8 Dec 2020 00:09:36 +0100 Subject: [PATCH 018/522] addresses #104 --- .../app/components/document-list/document-list.component.html | 4 ++-- .../app/components/document-list/document-list.component.ts | 4 ++++ 2 files changed, 6 insertions(+), 2 deletions(-) diff --git a/src-ui/src/app/components/document-list/document-list.component.html b/src-ui/src/app/components/document-list/document-list.component.html index cebe7c544..881a28dbf 100644 --- a/src-ui/src/app/components/document-list/document-list.component.html +++ b/src-ui/src/app/components/document-list/document-list.component.html @@ -44,7 +44,7 @@
-
-

{{list.collectionSize || 0}} document(s)

+

{{list.collectionSize || 0}} document(s) (filtered)

diff --git a/src-ui/src/app/components/document-list/document-list.component.ts b/src-ui/src/app/components/document-list/document-list.component.ts index dd939ac01..09e73dd96 100644 --- a/src-ui/src/app/components/document-list/document-list.component.ts +++ b/src-ui/src/app/components/document-list/document-list.component.ts @@ -32,6 +32,10 @@ export class DocumentListComponent implements OnInit { filterRules: FilterRule[] = [] showFilter = false + get isFiltered() { + return this.list.filterRules?.length > 0 + } + getTitle() { return this.list.savedViewTitle || "Documents" } From 5321ff1f207156f747b768703013d62c0e6dcdac Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Tue, 8 Dec 2020 00:45:11 +0100 Subject: [PATCH 019/522] upload status addresses #100 --- .../upload-file-widget.component.html | 25 ++++++------ .../upload-file-widget.component.ts | 38 +++++++++++++++++-- .../src/app/services/rest/document.service.ts | 2 +- 3 files changed, 50 insertions(+), 15 deletions(-) diff --git a/src-ui/src/app/components/dashboard/widgets/upload-file-widget/upload-file-widget.component.html b/src-ui/src/app/components/dashboard/widgets/upload-file-widget/upload-file-widget.component.html index cb114e49e..013486a47 100644 --- a/src-ui/src/app/components/dashboard/widgets/upload-file-widget/upload-file-widget.component.html +++ b/src-ui/src/app/components/dashboard/widgets/upload-file-widget/upload-file-widget.component.html @@ -1,15 +1,18 @@ -
- +
+ + - - + + +
+

Uploading {{uploadStatus.length}} file(s)

+ + +
+
\ No newline at end of file diff --git a/src-ui/src/app/components/dashboard/widgets/upload-file-widget/upload-file-widget.component.ts b/src-ui/src/app/components/dashboard/widgets/upload-file-widget/upload-file-widget.component.ts index 1003f31db..90bfbf1e5 100644 --- a/src-ui/src/app/components/dashboard/widgets/upload-file-widget/upload-file-widget.component.ts +++ b/src-ui/src/app/components/dashboard/widgets/upload-file-widget/upload-file-widget.component.ts @@ -1,8 +1,16 @@ +import { HttpEventType } from '@angular/common/http'; import { Component, OnInit } from '@angular/core'; import { FileSystemFileEntry, NgxFileDropEntry } from 'ngx-file-drop'; import { DocumentService } from 'src/app/services/rest/document.service'; import { Toast, ToastService } from 'src/app/services/toast.service'; + +interface UploadStatus { + file: string + loaded: number + total: number +} + @Component({ selector: 'app-upload-file-widget', templateUrl: './upload-file-widget.component.html', @@ -21,16 +29,40 @@ export class UploadFileWidgetComponent implements OnInit { public fileLeave(event){ } + uploadStatus: UploadStatus[] = [] + + uploadVisible = false + + get loadedSum() { + return this.uploadStatus.map(s => s.loaded).reduce((a,b) => a+b, 1) + } + + get totalSum() { + return this.uploadStatus.map(s => s.total).reduce((a,b) => a+b, 1) + } + public dropped(files: NgxFileDropEntry[]) { for (const droppedFile of files) { if (droppedFile.fileEntry.isFile) { const fileEntry = droppedFile.fileEntry as FileSystemFileEntry; fileEntry.file((file: File) => { - const formData = new FormData() + let formData = new FormData() formData.append('document', file, file.name) - this.documentService.uploadDocument(formData).subscribe(result => { - this.toastService.showToast(Toast.make("Information", "The document has been uploaded and will be processed by the consumer shortly.")) + + let uploadStatusObject: UploadStatus = {file: file.name, loaded: 0, total: 1} + this.uploadStatus.push(uploadStatusObject) + this.uploadVisible = true + this.documentService.uploadDocument(formData).subscribe(event => { + if (event.type == HttpEventType.UploadProgress) { + uploadStatusObject.loaded = event.loaded + uploadStatusObject.total = event.total + } else if (event.type == HttpEventType.Response) { + this.uploadStatus.splice(this.uploadStatus.indexOf(uploadStatusObject), 1) + this.toastService.showToast(Toast.make("Information", "The document has been uploaded and will be processed by the consumer shortly.")) + } + }, error => { + this.uploadStatus.splice(this.uploadStatus.indexOf(uploadStatusObject), 1) switch (error.status) { case 400: { this.toastService.showToast(Toast.makeError(`There was an error while uploading the document: ${error.error.document}`)) diff --git a/src-ui/src/app/services/rest/document.service.ts b/src-ui/src/app/services/rest/document.service.ts index 5bf2308d4..81693ec68 100644 --- a/src-ui/src/app/services/rest/document.service.ts +++ b/src-ui/src/app/services/rest/document.service.ts @@ -94,7 +94,7 @@ export class DocumentService extends AbstractPaperlessService } uploadDocument(formData) { - return this.http.post(this.getResourceUrl(null, 'post_document'), formData) + return this.http.post(this.getResourceUrl(null, 'post_document'), formData, {reportProgress: true, observe: "events"}) } getMetadata(id: number): Observable { From 30f200ad395f6d4e2a3c284da1c4a8e741390f37 Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Tue, 8 Dec 2020 00:45:23 +0100 Subject: [PATCH 020/522] fix z-order on the edit page. --- .../components/document-detail/document-detail.component.html | 2 +- .../components/document-detail/document-detail.component.scss | 3 ++- 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/src-ui/src/app/components/document-detail/document-detail.component.html b/src-ui/src/app/components/document-detail/document-detail.component.html index 783881583..42619845c 100644 --- a/src-ui/src/app/components/document-detail/document-detail.component.html +++ b/src-ui/src/app/components/document-detail/document-detail.component.html @@ -112,7 +112,7 @@ -
+

Your browser does not support PDFs. Download the PDF.

diff --git a/src-ui/src/app/components/document-detail/document-detail.component.scss b/src-ui/src/app/components/document-detail/document-detail.component.scss index 630a31011..b1e9fddfb 100644 --- a/src-ui/src/app/components/document-detail/document-detail.component.scss +++ b/src-ui/src/app/components/document-detail/document-detail.component.scss @@ -1,4 +1,5 @@ .document-preview { height: calc(100vh - 180px); - top: 70px + top: 70px; + position: sticky; } \ No newline at end of file From bb33ac5e9e3d81b2c6d86f67b3475f89137061c5 Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Tue, 8 Dec 2020 01:12:03 +0100 Subject: [PATCH 021/522] fixees #77 --- .../app/components/document-list/document-list.component.html | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src-ui/src/app/components/document-list/document-list.component.html b/src-ui/src/app/components/document-list/document-list.component.html index 881a28dbf..8608ed92b 100644 --- a/src-ui/src/app/components/document-list/document-list.component.html +++ b/src-ui/src/app/components/document-list/document-list.component.html @@ -105,7 +105,7 @@ - {{d.title}} + {{d.title}} From c240fa18839e9c0a4c4f9bf7000da619565f12aa Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Tue, 8 Dec 2020 11:53:58 +0100 Subject: [PATCH 022/522] changelog --- docs/changelog.rst | 28 ++++++++++++++++++++++++++++ 1 file changed, 28 insertions(+) diff --git a/docs/changelog.rst b/docs/changelog.rst index 116c2e07c..b6f4295b1 100644 --- a/docs/changelog.rst +++ b/docs/changelog.rst @@ -5,6 +5,34 @@ Changelog ********* +paperless-ng 0.9.6 +################## + +This release focusses primarily on many small issues with the UI. + +* Front end + + * Paperless now has proper window titles. + * Fixed an issue with the small cards when more than 7 tags were used. + * Navigation of the "Show all" links adjusted. + * Some indication on the document lists that a filter is active was added. + * There's a new filter to filter for documents that do *not* have a certain tag. + * The file upload box now shows upload progress. + * The document edit page was reorganized. + * Table issues with too long document titles fixed. + +* API + + * The API now serves file names with documents. + +* Other + + * Fixed an issue with the docker image when a non-standard PostgreSQL port was used. + * ``FILENAME_FORMAT`` placeholder for document types. + * The filename formatter is now less restrictive with file names and tries to + conserve the original correspondents, types and titles as much as possible. + + paperless-ng 0.9.5 ################## From 9da11f29c7ca1f2a9df5feb5e386015ef78c6e3f Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Tue, 8 Dec 2020 13:54:35 +0100 Subject: [PATCH 023/522] fixes #90 --- Pipfile | 1 + Pipfile.lock | 37 +++-- docs/changelog.rst | 2 + src/documents/consumer.py | 57 +++---- src/documents/file_handling.py | 23 ++- .../management/commands/document_importer.py | 25 +-- src/documents/signals/handlers.py | 143 ++++++++++-------- src/documents/tests/test_consumer.py | 6 +- src/documents/tests/test_file_handling.py | 95 ++++++++---- src/paperless/settings.py | 4 + 10 files changed, 245 insertions(+), 148 deletions(-) diff --git a/Pipfile b/Pipfile index 2e86f2a42..830604a8d 100644 --- a/Pipfile +++ b/Pipfile @@ -19,6 +19,7 @@ django-extensions = "*" django-filter = "~=2.4.0" django-q = "~=1.3.4" djangorestframework = "~=3.12.2" +filelock = "*" fuzzywuzzy = "*" gunicorn = "*" imap-tools = "*" diff --git a/Pipfile.lock b/Pipfile.lock index 6158a70e0..198351237 100644 --- a/Pipfile.lock +++ b/Pipfile.lock @@ -1,7 +1,7 @@ { "_meta": { "hash": { - "sha256": "b10db53eb22d917723aa6107ff0970dc4e2aa886ee03d3ae08a994a856d57986" + "sha256": "3c187671ead11714d48b56f4714b145f68814e09edea818610b87f18b4f7f6fd" }, "pipfile-spec": 6, "requires": { @@ -197,6 +197,14 @@ "index": "pypi", "version": "==3.12.2" }, + "filelock": { + "hashes": [ + "sha256:18d82244ee114f543149c66a6e0c14e9c4f8a1044b5cdaadd0f82159d6a6ff59", + "sha256:929b7d63ec5b7d6b71b0fa5ac14e030b3f70b75747cef1b10da9b879fef15836" + ], + "index": "pypi", + "version": "==3.0.12" + }, "fuzzywuzzy": { "hashes": [ "sha256:45016e92264780e58972dca1b3d939ac864b78437422beecebb3095f8efd00e8", @@ -858,10 +866,10 @@ }, "certifi": { "hashes": [ - "sha256:1f422849db327d534e3d0c5f02a263458c3955ec0aae4ff09b95f195c59f4edd", - "sha256:f05def092c44fbf25834a51509ef6e631dc19765ab8a57b4e7ab85531f0a9cf4" + "sha256:1a4995114262bffbc2413b159f2a1a480c969de6e6eb13ee966d470af86af59c", + "sha256:719a74fb9e33b9bd44cc7f3a8d94bc35e4049deebe19ba7d8e108280cfd59830" ], - "version": "==2020.11.8" + "version": "==2020.12.5" }, "chardet": { "hashes": [ @@ -961,17 +969,18 @@ }, "faker": { "hashes": [ - "sha256:7bca5b074299ac6532be2f72979e6793f1a2403ca8105cb4cf0b385a964469c4", - "sha256:fb21a76064847561033d8cab1cfd11af436ddf2c6fe72eb51b3cda51dff86bdc" + "sha256:1fcb415562ee6e2395b041e85fa6901d4708d30b84d54015226fa754ed0822c3", + "sha256:e8beccb398ee9b8cc1a91d9295121d66512b6753b4846eb1e7370545d46b3311" ], - "markers": "python_version >= '3.5'", - "version": "==5.0.0" + "markers": "python_version >= '3.6'", + "version": "==5.0.1" }, "filelock": { "hashes": [ "sha256:18d82244ee114f543149c66a6e0c14e9c4f8a1044b5cdaadd0f82159d6a6ff59", "sha256:929b7d63ec5b7d6b71b0fa5ac14e030b3f70b75747cef1b10da9b879fef15836" ], + "index": "pypi", "version": "==3.0.12" }, "idna": { @@ -1100,11 +1109,11 @@ }, "pygments": { "hashes": [ - "sha256:381985fcc551eb9d37c52088a32914e00517e57f4a21609f48141ba08e193fa0", - "sha256:88a0bbcd659fcb9573703957c6b9cff9fab7295e6e76db54c9d00ae42df32773" + "sha256:ccf3acacf3782cbed4a989426012f1c535c9a90d3a7fc3f16d231b9372d2b716", + "sha256:f275b6c0909e5dafd2d6269a656aa90fa58ebf4a74f8fcf9053195d226b24a08" ], "markers": "python_version >= '3.5'", - "version": "==2.7.2" + "version": "==2.7.3" }, "pyparsing": { "hashes": [ @@ -1313,11 +1322,11 @@ }, "virtualenv": { "hashes": [ - "sha256:07cff122e9d343140366055f31be4dcd61fd598c69d11cd33a9d9c8df4546dd7", - "sha256:e0aac7525e880a429764cefd3aaaff54afb5d9f25c82627563603f5d7de5a6e5" + "sha256:54b05fc737ea9c9ee9f8340f579e5da5b09fb64fd010ab5757eb90268616907c", + "sha256:b7a8ec323ee02fb2312f098b6b4c9de99559b462775bc8fe3627a73706603c1b" ], "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3'", - "version": "==20.2.1" + "version": "==20.2.2" }, "zipp": { "hashes": [ diff --git a/docs/changelog.rst b/docs/changelog.rst index b6f4295b1..2e3ed07f6 100644 --- a/docs/changelog.rst +++ b/docs/changelog.rst @@ -31,6 +31,8 @@ This release focusses primarily on many small issues with the UI. * ``FILENAME_FORMAT`` placeholder for document types. * The filename formatter is now less restrictive with file names and tries to conserve the original correspondents, types and titles as much as possible. + * The filename formatter does not include the document ID in filenames anymore. It will + rather append ``_01``, ``_02``, etc when it detects duplicate filenames. paperless-ng 0.9.5 diff --git a/src/documents/consumer.py b/src/documents/consumer.py index 7bae5c2a9..23d17abc9 100755 --- a/src/documents/consumer.py +++ b/src/documents/consumer.py @@ -8,13 +8,14 @@ from django.conf import settings from django.db import transaction from django.db.models import Q from django.utils import timezone +from filelock import FileLock from .classifier import DocumentClassifier, IncompatibleClassifierVersionError -from .file_handling import create_source_path_directory +from .file_handling import create_source_path_directory, \ + generate_unique_filename from .loggers import LoggingMixin from .models import Document, FileInfo, Correspondent, DocumentType, Tag -from .parsers import ParseError, get_parser_class_for_mime_type, \ - get_supported_file_extensions, parse_date +from .parsers import ParseError, get_parser_class_for_mime_type, parse_date from .signals import ( document_consumption_finished, document_consumption_started @@ -38,6 +39,10 @@ class Consumer(LoggingMixin): def pre_check_file_exists(self): if not os.path.isfile(self.path): + self.log( + "error", + "Cannot consume {}: It is not a file.".format(self.path) + ) raise ConsumerError("Cannot consume {}: It is not a file".format( self.path)) @@ -47,6 +52,10 @@ class Consumer(LoggingMixin): if Document.objects.filter(Q(checksum=checksum) | Q(archive_checksum=checksum)).exists(): # NOQA: E501 if settings.CONSUMER_DELETE_DUPLICATES: os.unlink(self.path) + self.log( + "error", + "Not consuming {}: It is a duplicate.".format(self.filename) + ) raise ConsumerError( "Not consuming {}: It is a duplicate.".format(self.filename) ) @@ -148,8 +157,9 @@ class Consumer(LoggingMixin): classifier = DocumentClassifier() classifier.reload() except (FileNotFoundError, IncompatibleClassifierVersionError) as e: - logging.getLogger(__name__).warning( - "Cannot classify documents: {}.".format(e)) + self.log( + "warning", + f"Cannot classify documents: {e}.") classifier = None # now that everything is done, we can start to store the document @@ -176,31 +186,26 @@ class Consumer(LoggingMixin): # After everything is in the database, copy the files into # place. If this fails, we'll also rollback the transaction. + with FileLock(settings.MEDIA_LOCK): + document.filename = generate_unique_filename( + document, settings.ORIGINALS_DIR) + create_source_path_directory(document.source_path) - # TODO: not required, since this is done by the file handling - # logic - create_source_path_directory(document.source_path) - - self._write(document.storage_type, - self.path, document.source_path) - - self._write(document.storage_type, - thumbnail, document.thumbnail_path) - - if archive_path and os.path.isfile(archive_path): self._write(document.storage_type, - archive_path, document.archive_path) + self.path, document.source_path) - with open(archive_path, 'rb') as f: - document.archive_checksum = hashlib.md5( - f.read()).hexdigest() - document.save() + self._write(document.storage_type, + thumbnail, document.thumbnail_path) + + if archive_path and os.path.isfile(archive_path): + create_source_path_directory(document.archive_path) + self._write(document.storage_type, + archive_path, document.archive_path) + + with open(archive_path, 'rb') as f: + document.archive_checksum = hashlib.md5( + f.read()).hexdigest() - # Afte performing all database operations and moving files - # into place, tell paperless where the file is. - document.filename = os.path.basename(document.source_path) - # Saving the document now will trigger the filename handling - # logic. document.save() # Delete the file only if it was successfully consumed diff --git a/src/documents/file_handling.py b/src/documents/file_handling.py index a6d2f3ef4..c5efc33e4 100644 --- a/src/documents/file_handling.py +++ b/src/documents/file_handling.py @@ -70,7 +70,22 @@ def many_to_dictionary(field): return mydictionary -def generate_filename(doc): +def generate_unique_filename(doc, root): + counter = 0 + + while True: + new_filename = generate_filename(doc, counter) + if new_filename == doc.filename: + # still the same as before. + return new_filename + + if os.path.exists(os.path.join(root, new_filename)): + counter += 1 + else: + return new_filename + + +def generate_filename(doc, counter=0): path = "" try: @@ -112,11 +127,11 @@ def generate_filename(doc): f"Invalid PAPERLESS_FILENAME_FORMAT: " f"{settings.PAPERLESS_FILENAME_FORMAT}, falling back to default") - # Always append the primary key to guarantee uniqueness of filename + counter_str = f"_{counter:02}" if counter else "" if len(path) > 0: - filename = "%s-%07i%s" % (path, doc.pk, doc.file_type) + filename = f"{path}{counter_str}{doc.file_type}" else: - filename = "%07i%s" % (doc.pk, doc.file_type) + filename = f"{doc.pk:07}{counter_str}{doc.file_type}" # Append .gpg for encrypted files if doc.storage_type == doc.STORAGE_TYPE_GPG: diff --git a/src/documents/management/commands/document_importer.py b/src/documents/management/commands/document_importer.py index ca8c8bf06..70d05d98b 100644 --- a/src/documents/management/commands/document_importer.py +++ b/src/documents/management/commands/document_importer.py @@ -5,11 +5,13 @@ import shutil from django.conf import settings from django.core.management import call_command from django.core.management.base import BaseCommand, CommandError +from filelock import FileLock from documents.models import Document from documents.settings import EXPORTER_FILE_NAME, EXPORTER_THUMBNAIL_NAME, \ EXPORTER_ARCHIVE_NAME -from ...file_handling import generate_filename, create_source_path_directory +from ...file_handling import create_source_path_directory, \ + generate_unique_filename from ...mixins import Renderable @@ -114,17 +116,20 @@ class Command(Renderable, BaseCommand): document.storage_type = Document.STORAGE_TYPE_UNENCRYPTED - document.filename = generate_filename(document) + with FileLock(settings.MEDIA_LOCK): + document.filename = generate_unique_filename( + document, settings.ORIGINALS_DIR) - if os.path.isfile(document.source_path): - raise FileExistsError(document.source_path) + if os.path.isfile(document.source_path): + raise FileExistsError(document.source_path) - create_source_path_directory(document.source_path) + create_source_path_directory(document.source_path) - print(f"Moving {document_path} to {document.source_path}") - shutil.copy(document_path, document.source_path) - shutil.copy(thumbnail_path, document.thumbnail_path) - if archive_path: - shutil.copy(archive_path, document.archive_path) + print(f"Moving {document_path} to {document.source_path}") + shutil.copy(document_path, document.source_path) + shutil.copy(thumbnail_path, document.thumbnail_path) + if archive_path: + create_source_path_directory(document.archive_path) + shutil.copy(archive_path, document.archive_path) document.save() diff --git a/src/documents/signals/handlers.py b/src/documents/signals/handlers.py index 32119a0a3..8a9ce18d7 100755 --- a/src/documents/signals/handlers.py +++ b/src/documents/signals/handlers.py @@ -9,11 +9,13 @@ from django.contrib.contenttypes.models import ContentType from django.db import models, DatabaseError from django.dispatch import receiver from django.utils import timezone +from filelock import FileLock from rest_framework.reverse import reverse from .. import index, matching -from ..file_handling import delete_empty_directories, generate_filename, \ - create_source_path_directory, archive_name_from_filename +from ..file_handling import delete_empty_directories, \ + create_source_path_directory, archive_name_from_filename, \ + generate_unique_filename from ..models import Document, Tag @@ -226,81 +228,94 @@ def update_filename_and_move_files(sender, instance, **kwargs): # This will in turn cause this logic to move the file where it belongs. return - old_filename = instance.filename - new_filename = generate_filename(instance) + with FileLock(settings.MEDIA_LOCK): + old_filename = instance.filename + new_filename = generate_unique_filename( + instance, settings.ORIGINALS_DIR) - if new_filename == instance.filename: - # Don't do anything if its the same. - return - - old_source_path = instance.source_path - new_source_path = os.path.join(settings.ORIGINALS_DIR, new_filename) - - if not validate_move(instance, old_source_path, new_source_path): - return - - # archive files are optional, archive checksum tells us if we have one, - # since this is None for documents without archived files. - if instance.archive_checksum: - new_archive_filename = archive_name_from_filename(new_filename) - old_archive_path = instance.archive_path - new_archive_path = os.path.join(settings.ARCHIVE_DIR, - new_archive_filename) - - if not validate_move(instance, old_archive_path, new_archive_path): + if new_filename == instance.filename: + # Don't do anything if its the same. return - create_source_path_directory(new_archive_path) - else: - old_archive_path = None - new_archive_path = None + old_source_path = instance.source_path + new_source_path = os.path.join(settings.ORIGINALS_DIR, new_filename) - create_source_path_directory(new_source_path) + if not validate_move(instance, old_source_path, new_source_path): + return - try: - os.rename(old_source_path, new_source_path) + # archive files are optional, archive checksum tells us if we have one, + # since this is None for documents without archived files. if instance.archive_checksum: - os.rename(old_archive_path, new_archive_path) - instance.filename = new_filename - # Don't save here to prevent infinite recursion. - Document.objects.filter(pk=instance.pk).update(filename=new_filename) + new_archive_filename = archive_name_from_filename(new_filename) + old_archive_path = instance.archive_path + new_archive_path = os.path.join(settings.ARCHIVE_DIR, + new_archive_filename) - logging.getLogger(__name__).debug( - f"Moved file {old_source_path} to {new_source_path}.") + if not validate_move(instance, old_archive_path, new_archive_path): + return - if instance.archive_checksum: - logging.getLogger(__name__).debug( - f"Moved file {old_archive_path} to {new_archive_path}.") + create_source_path_directory(new_archive_path) + else: + old_archive_path = None + new_archive_path = None + + create_source_path_directory(new_source_path) - except OSError as e: - instance.filename = old_filename - # this happens when we can't move a file. If that's the case for the - # archive file, we try our best to revert the changes. try: + os.rename(old_source_path, new_source_path) + if instance.archive_checksum: + os.rename(old_archive_path, new_archive_path) + instance.filename = new_filename + + # Don't save() here to prevent infinite recursion. + Document.objects.filter(pk=instance.pk).update( + filename=new_filename) + + logging.getLogger(__name__).debug( + f"Moved file {old_source_path} to {new_source_path}.") + + if instance.archive_checksum: + logging.getLogger(__name__).debug( + f"Moved file {old_archive_path} to {new_archive_path}.") + + except OSError as e: + instance.filename = old_filename + # this happens when we can't move a file. If that's the case for + # the archive file, we try our best to revert the changes. + # no need to save the instance, the update() has not happened yet. + try: + os.rename(new_source_path, old_source_path) + os.rename(new_archive_path, old_archive_path) + except Exception as e: + # This is fine, since: + # A: if we managed to move source from A to B, we will also + # manage to move it from B to A. If not, we have a serious + # issue that's going to get caught by the santiy checker. + # All files remain in place and will never be overwritten, + # so this is not the end of the world. + # B: if moving the orignal file failed, nothing has changed + # anyway. + pass + except DatabaseError as e: + # this happens after moving files, so move them back into place. + # since moving them once succeeded, it's very likely going to + # succeed again. os.rename(new_source_path, old_source_path) - os.rename(new_archive_path, old_archive_path) - except Exception as e: - # This is fine, since: - # A: if we managed to move source from A to B, we will also manage - # to move it from B to A. If not, we have a serious issue - # that's going to get caught by the santiy checker. - # all files remain in place and will never be overwritten, - # so this is not the end of the world. - # B: if moving the orignal file failed, nothing has changed anyway. - pass - except DatabaseError as e: - os.rename(new_source_path, old_source_path) - if instance.archive_checksum: - os.rename(new_archive_path, old_archive_path) - instance.filename = old_filename + if instance.archive_checksum: + os.rename(new_archive_path, old_archive_path) + instance.filename = old_filename + # again, no need to save the instance, since the actual update() + # operation failed. - if not os.path.isfile(old_source_path): - delete_empty_directories(os.path.dirname(old_source_path), - root=settings.ORIGINALS_DIR) + # finally, remove any empty sub folders. This will do nothing if + # something has failed above. + if not os.path.isfile(old_source_path): + delete_empty_directories(os.path.dirname(old_source_path), + root=settings.ORIGINALS_DIR) - if old_archive_path and not os.path.isfile(old_archive_path): - delete_empty_directories(os.path.dirname(old_archive_path), - root=settings.ARCHIVE_DIR) + if old_archive_path and not os.path.isfile(old_archive_path): + delete_empty_directories(os.path.dirname(old_archive_path), + root=settings.ARCHIVE_DIR) def set_log_entry(sender, document=None, logging_group=None, **kwargs): diff --git a/src/documents/tests/test_consumer.py b/src/documents/tests/test_consumer.py index f785bc695..f828d3e11 100644 --- a/src/documents/tests/test_consumer.py +++ b/src/documents/tests/test_consumer.py @@ -598,10 +598,10 @@ class TestConsumer(DirectoriesMixin, TestCase): self.assertEqual(document.title, "new docs") self.assertEqual(document.correspondent.name, "Bank") - self.assertEqual(document.filename, "Bank/new docs-0000001.pdf") + self.assertEqual(document.filename, "Bank/new docs.pdf") @override_settings(PAPERLESS_FILENAME_FORMAT="{correspondent}/{title}") - @mock.patch("documents.signals.handlers.generate_filename") + @mock.patch("documents.signals.handlers.generate_unique_filename") def testFilenameHandlingUnstableFormat(self, m): filenames = ["this", "that", "now this", "i cant decide"] @@ -611,7 +611,7 @@ class TestConsumer(DirectoriesMixin, TestCase): filenames.insert(0, f) return f - m.side_effect = lambda f: get_filename() + m.side_effect = lambda f, root: get_filename() filename = self.get_test_file() diff --git a/src/documents/tests/test_file_handling.py b/src/documents/tests/test_file_handling.py index 4ed93d1d4..f0a74ca4f 100644 --- a/src/documents/tests/test_file_handling.py +++ b/src/documents/tests/test_file_handling.py @@ -40,13 +40,13 @@ class TestFileHandling(DirectoriesMixin, TestCase): document.filename = generate_filename(document) # Ensure that filename is properly generated - self.assertEqual(document.filename, "none/none-{:07d}.pdf".format(document.pk)) + self.assertEqual(document.filename, "none/none.pdf") # Enable encryption and check again document.storage_type = Document.STORAGE_TYPE_GPG document.filename = generate_filename(document) self.assertEqual(document.filename, - "none/none-{:07d}.pdf.gpg".format(document.pk)) + "none/none.pdf.gpg") document.save() @@ -62,7 +62,7 @@ class TestFileHandling(DirectoriesMixin, TestCase): # Check proper handling of files self.assertEqual(os.path.isdir(settings.ORIGINALS_DIR + "/test"), True) self.assertEqual(os.path.isdir(settings.ORIGINALS_DIR + "/none"), False) - self.assertEqual(os.path.isfile(settings.ORIGINALS_DIR + "/test/test-{:07d}.pdf.gpg".format(document.pk)), True) + self.assertEqual(os.path.isfile(settings.ORIGINALS_DIR + "/test/test.pdf.gpg"), True) @override_settings(PAPERLESS_FILENAME_FORMAT="{correspondent}/{correspondent}") def test_file_renaming_missing_permissions(self): @@ -74,12 +74,12 @@ class TestFileHandling(DirectoriesMixin, TestCase): # Ensure that filename is properly generated document.filename = generate_filename(document) self.assertEqual(document.filename, - "none/none-{:07d}.pdf".format(document.pk)) + "none/none.pdf") create_source_path_directory(document.source_path) Path(document.source_path).touch() # Test source_path - self.assertEqual(document.source_path, settings.ORIGINALS_DIR + "/none/none-{:07d}.pdf".format(document.pk)) + self.assertEqual(document.source_path, settings.ORIGINALS_DIR + "/none/none.pdf") # Make the folder read- and execute-only (no writing and no renaming) os.chmod(settings.ORIGINALS_DIR + "/none", 0o555) @@ -89,8 +89,8 @@ class TestFileHandling(DirectoriesMixin, TestCase): document.save() # Check proper handling of files - self.assertEqual(os.path.isfile(settings.ORIGINALS_DIR + "/none/none-{:07d}.pdf".format(document.pk)), True) - self.assertEqual(document.filename, "none/none-{:07d}.pdf".format(document.pk)) + self.assertEqual(os.path.isfile(settings.ORIGINALS_DIR + "/none/none.pdf"), True) + self.assertEqual(document.filename, "none/none.pdf") os.chmod(settings.ORIGINALS_DIR + "/none", 0o777) @@ -108,7 +108,7 @@ class TestFileHandling(DirectoriesMixin, TestCase): # Ensure that filename is properly generated document.filename = generate_filename(document) self.assertEqual(document.filename, - "none/none-{:07d}.pdf".format(document.pk)) + "none/none.pdf") create_source_path_directory(document.source_path) Path(document.source_path).touch() @@ -125,8 +125,8 @@ class TestFileHandling(DirectoriesMixin, TestCase): # Check proper handling of files self.assertTrue(os.path.isfile(document.source_path)) - self.assertEqual(os.path.isfile(settings.ORIGINALS_DIR + "/none/none-{:07d}.pdf".format(document.pk)), True) - self.assertEqual(document.filename, "none/none-{:07d}.pdf".format(document.pk)) + self.assertEqual(os.path.isfile(settings.ORIGINALS_DIR + "/none/none.pdf"), True) + self.assertEqual(document.filename, "none/none.pdf") @override_settings(PAPERLESS_FILENAME_FORMAT="{correspondent}/{correspondent}") def test_document_delete(self): @@ -138,7 +138,7 @@ class TestFileHandling(DirectoriesMixin, TestCase): # Ensure that filename is properly generated document.filename = generate_filename(document) self.assertEqual(document.filename, - "none/none-{:07d}.pdf".format(document.pk)) + "none/none.pdf") create_source_path_directory(document.source_path) Path(document.source_path).touch() @@ -146,7 +146,7 @@ class TestFileHandling(DirectoriesMixin, TestCase): # Ensure file deletion after delete pk = document.pk document.delete() - self.assertEqual(os.path.isfile(settings.ORIGINALS_DIR + "/none/none-{:07d}.pdf".format(pk)), False) + self.assertEqual(os.path.isfile(settings.ORIGINALS_DIR + "/none/none.pdf"), False) self.assertEqual(os.path.isdir(settings.ORIGINALS_DIR + "/none"), False) @override_settings(PAPERLESS_FILENAME_FORMAT="{correspondent}/{correspondent}") @@ -168,7 +168,7 @@ class TestFileHandling(DirectoriesMixin, TestCase): # Ensure that filename is properly generated document.filename = generate_filename(document) self.assertEqual(document.filename, - "none/none-{:07d}.pdf".format(document.pk)) + "none/none.pdf") create_source_path_directory(document.source_path) @@ -199,7 +199,7 @@ class TestFileHandling(DirectoriesMixin, TestCase): # Ensure that filename is properly generated self.assertEqual(generate_filename(document), - "demo-{:07d}.pdf".format(document.pk)) + "demo.pdf") @override_settings(PAPERLESS_FILENAME_FORMAT="{tags[type]}") def test_tags_with_dash(self): @@ -215,7 +215,7 @@ class TestFileHandling(DirectoriesMixin, TestCase): # Ensure that filename is properly generated self.assertEqual(generate_filename(document), - "demo-{:07d}.pdf".format(document.pk)) + "demo.pdf") @override_settings(PAPERLESS_FILENAME_FORMAT="{tags[type]}") def test_tags_malformed(self): @@ -231,7 +231,7 @@ class TestFileHandling(DirectoriesMixin, TestCase): # Ensure that filename is properly generated self.assertEqual(generate_filename(document), - "none-{:07d}.pdf".format(document.pk)) + "none.pdf") @override_settings(PAPERLESS_FILENAME_FORMAT="{tags[0]}") def test_tags_all(self): @@ -246,7 +246,7 @@ class TestFileHandling(DirectoriesMixin, TestCase): # Ensure that filename is properly generated self.assertEqual(generate_filename(document), - "demo-{:07d}.pdf".format(document.pk)) + "demo.pdf") @override_settings(PAPERLESS_FILENAME_FORMAT="{tags[1]}") def test_tags_out_of_bounds(self): @@ -261,7 +261,7 @@ class TestFileHandling(DirectoriesMixin, TestCase): # Ensure that filename is properly generated self.assertEqual(generate_filename(document), - "none-{:07d}.pdf".format(document.pk)) + "none.pdf") @override_settings(PAPERLESS_FILENAME_FORMAT="{correspondent}/{correspondent}/{correspondent}") def test_nested_directory_cleanup(self): @@ -272,7 +272,7 @@ class TestFileHandling(DirectoriesMixin, TestCase): # Ensure that filename is properly generated document.filename = generate_filename(document) - self.assertEqual(document.filename, "none/none/none-{:07d}.pdf".format(document.pk)) + self.assertEqual(document.filename, "none/none/none.pdf") create_source_path_directory(document.source_path) Path(document.source_path).touch() @@ -282,7 +282,7 @@ class TestFileHandling(DirectoriesMixin, TestCase): pk = document.pk document.delete() - self.assertEqual(os.path.isfile(settings.ORIGINALS_DIR + "/none/none/none-{:07d}.pdf".format(pk)), False) + self.assertEqual(os.path.isfile(settings.ORIGINALS_DIR + "/none/none/none.pdf"), False) self.assertEqual(os.path.isdir(settings.ORIGINALS_DIR + "/none/none"), False) self.assertEqual(os.path.isdir(settings.ORIGINALS_DIR + "/none"), False) self.assertEqual(os.path.isdir(settings.ORIGINALS_DIR), True) @@ -330,6 +330,48 @@ class TestFileHandling(DirectoriesMixin, TestCase): self.assertEqual(generate_filename(document), "0000001.pdf") + @override_settings(PAPERLESS_FILENAME_FORMAT="{title}") + def test_duplicates(self): + document = Document.objects.create(mime_type="application/pdf", title="qwe", checksum="A", pk=1) + document2 = Document.objects.create(mime_type="application/pdf", title="qwe", checksum="B", pk=2) + Path(document.source_path).touch() + Path(document2.source_path).touch() + document.filename = "0000001.pdf" + document.save() + + self.assertTrue(os.path.isfile(document.source_path)) + self.assertEqual(document.filename, "qwe.pdf") + + document2.filename = "0000002.pdf" + document2.save() + + self.assertTrue(os.path.isfile(document.source_path)) + self.assertEqual(document2.filename, "qwe_01.pdf") + + # saving should not change the file names. + + document.save() + + self.assertTrue(os.path.isfile(document.source_path)) + self.assertEqual(document.filename, "qwe.pdf") + + document2.save() + + self.assertTrue(os.path.isfile(document.source_path)) + self.assertEqual(document2.filename, "qwe_01.pdf") + + document.delete() + + self.assertFalse(os.path.isfile(document.source_path)) + + # filename free, should remove _01 suffix + + document2.save() + + self.assertTrue(os.path.isfile(document.source_path)) + self.assertEqual(document2.filename, "qwe.pdf") + + class TestFileHandlingWithArchive(DirectoriesMixin, TestCase): @@ -358,15 +400,14 @@ class TestFileHandlingWithArchive(DirectoriesMixin, TestCase): self.assertFalse(os.path.isfile(archive)) self.assertTrue(os.path.isfile(doc.source_path)) self.assertTrue(os.path.isfile(doc.archive_path)) - self.assertEqual(doc.source_path, os.path.join(settings.ORIGINALS_DIR, "none", "my_doc-0000001.pdf")) - self.assertEqual(doc.archive_path, os.path.join(settings.ARCHIVE_DIR, "none", "my_doc-0000001.pdf")) + self.assertEqual(doc.source_path, os.path.join(settings.ORIGINALS_DIR, "none", "my_doc.pdf")) + self.assertEqual(doc.archive_path, os.path.join(settings.ARCHIVE_DIR, "none", "my_doc.pdf")) @override_settings(PAPERLESS_FILENAME_FORMAT="{correspondent}/{title}") def test_move_archive_gone(self): original = os.path.join(settings.ORIGINALS_DIR, "0000001.pdf") archive = os.path.join(settings.ARCHIVE_DIR, "0000001.pdf") Path(original).touch() - #Path(archive).touch() doc = Document.objects.create(mime_type="application/pdf", title="my_doc", filename="0000001.pdf", checksum="A", archive_checksum="B") self.assertTrue(os.path.isfile(original)) @@ -381,7 +422,7 @@ class TestFileHandlingWithArchive(DirectoriesMixin, TestCase): Path(original).touch() Path(archive).touch() os.makedirs(os.path.join(settings.ARCHIVE_DIR, "none")) - Path(os.path.join(settings.ARCHIVE_DIR, "none", "my_doc-0000001.pdf")).touch() + Path(os.path.join(settings.ARCHIVE_DIR, "none", "my_doc.pdf")).touch() doc = Document.objects.create(mime_type="application/pdf", title="my_doc", filename="0000001.pdf", checksum="A", archive_checksum="B") self.assertTrue(os.path.isfile(original)) @@ -494,14 +535,14 @@ class TestFilenameGeneration(TestCase): def test_invalid_characters(self): doc = Document.objects.create(title="This. is the title.", mime_type="application/pdf", pk=1, checksum="1") - self.assertEqual(generate_filename(doc), "This. is the title-0000001.pdf") + self.assertEqual(generate_filename(doc), "This. is the title.pdf") doc = Document.objects.create(title="my\\invalid/../title:yay", mime_type="application/pdf", pk=2, checksum="2") - self.assertEqual(generate_filename(doc), "my-invalid-..-title-yay-0000002.pdf") + self.assertEqual(generate_filename(doc), "my-invalid-..-title-yay.pdf") @override_settings( PAPERLESS_FILENAME_FORMAT="{created}" ) def test_date(self): doc = Document.objects.create(title="does not matter", created=datetime.datetime(2020,5,21, 7,36,51, 153), mime_type="application/pdf", pk=2, checksum="2") - self.assertEqual(generate_filename(doc), "2020-05-21-0000002.pdf") + self.assertEqual(generate_filename(doc), "2020-05-21.pdf") diff --git a/src/paperless/settings.py b/src/paperless/settings.py index c7ecf7645..cf0c3e28d 100644 --- a/src/paperless/settings.py +++ b/src/paperless/settings.py @@ -53,6 +53,10 @@ ARCHIVE_DIR = os.path.join(MEDIA_ROOT, "documents", "archive") THUMBNAIL_DIR = os.path.join(MEDIA_ROOT, "documents", "thumbnails") DATA_DIR = os.getenv('PAPERLESS_DATA_DIR', os.path.join(BASE_DIR, "..", "data")) + +# Lock file for synchronizing changes to the MEDIA directory across multiple +# threads. +MEDIA_LOCK = os.path.join(MEDIA_ROOT, "media.lock") INDEX_DIR = os.path.join(DATA_DIR, "index") MODEL_FILE = os.path.join(DATA_DIR, "classification_model.pickle") From ad527fe97ca975d646994af9135cc673e0f6aced Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Tue, 8 Dec 2020 15:28:09 +0100 Subject: [PATCH 024/522] reading and displaying PDF metadata --- Pipfile | 1 + Pipfile.lock | 4 +- .../document-detail.component.html | 69 +++++++++++++++++-- .../document-detail.component.ts | 3 + .../app/data/paperless-document-metadata.ts | 10 +-- src/documents/tests/test_api.py | 32 +++++++++ src/documents/views.py | 46 +++++++++++-- 7 files changed, 147 insertions(+), 18 deletions(-) diff --git a/Pipfile b/Pipfile index 830604a8d..48759307c 100644 --- a/Pipfile +++ b/Pipfile @@ -27,6 +27,7 @@ langdetect = "*" pdftotext = "*" pathvalidate = "*" pillow = "*" +pikepdf = "*" python-gnupg = "*" python-dotenv = "*" python-dateutil = "*" diff --git a/Pipfile.lock b/Pipfile.lock index 198351237..1cfccb8ff 100644 --- a/Pipfile.lock +++ b/Pipfile.lock @@ -1,7 +1,7 @@ { "_meta": { "hash": { - "sha256": "3c187671ead11714d48b56f4714b145f68814e09edea818610b87f18b4f7f6fd" + "sha256": "3d576f289958226a7583e4c471c7f8c11bff6933bf093185f623cfb381a92412" }, "pipfile-spec": 6, "requires": { @@ -433,7 +433,7 @@ "sha256:fe0ca120e3347c851c34a91041d574f3c588d832023906d8ae18d66d042e8a52", "sha256:fe8e0152672f24d8bfdecc725f97e9013f2de1b41849150959526ca3562bd3ef" ], - "markers": "python_version < '3.9'", + "index": "pypi", "version": "==2.2.0" }, "pillow": { diff --git a/src-ui/src/app/components/document-detail/document-detail.component.html b/src-ui/src/app/components/document-detail/document-detail.component.html index 42619845c..e905c35e6 100644 --- a/src-ui/src/app/components/document-detail/document-detail.component.html +++ b/src-ui/src/app/components/document-detail/document-detail.component.html @@ -15,7 +15,7 @@ Download -
+
diff --git a/src-ui/src/app/components/document-detail/document-detail.component.ts b/src-ui/src/app/components/document-detail/document-detail.component.ts index cf16f01c5..329077693 100644 --- a/src-ui/src/app/components/document-detail/document-detail.component.ts +++ b/src-ui/src/app/components/document-detail/document-detail.component.ts @@ -24,6 +24,9 @@ import { DocumentTypeEditDialogComponent } from '../manage/document-type-list/do }) export class DocumentDetailComponent implements OnInit { + public expandOriginalMetadata = false; + public expandArchivedMetadata = false; + documentId: number document: PaperlessDocument metadata: PaperlessDocumentMetadata diff --git a/src-ui/src/app/data/paperless-document-metadata.ts b/src-ui/src/app/data/paperless-document-metadata.ts index 22b3f692a..12f0a78d8 100644 --- a/src-ui/src/app/data/paperless-document-metadata.ts +++ b/src-ui/src/app/data/paperless-document-metadata.ts @@ -1,11 +1,13 @@ export interface PaperlessDocumentMetadata { - paperless__checksum?: string + original_checksum?: string - paperless__mime_type?: string + archived_checksum?: string - paperless__filename?: string + original_mime_type?: string - paperless__has_archive_version?: boolean + media_filename?: string + + has_archive_version?: boolean } \ No newline at end of file diff --git a/src/documents/tests/test_api.py b/src/documents/tests/test_api.py index 986094db6..c2f9c950c 100644 --- a/src/documents/tests/test_api.py +++ b/src/documents/tests/test_api.py @@ -1,4 +1,5 @@ import os +import shutil import tempfile from unittest import mock @@ -493,3 +494,34 @@ class TestDocumentApi(DirectoriesMixin, APITestCase): self.assertEqual(response.status_code, 400) async_task.assert_not_called() + + def test_get_metadata(self): + doc = Document.objects.create(title="test", filename="file.pdf", mime_type="image/png") + + shutil.copy(os.path.join(os.path.dirname(__file__), "samples", "documents", "thumbnails", "0000001.png"), doc.source_path) + shutil.copy(os.path.join(os.path.dirname(__file__), "samples", "simple.pdf"), doc.archive_path) + + response = self.client.get(f"/api/documents/{doc.pk}/metadata/") + self.assertEqual(response.status_code, 200) + + meta = response.data + + self.assertEqual(meta['original_mime_type'], "image/png") + self.assertTrue(meta['has_archive_version']) + self.assertEqual(len(meta['original_metadata']), 0) + self.assertGreater(len(meta['archive_metadata']), 0) + + def test_get_metadata_no_archive(self): + doc = Document.objects.create(title="test", filename="file.pdf", mime_type="application/pdf") + + shutil.copy(os.path.join(os.path.dirname(__file__), "samples", "simple.pdf"), doc.source_path) + + response = self.client.get(f"/api/documents/{doc.pk}/metadata/") + self.assertEqual(response.status_code, 200) + + meta = response.data + + self.assertEqual(meta['original_mime_type'], "application/pdf") + self.assertFalse(meta['has_archive_version']) + self.assertGreater(len(meta['original_metadata']), 0) + self.assertIsNone(meta['archive_metadata']) diff --git a/src/documents/views.py b/src/documents/views.py index 7d587ed3f..e058b0f56 100755 --- a/src/documents/views.py +++ b/src/documents/views.py @@ -1,8 +1,11 @@ +import logging import os +import re import tempfile from datetime import datetime from time import mktime +import pikepdf from django.conf import settings from django.db.models import Count, Max from django.http import HttpResponse, HttpResponseBadRequest, Http404 @@ -160,16 +163,49 @@ class DocumentViewSet(RetrieveModelMixin, disposition, filename) return response + def get_metadata(self, file, type): + if not os.path.isfile(file): + return None + + namespace_pattern = re.compile(r"\{(.*)\}(.*)") + + result = [] + if type == 'application/pdf': + pdf = pikepdf.open(file) + meta = pdf.open_metadata() + for key, value in meta.items(): + if isinstance(value, list): + value = " ".join([str(e) for e in value]) + value = str(value) + try: + m = namespace_pattern.match(key) + result.append({ + "namespace": m.group(1), + "prefix": meta.REVERSE_NS[m.group(1)], + "key": m.group(2), + "value": value + }) + except Exception as e: + logging.getLogger(__name__).warning( + f"Error while reading metadata {key}: {value}. Error: " + f"{e}" + ) + return result + @action(methods=['get'], detail=True) def metadata(self, request, pk=None): try: doc = Document.objects.get(pk=pk) return Response({ - "paperless__checksum": doc.checksum, - "paperless__mime_type": doc.mime_type, - "paperless__filename": doc.filename, - "paperless__has_archive_version": - os.path.isfile(doc.archive_path) + "original_checksum": doc.checksum, + "archived_checksum": doc.archive_checksum, + "original_mime_type": doc.mime_type, + "media_filename": doc.filename, + "has_archive_version": os.path.isfile(doc.archive_path), + "original_metadata": self.get_metadata( + doc.source_path, doc.mime_type), + "archive_metadata": self.get_metadata( + doc.archive_path, "application/pdf") }) except Document.DoesNotExist: raise Http404() From 0028fde2fd4e4d1db64d537a7f784f8ce1272c38 Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Tue, 8 Dec 2020 16:09:47 +0100 Subject: [PATCH 025/522] more metadata #32 --- docs/changelog.rst | 1 + src-ui/src/app/app.module.ts | 4 +- .../document-detail.component.html | 20 +++-- src-ui/src/app/pipes/file-size.pipe.spec.ts | 8 ++ src-ui/src/app/pipes/file-size.pipe.ts | 77 +++++++++++++++++++ src/documents/tests/test_api.py | 2 +- src/documents/views.py | 21 +++-- 7 files changed, 118 insertions(+), 15 deletions(-) create mode 100644 src-ui/src/app/pipes/file-size.pipe.spec.ts create mode 100644 src-ui/src/app/pipes/file-size.pipe.ts diff --git a/docs/changelog.rst b/docs/changelog.rst index 2e3ed07f6..b6c88be92 100644 --- a/docs/changelog.rst +++ b/docs/changelog.rst @@ -19,6 +19,7 @@ This release focusses primarily on many small issues with the UI. * There's a new filter to filter for documents that do *not* have a certain tag. * The file upload box now shows upload progress. * The document edit page was reorganized. + * The document edit page shows various information about a document. * Table issues with too long document titles fixed. * API diff --git a/src-ui/src/app/app.module.ts b/src-ui/src/app/app.module.ts index e186cde50..ad12c9c47 100644 --- a/src-ui/src/app/app.module.ts +++ b/src-ui/src/app/app.module.ts @@ -47,6 +47,7 @@ import { UploadFileWidgetComponent } from './components/dashboard/widgets/upload import { WidgetFrameComponent } from './components/dashboard/widgets/widget-frame/widget-frame.component'; import { WelcomeWidgetComponent } from './components/dashboard/widgets/welcome-widget/welcome-widget.component'; import { YesNoPipe } from './pipes/yes-no.pipe'; +import { FileSizePipe } from './pipes/file-size.pipe'; @NgModule({ declarations: [ @@ -86,7 +87,8 @@ import { YesNoPipe } from './pipes/yes-no.pipe'; UploadFileWidgetComponent, WidgetFrameComponent, WelcomeWidgetComponent, - YesNoPipe + YesNoPipe, + FileSizePipe ], imports: [ BrowserModule, diff --git a/src-ui/src/app/components/document-detail/document-detail.component.html b/src-ui/src/app/components/document-detail/document-detail.component.html index e905c35e6..774ea8869 100644 --- a/src-ui/src/app/components/document-detail/document-detail.component.html +++ b/src-ui/src/app/components/document-detail/document-detail.component.html @@ -83,25 +83,29 @@ Date added {{document.added | date}} + + Media filename + {{metadata?.media_filename}} + Original MD5 Checksum {{metadata?.original_checksum}} - Archive MD5 Checksum - {{metadata?.archived_checksum}} + Original file size + {{metadata?.original_size | fileSize}} Original mime type {{metadata?.original_mime_type}} - - Is archived? - {{metadata?.has_archive_version | yesno}} + + Archive MD5 Checksum + {{metadata?.archive_checksum}} - - Media filename - {{metadata?.media_filename}} + + Archive file size + {{metadata?.archive_size | fileSize}} diff --git a/src-ui/src/app/pipes/file-size.pipe.spec.ts b/src-ui/src/app/pipes/file-size.pipe.spec.ts new file mode 100644 index 000000000..8c7a39d22 --- /dev/null +++ b/src-ui/src/app/pipes/file-size.pipe.spec.ts @@ -0,0 +1,8 @@ +import { FileSizePipe } from './file-size.pipe'; + +describe('FileSizePipe', () => { + it('create an instance', () => { + const pipe = new FileSizePipe(); + expect(pipe).toBeTruthy(); + }); +}); diff --git a/src-ui/src/app/pipes/file-size.pipe.ts b/src-ui/src/app/pipes/file-size.pipe.ts new file mode 100644 index 000000000..7d742c876 --- /dev/null +++ b/src-ui/src/app/pipes/file-size.pipe.ts @@ -0,0 +1,77 @@ +/** + * https://gist.github.com/JonCatmull/ecdf9441aaa37336d9ae2c7f9cb7289a + * + * @license + * Copyright (c) 2019 Jonathan Catmull. + * + * Permission is hereby granted, free of charge, to any person obtaining a copy + * of this software and associated documentation files (the "Software"), to deal + * in the Software without restriction, including without limitation the rights + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the Software is + * furnished to do so, subject to the following conditions: + * + * The above copyright notice and this permission notice shall be included in all + * copies or substantial portions of the Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE + * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE + * SOFTWARE. + */ +import { Pipe, PipeTransform } from '@angular/core'; + +type unit = 'bytes' | 'KB' | 'MB' | 'GB' | 'TB' | 'PB'; +type unitPrecisionMap = { + [u in unit]: number; +}; + +const defaultPrecisionMap: unitPrecisionMap = { + bytes: 0, + KB: 0, + MB: 1, + GB: 1, + TB: 2, + PB: 2 +}; + +/* + * Convert bytes into largest possible unit. + * Takes an precision argument that can be a number or a map for each unit. + * Usage: + * bytes | fileSize:precision + * @example + * // returns 1 KB + * {{ 1500 | fileSize }} + * @example + * // returns 2.1 GB + * {{ 2100000000 | fileSize }} + * @example + * // returns 1.46 KB + * {{ 1500 | fileSize:2 }} + */ +@Pipe({ name: 'fileSize' }) +export class FileSizePipe implements PipeTransform { + private readonly units: unit[] = ['bytes', 'KB', 'MB', 'GB', 'TB', 'PB']; + + transform(bytes: number = 0, precision: number | unitPrecisionMap = defaultPrecisionMap): string { + if (isNaN(parseFloat(String(bytes))) || !isFinite(bytes)) return '?'; + + let unitIndex = 0; + + while (bytes >= 1024) { + bytes /= 1024; + unitIndex++; + } + + const unit = this.units[unitIndex]; + + if (typeof precision === 'number') { + return `${bytes.toFixed(+precision)} ${unit}`; + } + return `${bytes.toFixed(precision[unit])} ${unit}`; + } +} diff --git a/src/documents/tests/test_api.py b/src/documents/tests/test_api.py index c2f9c950c..572667406 100644 --- a/src/documents/tests/test_api.py +++ b/src/documents/tests/test_api.py @@ -496,7 +496,7 @@ class TestDocumentApi(DirectoriesMixin, APITestCase): async_task.assert_not_called() def test_get_metadata(self): - doc = Document.objects.create(title="test", filename="file.pdf", mime_type="image/png") + doc = Document.objects.create(title="test", filename="file.pdf", mime_type="image/png", archive_checksum="A") shutil.copy(os.path.join(os.path.dirname(__file__), "samples", "documents", "thumbnails", "0000001.png"), doc.source_path) shutil.copy(os.path.join(os.path.dirname(__file__), "samples", "simple.pdf"), doc.archive_path) diff --git a/src/documents/views.py b/src/documents/views.py index e058b0f56..8dbb61dc7 100755 --- a/src/documents/views.py +++ b/src/documents/views.py @@ -196,17 +196,28 @@ class DocumentViewSet(RetrieveModelMixin, def metadata(self, request, pk=None): try: doc = Document.objects.get(pk=pk) - return Response({ + + meta = { "original_checksum": doc.checksum, - "archived_checksum": doc.archive_checksum, + "original_size": os.stat(doc.source_path).st_size, "original_mime_type": doc.mime_type, "media_filename": doc.filename, "has_archive_version": os.path.isfile(doc.archive_path), "original_metadata": self.get_metadata( - doc.source_path, doc.mime_type), - "archive_metadata": self.get_metadata( + doc.source_path, doc.mime_type) + } + + if doc.archive_checksum and os.path.isfile(doc.archive_path): + meta['archive_checksum'] = doc.archive_checksum + meta['archive_size'] = os.stat(doc.archive_path).st_size, + meta['archive_metadata'] = self.get_metadata( doc.archive_path, "application/pdf") - }) + else: + meta['archive_checksum'] = None + meta['archive_size'] = None + meta['archive_metadata'] = None + + return Response(meta) except Document.DoesNotExist: raise Http404() From 6613104b4fbb6c874742db85c986f13c03dd9006 Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Tue, 8 Dec 2020 16:21:38 +0100 Subject: [PATCH 026/522] date and time in metadata --- .../components/document-detail/document-detail.component.html | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src-ui/src/app/components/document-detail/document-detail.component.html b/src-ui/src/app/components/document-detail/document-detail.component.html index 774ea8869..9f4c72cdd 100644 --- a/src-ui/src/app/components/document-detail/document-detail.component.html +++ b/src-ui/src/app/components/document-detail/document-detail.component.html @@ -77,11 +77,11 @@ Date modified - {{document.modified | date}} + {{document.modified | date:'medium'}} Date added - {{document.added | date}} + {{document.added | date:'medium'}} Media filename From bf3b2249c5a7852c234686230b68d70be4d32c2f Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Tue, 8 Dec 2020 16:36:14 +0100 Subject: [PATCH 027/522] Metadata documentation --- docs/api.rst | 37 +++++++++++++++++++++++++++++++++++++ 1 file changed, 37 insertions(+) diff --git a/docs/api.rst b/docs/api.rst index 7d486df7f..d352758fa 100644 --- a/docs/api.rst +++ b/docs/api.rst @@ -71,6 +71,43 @@ supply the query parameter ``original=true``. should update your app or script to use the new URLs. +Getting document metadata +######################### + +The api also has an endpoint to retrieve read-only metadata about specific documents. this +information is not served along with the document objects, since it requires reading +files and would therefore slow down document lists considerably. + +Access the metadata of a document with an ID ``id`` at ``/api/documents//metadata/``. + +The endpoint reports the following data: + +* ``original_checksum``: MD5 checksum of the original document. +* ``original_size``: Size of the original document, in bytes. +* ``original_mime_type``: Mime type of the original document. +* ``media_filename``: Current filename of the document, under which it is stored inside the media directory. +* ``has_archive_version``: True, if this document is archived, false otherwise. +* ``original_metadata``: A list of metadata associated with the original document. See below. +* ``archive_checksum``: MD5 checksum of the archived document, or null. +* ``archive_size``: Size of the archived document in bytes, or null. +* ``archive_metadata``: Metadata associated with the archived document, or null. See below. + +File metadata is reported as a list of objects in the following form: + +.. code:: json + + [ + { + "namespace": "http://ns.adobe.com/pdf/1.3/", + "prefix": "pdf", + "key": "Producer", + "value": "SparklePDF, Fancy edition" + }, + ] + +``namespace`` and ``prefix`` can be null. The actual metadata reported depends on the file type and the metadata +available in that specific document. Paperless only reports PDF metadata at this point. + Authorization ############# From 871e22e3a34abbc89c6ed74cd13f76a8b8787177 Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Tue, 8 Dec 2020 16:45:22 +0100 Subject: [PATCH 028/522] documentation --- docs/advanced_usage.rst | 2 +- docs/changelog.rst | 11 ++++++++++- 2 files changed, 11 insertions(+), 2 deletions(-) diff --git a/docs/advanced_usage.rst b/docs/advanced_usage.rst index fca3ff4df..b5ae254b3 100644 --- a/docs/advanced_usage.rst +++ b/docs/advanced_usage.rst @@ -298,6 +298,7 @@ avoids filename clashes. Paperless provides the following placeholders withing filenames: * ``{correspondent}``: The name of the correspondent, or "none". +* ``{document_type}``: The name of the document type, or "none". * ``{title}``: The title of the document. * ``{created}``: The full date and time the document was created. * ``{created_year}``: Year created only. @@ -307,7 +308,6 @@ Paperless provides the following placeholders withing filenames: * ``{added_year}``: Year added only. * ``{added_month}``: Month added only (number 1-12). * ``{added_day}``: Day added only (number 1-31). -* ``{tags}``: I don't know how this works. Look at the source. Paperless will convert all values for the placeholders into values which are safe for use in filenames. diff --git a/docs/changelog.rst b/docs/changelog.rst index b6c88be92..96578ac75 100644 --- a/docs/changelog.rst +++ b/docs/changelog.rst @@ -14,17 +14,20 @@ This release focusses primarily on many small issues with the UI. * Paperless now has proper window titles. * Fixed an issue with the small cards when more than 7 tags were used. - * Navigation of the "Show all" links adjusted. + * Navigation of the "Show all" links adjusted. They navigate to the saved view now, if available in the sidebar. * Some indication on the document lists that a filter is active was added. * There's a new filter to filter for documents that do *not* have a certain tag. * The file upload box now shows upload progress. * The document edit page was reorganized. * The document edit page shows various information about a document. + * An issue with the height of the preview was fixed. * Table issues with too long document titles fixed. * API * The API now serves file names with documents. + * The API now serves various metadata about documents. + * API documentation updated. * Other @@ -35,6 +38,12 @@ This release focusses primarily on many small issues with the UI. * The filename formatter does not include the document ID in filenames anymore. It will rather append ``_01``, ``_02``, etc when it detects duplicate filenames. +.. note:: + + The changes to the filename format will apply to newly added documents and changed documents. + If you want all files to reflect these changes, execute the ``document_renamer`` management + command. + paperless-ng 0.9.5 ################## From d3cf85b9e970cad298691b23e4dd41cb72d742b8 Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Tue, 8 Dec 2020 17:34:29 +0100 Subject: [PATCH 029/522] Added a section on best practices. --- docs/usage_overview.rst | 57 +++++++++++++++++++++++++++++++++++++++++ 1 file changed, 57 insertions(+) diff --git a/docs/usage_overview.rst b/docs/usage_overview.rst index db50d5706..980564cba 100644 --- a/docs/usage_overview.rst +++ b/docs/usage_overview.rst @@ -183,6 +183,63 @@ You can also submit a document using the REST API, see :ref:`api-file_uploads` f .. _basic-searching: + +Best practices +############## + +Paperless offers a couple tools that help you organize your document collection. However, +it is up to you to use them in a way that helps you organize documents and find specific +documents when you need them. This section offers a couple ideas for managing your collection. + +Document types allow you to classify documents according to what they are. You can define +types such as "Receipt", "Invoice", or "Contract". If you used to collect all your receipts +in a single binder, you can recreate that system in paperless by defining a document type, +assigning documents to that type and then filtering by that type to only see all receipts. + +Not all documents need document types. Sometimes its hard to determine what the type of a +document is or it is hard to justify creating a document type that you only need once or twice. +This is okay. As long as the types you define help you organize your collection in the way +you want, paperless is doing its job. + +Tags can be used in many different ways. Think of tags are more versatile folders or binders. +If you have a binder for documents related to university / your car or health care, you can +create these binders in paperless by creating tags and assigning them to relevant documents. +Just as with documents, you can filter the document list by tags and only see documents of +a certain topic. + +With physical documents, you'll often need to decide which folder the document belongs to. +The advantage of tags over folders and binders is that a single document can have multiple +tags. A physical document cannot magically appear in two different folders, but with tags, +this is entirely possible. + +.. hint:: + + This can be used in many different ways. One example: Imagine you're working on a particular + tasks, such as signing up for university. Usually you'll need to collect a bunch of different + documents that are already sorted into various folders. With the tag system of paperless, + you can create a new group of documents that are relevant to this task without destroying + the already existing organization. When you're done with the task, you could delete the + task again, which would be equal to sorting documents back into the folder they belong into. + Or keep the tag. + +All of the logic above applies to correspondents as well. Attach them to documents if you +feel that they help you organize your collection. + +When you've started organizing your documents, create a couple saved views for document collections +you regularly access. This is equal to having labeled physical binders on your desk, except +that these saved views are dynamic and simply update themselves as you add documents to the system. + +Here are a couple examples of tags and types that you could use in your collection. + +* An ``inbox`` tag for newly added documents that you haven't manually edited yet. +* A tag ``car`` for everything car related (repairs, registration, insurance, etc) +* A tag ``todo`` for documents that you still need to do something with, such as reply, or + perform some task online. +* A tag ``bank account x`` for all bank statement related to that account. +* A tag ``mail`` for anything that you added to paperless via its mail processing capabilities. +* A tag ``missing_metadata`` when you still need to add some metadata to a document, but can't + or don't want to do this right now. + Searching ######### From 001ab88fffeb8652adda3bd098396ec449269252 Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Tue, 8 Dec 2020 17:34:38 +0100 Subject: [PATCH 030/522] docs --- docs/usage_overview.rst | 17 +++++++++++------ 1 file changed, 11 insertions(+), 6 deletions(-) diff --git a/docs/usage_overview.rst b/docs/usage_overview.rst index 980564cba..bb9ecd452 100644 --- a/docs/usage_overview.rst +++ b/docs/usage_overview.rst @@ -57,7 +57,7 @@ Adding documents to paperless ############################# Once you've got Paperless setup, you need to start feeding documents into it. -Currently, there are three options: the consumption directory, IMAP (email), and +Currently, there are four options: the consumption directory, the dashboard, IMAP (email), and HTTP POST. When adding documents to paperless, it will perform the following operations on @@ -82,8 +82,7 @@ your documents: No matter which options you choose, Paperless will always store the original document that it found in the consumption directory or in the mail and will never overwrite that document. Archived versions are stored alongside the - digital versions. - + original versions. The consumption directory @@ -107,6 +106,12 @@ files from the scanner. Typically, you're looking at an FTP server like .. TODO: hyperref to configuration of the location of this magic folder. +Dashboard upload +================ + +The dashboard has a file drop field to upload documents to paperless. Simply drag a file +onto this field or select a file with the file dialog. Multiple files are supported. + .. _usage-email: IMAP (Email) @@ -215,12 +220,12 @@ this is entirely possible. .. hint:: This can be used in many different ways. One example: Imagine you're working on a particular - tasks, such as signing up for university. Usually you'll need to collect a bunch of different + task, such as signing up for university. Usually you'll need to collect a bunch of different documents that are already sorted into various folders. With the tag system of paperless, you can create a new group of documents that are relevant to this task without destroying the already existing organization. When you're done with the task, you could delete the - task again, which would be equal to sorting documents back into the folder they belong into. - Or keep the tag. + tag again, which would be equal to sorting documents back into the folder they belong into. + Or keep the tag, up to you. All of the logic above applies to correspondents as well. Attach them to documents if you feel that they help you organize your collection. From e428a8a0087d4bf067539d44ac0031c30e80c63c Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Tue, 8 Dec 2020 17:35:51 +0100 Subject: [PATCH 031/522] file upload improvements --- .../upload-file-widget.component.ts | 17 ++++++++++------- 1 file changed, 10 insertions(+), 7 deletions(-) diff --git a/src-ui/src/app/components/dashboard/widgets/upload-file-widget/upload-file-widget.component.ts b/src-ui/src/app/components/dashboard/widgets/upload-file-widget/upload-file-widget.component.ts index 90bfbf1e5..2ea4825f1 100644 --- a/src-ui/src/app/components/dashboard/widgets/upload-file-widget/upload-file-widget.component.ts +++ b/src-ui/src/app/components/dashboard/widgets/upload-file-widget/upload-file-widget.component.ts @@ -6,7 +6,6 @@ import { Toast, ToastService } from 'src/app/services/toast.service'; interface UploadStatus { - file: string loaded: number total: number } @@ -30,11 +29,12 @@ export class UploadFileWidgetComponent implements OnInit { } uploadStatus: UploadStatus[] = [] + completedFiles = 0 uploadVisible = false get loadedSum() { - return this.uploadStatus.map(s => s.loaded).reduce((a,b) => a+b, 1) + return this.uploadStatus.map(s => s.loaded).reduce((a,b) => a+b, this.completedFiles > 0 ? 1 : 0) } get totalSum() { @@ -44,32 +44,35 @@ export class UploadFileWidgetComponent implements OnInit { public dropped(files: NgxFileDropEntry[]) { for (const droppedFile of files) { if (droppedFile.fileEntry.isFile) { - const fileEntry = droppedFile.fileEntry as FileSystemFileEntry; + let uploadStatusObject: UploadStatus = {loaded: 0, total: 1} + this.uploadStatus.push(uploadStatusObject) + this.uploadVisible = true + + const fileEntry = droppedFile.fileEntry as FileSystemFileEntry; fileEntry.file((file: File) => { let formData = new FormData() formData.append('document', file, file.name) - let uploadStatusObject: UploadStatus = {file: file.name, loaded: 0, total: 1} - this.uploadStatus.push(uploadStatusObject) - this.uploadVisible = true this.documentService.uploadDocument(formData).subscribe(event => { if (event.type == HttpEventType.UploadProgress) { uploadStatusObject.loaded = event.loaded uploadStatusObject.total = event.total } else if (event.type == HttpEventType.Response) { this.uploadStatus.splice(this.uploadStatus.indexOf(uploadStatusObject), 1) + this.completedFiles += 1 this.toastService.showToast(Toast.make("Information", "The document has been uploaded and will be processed by the consumer shortly.")) } }, error => { this.uploadStatus.splice(this.uploadStatus.indexOf(uploadStatusObject), 1) + this.completedFiles += 1 switch (error.status) { case 400: { this.toastService.showToast(Toast.makeError(`There was an error while uploading the document: ${error.error.document}`)) break; } default: { - this.toastService.showToast(Toast.makeError("An error has occured while uploading the document. Sorry!")) + this.toastService.showToast(Toast.makeError("An error has occurred while uploading the document. Sorry!")) break; } } From 550a74347c36c260f2bdcd151885468077b83859 Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Tue, 8 Dec 2020 21:08:44 +0100 Subject: [PATCH 032/522] a test that "verifies" that the file renaming lock works and no inconsistencies are created. --- src/documents/consumer.py | 2 + src/documents/tests/test_file_handling.py | 47 ++++++++++++++++++++++- 2 files changed, 48 insertions(+), 1 deletion(-) diff --git a/src/documents/consumer.py b/src/documents/consumer.py index 23d17abc9..f52dd5a7d 100755 --- a/src/documents/consumer.py +++ b/src/documents/consumer.py @@ -206,6 +206,8 @@ class Consumer(LoggingMixin): document.archive_checksum = hashlib.md5( f.read()).hexdigest() + # Don't save with the lock active. Saving will cause the file + # renaming logic to aquire the lock as well. document.save() # Delete the file only if it was successfully consumed diff --git a/src/documents/tests/test_file_handling.py b/src/documents/tests/test_file_handling.py index f0a74ca4f..6d407a7ab 100644 --- a/src/documents/tests/test_file_handling.py +++ b/src/documents/tests/test_file_handling.py @@ -1,5 +1,9 @@ import datetime +import hashlib import os +import random +import uuid +from concurrent.futures.thread import ThreadPoolExecutor from pathlib import Path from unittest import mock @@ -8,8 +12,10 @@ from django.db import DatabaseError from django.test import TestCase, override_settings from .utils import DirectoriesMixin -from ..file_handling import generate_filename, create_source_path_directory, delete_empty_directories +from ..file_handling import generate_filename, create_source_path_directory, delete_empty_directories, \ + generate_unique_filename from ..models import Document, Correspondent +from ..sanity_checker import check_sanity class TestFileHandling(DirectoriesMixin, TestCase): @@ -546,3 +552,42 @@ class TestFilenameGeneration(TestCase): def test_date(self): doc = Document.objects.create(title="does not matter", created=datetime.datetime(2020,5,21, 7,36,51, 153), mime_type="application/pdf", pk=2, checksum="2") self.assertEqual(generate_filename(doc), "2020-05-21.pdf") + + +def run(): + doc = Document.objects.create(checksum=str(uuid.uuid4()), title=str(uuid.uuid4()), content="wow") + doc.filename = generate_unique_filename(doc, settings.ORIGINALS_DIR) + Path(doc.thumbnail_path).touch() + with open(doc.source_path, "w") as f: + f.write(str(uuid.uuid4())) + with open(doc.source_path, "rb") as f: + doc.checksum = hashlib.md5(f.read()).hexdigest() + + with open(doc.archive_path, "w") as f: + f.write(str(uuid.uuid4())) + with open(doc.archive_path, "rb") as f: + doc.archive_checksum = hashlib.md5(f.read()).hexdigest() + + doc.save() + + for i in range(30): + doc.title = str(random.randrange(1, 5)) + doc.save() + + +class TestSuperMassive(DirectoriesMixin, TestCase): + + @override_settings(PAPERLESS_FILENAME_FORMAT="{title}") + def test_super_massive(self): + # try to save as many documents in parallel as possible. + # try to make the system fail. + + with ThreadPoolExecutor(max_workers=16) as executor: + results = [executor.submit(run) for i in range(16)] + + for r in results: + if r.exception(): + raise r.exception() + + # nope, everything still good. Thank you, lockfiles. + self.assertEqual(len(check_sanity()), 0) From 5753c83618a66c68b254499177cfac9354b7c517 Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Tue, 8 Dec 2020 21:20:05 +0100 Subject: [PATCH 033/522] version bump --- docker/hub/docker-compose.postgres.yml | 2 +- docker/hub/docker-compose.sqlite.yml | 2 +- src/paperless/version.py | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/docker/hub/docker-compose.postgres.yml b/docker/hub/docker-compose.postgres.yml index 295d981e1..24f0e118f 100644 --- a/docker/hub/docker-compose.postgres.yml +++ b/docker/hub/docker-compose.postgres.yml @@ -15,7 +15,7 @@ services: POSTGRES_PASSWORD: paperless webserver: - image: jonaswinkler/paperless-ng:0.9.5 + image: jonaswinkler/paperless-ng:0.9.6 restart: always depends_on: - db diff --git a/docker/hub/docker-compose.sqlite.yml b/docker/hub/docker-compose.sqlite.yml index 80df40596..6ae619fd6 100644 --- a/docker/hub/docker-compose.sqlite.yml +++ b/docker/hub/docker-compose.sqlite.yml @@ -5,7 +5,7 @@ services: restart: always webserver: - image: jonaswinkler/paperless-ng:0.9.5 + image: jonaswinkler/paperless-ng:0.9.6 restart: always depends_on: - broker diff --git a/src/paperless/version.py b/src/paperless/version.py index 26e46fea8..527e0668d 100644 --- a/src/paperless/version.py +++ b/src/paperless/version.py @@ -1 +1 @@ -__version__ = (0, 9, 5) +__version__ = (0, 9, 6) From 74a99cf33084a0688930f912cd5b2fedb938d527 Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Wed, 9 Dec 2020 00:04:37 +0100 Subject: [PATCH 034/522] removed slugs entirely, since their only purpose was purely cosmetic anyway. --- src/documents/admin.py | 8 +----- src/documents/consumer.py | 2 +- .../management/commands/document_consumer.py | 5 +--- .../migrations/1006_auto_20201208_2209.py | 25 +++++++++++++++++++ src/documents/models.py | 11 ++------ src/documents/serialisers.py | 19 +++++++++++--- src/documents/signals/handlers.py | 4 +-- src/documents/tests/test_consumer.py | 12 ++++----- src/paperless_mail/mail.py | 5 +--- 9 files changed, 55 insertions(+), 36 deletions(-) create mode 100644 src/documents/migrations/1006_auto_20201208_2209.py diff --git a/src/documents/admin.py b/src/documents/admin.py index 2a4fb0031..055a6fd93 100755 --- a/src/documents/admin.py +++ b/src/documents/admin.py @@ -17,8 +17,6 @@ class CorrespondentAdmin(admin.ModelAdmin): list_filter = ("matching_algorithm",) list_editable = ("match", "matching_algorithm") - readonly_fields = ("slug",) - class TagAdmin(admin.ModelAdmin): @@ -31,8 +29,6 @@ class TagAdmin(admin.ModelAdmin): list_filter = ("colour", "matching_algorithm") list_editable = ("colour", "match", "matching_algorithm") - readonly_fields = ("slug", ) - class DocumentTypeAdmin(admin.ModelAdmin): @@ -44,8 +40,6 @@ class DocumentTypeAdmin(admin.ModelAdmin): list_filter = ("matching_algorithm",) list_editable = ("match", "matching_algorithm") - readonly_fields = ("slug",) - class DocumentAdmin(admin.ModelAdmin): @@ -106,7 +100,7 @@ class DocumentAdmin(admin.ModelAdmin): for tag in obj.tags.all(): r += self._html_tag( "span", - tag.slug + ", " + tag.name + ", " ) return r diff --git a/src/documents/consumer.py b/src/documents/consumer.py index f52dd5a7d..19ca3ed7e 100755 --- a/src/documents/consumer.py +++ b/src/documents/consumer.py @@ -259,7 +259,7 @@ class Consumer(LoggingMixin): relevant_tags = set(file_info.tags) if relevant_tags: - tag_names = ", ".join([t.slug for t in relevant_tags]) + tag_names = ", ".join([t.name for t in relevant_tags]) self.log("debug", "Tagging with {}".format(tag_names)) document.tags.add(*relevant_tags) diff --git a/src/documents/management/commands/document_consumer.py b/src/documents/management/commands/document_consumer.py index 5cecd6bf9..b2f689aed 100644 --- a/src/documents/management/commands/document_consumer.py +++ b/src/documents/management/commands/document_consumer.py @@ -29,10 +29,7 @@ def _tags_from_path(filepath): path_parts = Path(filepath).relative_to( settings.CONSUMPTION_DIR).parent.parts for part in path_parts: - tag_ids.add(Tag.objects.get_or_create( - slug=slugify(part), - defaults={"name": part}, - )[0].pk) + tag_ids.add(Tag.objects.get_or_create(name=part)[0].pk) return tag_ids diff --git a/src/documents/migrations/1006_auto_20201208_2209.py b/src/documents/migrations/1006_auto_20201208_2209.py new file mode 100644 index 000000000..49f8c8dfe --- /dev/null +++ b/src/documents/migrations/1006_auto_20201208_2209.py @@ -0,0 +1,25 @@ +# Generated by Django 3.1.4 on 2020-12-08 22:09 + +from django.db import migrations + + +class Migration(migrations.Migration): + + dependencies = [ + ('documents', '1005_checksums'), + ] + + operations = [ + migrations.RemoveField( + model_name='correspondent', + name='slug', + ), + migrations.RemoveField( + model_name='documenttype', + name='slug', + ), + migrations.RemoveField( + model_name='tag', + name='slug', + ), + ] diff --git a/src/documents/models.py b/src/documents/models.py index 366cb215d..f0678a843 100755 --- a/src/documents/models.py +++ b/src/documents/models.py @@ -36,7 +36,6 @@ class MatchingModel(models.Model): ) name = models.CharField(max_length=128, unique=True) - slug = models.SlugField(blank=True, editable=False) match = models.CharField(max_length=256, blank=True) matching_algorithm = models.PositiveIntegerField( @@ -69,7 +68,6 @@ class MatchingModel(models.Model): def save(self, *args, **kwargs): self.match = self.match.lower() - self.slug = slugify(self.name) models.Model.save(self, *args, **kwargs) @@ -384,9 +382,7 @@ class FileInfo: def _get_correspondent(cls, name): if not name: return None - return Correspondent.objects.get_or_create(name=name, defaults={ - "slug": slugify(name) - })[0] + return Correspondent.objects.get_or_create(name=name)[0] @classmethod def _get_title(cls, title): @@ -396,10 +392,7 @@ class FileInfo: def _get_tags(cls, tags): r = [] for t in tags.split(","): - r.append(Tag.objects.get_or_create( - slug=slugify(t), - defaults={"name": t} - )[0]) + r.append(Tag.objects.get_or_create(name=t)[0]) return tuple(r) @classmethod diff --git a/src/documents/serialisers.py b/src/documents/serialisers.py index 5aedeeb58..600645061 100644 --- a/src/documents/serialisers.py +++ b/src/documents/serialisers.py @@ -1,4 +1,5 @@ import magic +from django.utils.text import slugify from pathvalidate import validate_filename, ValidationError from rest_framework import serializers from rest_framework.fields import SerializerMethodField @@ -7,12 +8,16 @@ from .models import Correspondent, Tag, Document, Log, DocumentType from .parsers import is_mime_type_supported -class CorrespondentSerializer(serializers.HyperlinkedModelSerializer): +class CorrespondentSerializer(serializers.ModelSerializer): document_count = serializers.IntegerField(read_only=True) last_correspondence = serializers.DateTimeField(read_only=True) + def get_slug(self, obj): + return slugify(obj.name) + slug = SerializerMethodField() + class Meta: model = Correspondent fields = ( @@ -27,10 +32,14 @@ class CorrespondentSerializer(serializers.HyperlinkedModelSerializer): ) -class DocumentTypeSerializer(serializers.HyperlinkedModelSerializer): +class DocumentTypeSerializer(serializers.ModelSerializer): document_count = serializers.IntegerField(read_only=True) + def get_slug(self, obj): + return slugify(obj.name) + slug = SerializerMethodField() + class Meta: model = DocumentType fields = ( @@ -44,10 +53,14 @@ class DocumentTypeSerializer(serializers.HyperlinkedModelSerializer): ) -class TagSerializer(serializers.HyperlinkedModelSerializer): +class TagSerializer(serializers.ModelSerializer): document_count = serializers.IntegerField(read_only=True) + def get_slug(self, obj): + return slugify(obj.name) + slug = SerializerMethodField() + class Meta: model = Tag fields = ( diff --git a/src/documents/signals/handlers.py b/src/documents/signals/handlers.py index 8a9ce18d7..8121072bf 100755 --- a/src/documents/signals/handlers.py +++ b/src/documents/signals/handlers.py @@ -136,7 +136,7 @@ def set_tags(sender, message = 'Tagging "{}" with "{}"' logger( - message.format(document, ", ".join([t.slug for t in relevant_tags])), + message.format(document, ", ".join([t.name for t in relevant_tags])), logging_group ) @@ -165,7 +165,7 @@ def run_post_consume_script(sender, document, **kwargs): reverse("document-download", kwargs={"pk": document.pk}), reverse("document-thumb", kwargs={"pk": document.pk}), str(document.correspondent), - str(",".join(document.tags.all().values_list("slug", flat=True))) + str(",".join(document.tags.all().values_list("name", flat=True))) )).wait() diff --git a/src/documents/tests/test_consumer.py b/src/documents/tests/test_consumer.py index f828d3e11..b4b19be4c 100644 --- a/src/documents/tests/test_consumer.py +++ b/src/documents/tests/test_consumer.py @@ -27,7 +27,7 @@ class TestAttributes(TestCase): self.assertEqual(file_info.title, title, filename) - self.assertEqual(tuple([t.slug for t in file_info.tags]), tags, filename) + self.assertEqual(tuple([t.name for t in file_info.tags]), tags, filename) def test_guess_attributes_from_name0(self): self._test_guess_attributes_from_name( @@ -188,7 +188,7 @@ class TestFieldPermutations(TestCase): self.assertEqual(info.tags, (), filename) else: self.assertEqual( - [t.slug for t in info.tags], tags.split(','), + [t.name for t in info.tags], tags.split(','), filename ) @@ -342,8 +342,8 @@ class TestFieldPermutations(TestCase): info = FileInfo.from_filename(filename) self.assertEqual(info.title, "0001") self.assertEqual(len(info.tags), 2) - self.assertEqual(info.tags[0].slug, "tag1") - self.assertEqual(info.tags[1].slug, "tag2") + self.assertEqual(info.tags[0].name, "tag1") + self.assertEqual(info.tags[1].name, "tag2") self.assertIsNone(info.created) # Complex transformation with date in replacement string @@ -356,8 +356,8 @@ class TestFieldPermutations(TestCase): info = FileInfo.from_filename(filename) self.assertEqual(info.title, "0001") self.assertEqual(len(info.tags), 2) - self.assertEqual(info.tags[0].slug, "tag1") - self.assertEqual(info.tags[1].slug, "tag2") + self.assertEqual(info.tags[0].name, "tag1") + self.assertEqual(info.tags[1].name, "tag2") self.assertEqual(info.created.year, 2019) self.assertEqual(info.created.month, 9) self.assertEqual(info.created.day, 8) diff --git a/src/paperless_mail/mail.py b/src/paperless_mail/mail.py index 08f7365da..a82c34f15 100644 --- a/src/paperless_mail/mail.py +++ b/src/paperless_mail/mail.py @@ -103,10 +103,7 @@ class MailAccountHandler(LoggingMixin): def _correspondent_from_name(self, name): try: - return Correspondent.objects.get_or_create( - name=name, defaults={ - "slug": slugify(name) - })[0] + return Correspondent.objects.get_or_create(name=name)[0] except DatabaseError as e: self.log( "error", From 0a0d462938032f70d7dcc4485474f8311475e40f Mon Sep 17 00:00:00 2001 From: jonaswinkler Date: Wed, 9 Dec 2020 00:07:22 +0100 Subject: [PATCH 035/522] tags from folders: case insensitive --- src/documents/management/commands/document_consumer.py | 4 +++- src/documents/tests/test_management_consumer.py | 2 +- 2 files changed, 4 insertions(+), 2 deletions(-) diff --git a/src/documents/management/commands/document_consumer.py b/src/documents/management/commands/document_consumer.py index b2f689aed..8ac60aa6d 100644 --- a/src/documents/management/commands/document_consumer.py +++ b/src/documents/management/commands/document_consumer.py @@ -29,7 +29,9 @@ def _tags_from_path(filepath): path_parts = Path(filepath).relative_to( settings.CONSUMPTION_DIR).parent.parts for part in path_parts: - tag_ids.add(Tag.objects.get_or_create(name=part)[0].pk) + tag_ids.add(Tag.objects.get_or_create(name__iexact=part, defaults={ + "name": part + })[0].pk) return tag_ids diff --git a/src/documents/tests/test_management_consumer.py b/src/documents/tests/test_management_consumer.py index 6973fdacf..b6a61a167 100644 --- a/src/documents/tests/test_management_consumer.py +++ b/src/documents/tests/test_management_consumer.py @@ -230,7 +230,7 @@ class TestConsumerTags(DirectoriesMixin, ConsumerMixin, TransactionTestCase): tag_names = ("existingTag", "Space Tag") # Create a Tag prior to consuming a file using it in path - tag_ids = [Tag.objects.create(name=tag_names[0]).pk,] + tag_ids = [Tag.objects.create(name="existingtag").pk,] self.t_start() From 72706a335da809122c886576f50df4528c15c75f Mon Sep 17 00:00:00 2001 From: Jonas Winkler Date: Sun, 6 Dec 2020 23:30:51 +0100 Subject: [PATCH 036/522] Update CONTRIBUTING.md --- CONTRIBUTING.md | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md index bd6080d35..a8fb1f8e9 100644 --- a/CONTRIBUTING.md +++ b/CONTRIBUTING.md @@ -24,3 +24,7 @@ feature-X branches is for experimental stuff that will eventually be merged into I'm trying to get most of paperless tested, so please do the same for your code! I know its a hassle, but it makes sure that your code works now and will allow us to detect regressions easily. To test your code, execute `pytest` in the src/ directory. Executing that in the project root is no good. This also generates a html coverage report, which you can use to see if you missed anything important during testing. + +## More info: + +... is available in the documentation. https://paperless-ng.readthedocs.io/en/latest/extending.html From f3fd0fcf72f8009e9b67cf18319e37100a97f0bb Mon Sep 17 00:00:00 2001 From: Michael Shamoon <4887959+nikonratm@users.noreply.github.com> Date: Tue, 8 Dec 2020 23:08:02 -0800 Subject: [PATCH 037/522] Basic tags, correspondents & document type dropdowns --- src-ui/src/app/app.module.ts | 4 +- .../document-list.component.html | 69 +++++++++++++++++-- .../document-list/document-list.component.ts | 30 ++++++-- src-ui/src/app/pipes/filter.pipe.ts | 17 +++++ 4 files changed, 107 insertions(+), 13 deletions(-) create mode 100644 src-ui/src/app/pipes/filter.pipe.ts diff --git a/src-ui/src/app/app.module.ts b/src-ui/src/app/app.module.ts index ad12c9c47..af2c46492 100644 --- a/src-ui/src/app/app.module.ts +++ b/src-ui/src/app/app.module.ts @@ -48,6 +48,7 @@ import { WidgetFrameComponent } from './components/dashboard/widgets/widget-fram import { WelcomeWidgetComponent } from './components/dashboard/widgets/welcome-widget/welcome-widget.component'; import { YesNoPipe } from './pipes/yes-no.pipe'; import { FileSizePipe } from './pipes/file-size.pipe'; +import { FilterPipe } from './pipes/filter.pipe'; @NgModule({ declarations: [ @@ -88,7 +89,8 @@ import { FileSizePipe } from './pipes/file-size.pipe'; WidgetFrameComponent, WelcomeWidgetComponent, YesNoPipe, - FileSizePipe + FileSizePipe, + FilterPipe ], imports: [ BrowserModule, diff --git a/src-ui/src/app/components/document-list/document-list.component.html b/src-ui/src/app/components/document-list/document-list.component.html index 8608ed92b..886b5832a 100644 --- a/src-ui/src/app/components/document-list/document-list.component.html +++ b/src-ui/src/app/components/document-list/document-list.component.html @@ -1,5 +1,4 @@ -
+
@@ -42,13 +42,14 @@
+
@@ -58,18 +59,69 @@ - +
+
+
+
+
+ + +
+ +
+ + +
+ +
+ + +
+ +
+
+
-
Filter
+
Advanced Filters
@@ -125,5 +177,12 @@
- +
+ + diff --git a/src-ui/src/app/components/document-list/document-list.component.ts b/src-ui/src/app/components/document-list/document-list.component.ts index 09e73dd96..9870f3dc1 100644 --- a/src-ui/src/app/components/document-list/document-list.component.ts +++ b/src-ui/src/app/components/document-list/document-list.component.ts @@ -11,6 +11,12 @@ import { SavedViewConfigService } from 'src/app/services/saved-view-config.servi import { Toast, ToastService } from 'src/app/services/toast.service'; import { environment } from 'src/environments/environment'; import { SaveViewConfigDialogComponent } from './save-view-config-dialog/save-view-config-dialog.component'; +import { PaperlessTag } from 'src/app/data/paperless-tag'; +import { PaperlessCorrespondent } from 'src/app/data/paperless-correspondent'; +import { PaperlessDocumentType } from 'src/app/data/paperless-document-type'; +import { TagService } from 'src/app/services/rest/tag.service'; +import { CorrespondentService } from 'src/app/services/rest/correspondent.service'; +import { DocumentTypeService } from 'src/app/services/rest/document-type.service'; @Component({ selector: 'app-document-list', @@ -25,13 +31,20 @@ export class DocumentListComponent implements OnInit { public route: ActivatedRoute, private toastService: ToastService, public modalService: NgbModal, - private titleService: Title) { } + private titleService: Title, + private tagService: TagService, + private correspondentService: CorrespondentService, + private documentTypeService: DocumentTypeService) { } displayMode = 'smallCards' // largeCards, smallCards, details filterRules: FilterRule[] = [] showFilter = false + tags: PaperlessTag[] = [] + correspondents: PaperlessCorrespondent[] = [] + documentTypes: PaperlessDocumentType[] = [] + get isFiltered() { return this.list.filterRules?.length > 0 } @@ -67,6 +80,9 @@ export class DocumentListComponent implements OnInit { this.list.clear() this.list.reload() }) + this.tagService.listAll().subscribe(result => this.tags = result.results) + this.correspondentService.listAll().subscribe(result => this.correspondents = result.results) + this.documentTypeService.listAll().subscribe(result => this.documentTypes = result.results) } applyFilterRules() { @@ -103,8 +119,8 @@ export class DocumentListComponent implements OnInit { }) } - filterByTag(tag_id: number) { - let filterRules = this.list.filterRules + filterByTag(tag_id: number, singleton: boolean = false) { + let filterRules = singleton ? [] : this.list.filterRules if (filterRules.find(rule => rule.type.id == FILTER_HAS_TAG && rule.value == tag_id)) { return } @@ -114,8 +130,8 @@ export class DocumentListComponent implements OnInit { this.applyFilterRules() } - filterByCorrespondent(correspondent_id: number) { - let filterRules = this.list.filterRules + filterByCorrespondent(correspondent_id: number, singleton: boolean = false) { + let filterRules = singleton ? [] : this.list.filterRules let existing_rule = filterRules.find(rule => rule.type.id == FILTER_CORRESPONDENT) if (existing_rule && existing_rule.value == correspondent_id) { return @@ -128,8 +144,8 @@ export class DocumentListComponent implements OnInit { this.applyFilterRules() } - filterByDocumentType(document_type_id: number) { - let filterRules = this.list.filterRules + filterByDocumentType(document_type_id: number, singleton: boolean = false) { + let filterRules = singleton ? [] : this.list.filterRules let existing_rule = filterRules.find(rule => rule.type.id == FILTER_DOCUMENT_TYPE) if (existing_rule && existing_rule.value == document_type_id) { return diff --git a/src-ui/src/app/pipes/filter.pipe.ts b/src-ui/src/app/pipes/filter.pipe.ts new file mode 100644 index 000000000..f799f40cc --- /dev/null +++ b/src-ui/src/app/pipes/filter.pipe.ts @@ -0,0 +1,17 @@ +import { Pipe, PipeTransform } from '@angular/core'; + +@Pipe({ + name: 'filter' +}) +export class FilterPipe implements PipeTransform { + transform(items: any[], searchText: string): any[] { + if (!items) return []; + if (!searchText) return items; + + return items.filter(item => { + return Object.keys(item).some(key => { + return String(item[key]).toLowerCase().includes(searchText.toLowerCase()); + }); + }); + } +} From 23ba3be68ff56f54abe8bba430d8fafa8ee25840 Mon Sep 17 00:00:00 2001 From: Michael Shamoon <4887959+nikonratm@users.noreply.github.com> Date: Tue, 8 Dec 2020 23:39:38 -0800 Subject: [PATCH 038/522] Toggling of items --- .../document-list.component.html | 15 ++++- .../document-list/document-list.component.ts | 64 +++++++++++++++++-- 2 files changed, 70 insertions(+), 9 deletions(-) diff --git a/src-ui/src/app/components/document-list/document-list.component.html b/src-ui/src/app/components/document-list/document-list.component.html index 886b5832a..7c89517be 100644 --- a/src-ui/src/app/components/document-list/document-list.component.html +++ b/src-ui/src/app/components/document-list/document-list.component.html @@ -77,7 +77,10 @@
- @@ -92,7 +95,10 @@
- @@ -107,7 +113,10 @@
- diff --git a/src-ui/src/app/components/document-list/document-list.component.ts b/src-ui/src/app/components/document-list/document-list.component.ts index 9870f3dc1..5e5134dc7 100644 --- a/src-ui/src/app/components/document-list/document-list.component.ts +++ b/src-ui/src/app/components/document-list/document-list.component.ts @@ -119,8 +119,8 @@ export class DocumentListComponent implements OnInit { }) } - filterByTag(tag_id: number, singleton: boolean = false) { - let filterRules = singleton ? [] : this.list.filterRules + filterByTag(tag_id: number) { + let filterRules = this.list.filterRules if (filterRules.find(rule => rule.type.id == FILTER_HAS_TAG && rule.value == tag_id)) { return } @@ -130,8 +130,8 @@ export class DocumentListComponent implements OnInit { this.applyFilterRules() } - filterByCorrespondent(correspondent_id: number, singleton: boolean = false) { - let filterRules = singleton ? [] : this.list.filterRules + filterByCorrespondent(correspondent_id: number) { + let filterRules = this.list.filterRules let existing_rule = filterRules.find(rule => rule.type.id == FILTER_CORRESPONDENT) if (existing_rule && existing_rule.value == correspondent_id) { return @@ -144,8 +144,8 @@ export class DocumentListComponent implements OnInit { this.applyFilterRules() } - filterByDocumentType(document_type_id: number, singleton: boolean = false) { - let filterRules = singleton ? [] : this.list.filterRules + filterByDocumentType(document_type_id: number) { + let filterRules = this.list.filterRules let existing_rule = filterRules.find(rule => rule.type.id == FILTER_DOCUMENT_TYPE) if (existing_rule && existing_rule.value == document_type_id) { return @@ -158,4 +158,56 @@ export class DocumentListComponent implements OnInit { this.applyFilterRules() } + findRuleIndex(type_id: number, value: any) { + return this.list.filterRules.findIndex(rule => rule.type.id == type_id && rule.value == value) + } + + toggleFilterByTag(tag_id: number) { + let existingRuleIndex = this.findRuleIndex(FILTER_HAS_TAG, tag_id) + if (existingRuleIndex !== -1) { + let filterRules = this.list.filterRules + filterRules.splice(existingRuleIndex, 1) + this.filterRules = filterRules + this.applyFilterRules() + } else { + this.filterByTag(tag_id) + } + } + + toggleFilterByCorrespondent(correspondent_id: number) { + let existingRuleIndex = this.findRuleIndex(FILTER_CORRESPONDENT, correspondent_id) + if (existingRuleIndex !== -1) { + let filterRules = this.list.filterRules + filterRules.splice(existingRuleIndex, 1) + this.filterRules = filterRules + this.applyFilterRules() + } else { + this.filterByCorrespondent(correspondent_id) + } + } + + toggleFilterByDocumentType(document_type_id: number) { + let existingRuleIndex = this.findRuleIndex(FILTER_DOCUMENT_TYPE, document_type_id) + if (existingRuleIndex !== -1) { + let filterRules = this.list.filterRules + filterRules.splice(existingRuleIndex, 1) + this.filterRules = filterRules + this.applyFilterRules() + } else { + this.filterByDocumentType(document_type_id) + } + } + + currentViewIncludesTag(tag_id: number) { + return this.findRuleIndex(FILTER_HAS_TAG, tag_id) !== -1 + } + + currentViewIncludesCorrespondent(correspondent_id: number) { + return this.findRuleIndex(FILTER_CORRESPONDENT, correspondent_id) !== -1 + } + + currentViewIncludesDocumentType(document_type_id: number) { + return this.findRuleIndex(FILTER_DOCUMENT_TYPE, document_type_id) !== -1 + } + } From da87542a5204db3244f2c270ac1ee82394110d71 Mon Sep 17 00:00:00 2001 From: Michael Shamoon <4887959+nikonratm@users.noreply.github.com> Date: Tue, 8 Dec 2020 23:53:19 -0800 Subject: [PATCH 039/522] Change advanced to show / hide --- .../components/document-list/document-list.component.html | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/src-ui/src/app/components/document-list/document-list.component.html b/src-ui/src/app/components/document-list/document-list.component.html index 7c89517be..58fbbcbe8 100644 --- a/src-ui/src/app/components/document-list/document-list.component.html +++ b/src-ui/src/app/components/document-list/document-list.component.html @@ -49,13 +49,13 @@ - Advanced Filters + {{ showFilter ? 'Hide' : 'Show' }} Filter Editor