From 10a05569511e040001ff4f35989ecf70381a27f3 Mon Sep 17 00:00:00 2001 From: Daniel Quinn Date: Sun, 10 Jan 2016 15:51:38 +0000 Subject: [PATCH] Updated the docstring to show what's actually happening --- src/documents/management/commands/consume.py | 11 +++++------ 1 file changed, 5 insertions(+), 6 deletions(-) diff --git a/src/documents/management/commands/consume.py b/src/documents/management/commands/consume.py index da9a1c1a3..df050fdb9 100644 --- a/src/documents/management/commands/consume.py +++ b/src/documents/management/commands/consume.py @@ -21,12 +21,11 @@ from documents.models import Document class Command(BaseCommand): """ Loop over every file found in CONSUMPTION_DIR and: - 1. Convert it to a greyscale tif - 2. Convert it to a full-colour jpg - 3. Use tesseract on the tif - 4. Store the OCR'd text in the database along with the paths to the jpg - and original pdf - 5. Delete the pdf and images + 1. Convert it to a greyscale png + 2. Use tesseract on the png + 3. Encrypt and store the PDF in the MEDIA_ROOT + 4. Store the OCR'd text in the database + 5. Delete the pdf and image(s) """ LOOP_TIME = 10 # Seconds