From dafefa33d674646a142ffb4c6fec33351e4dd7ae Mon Sep 17 00:00:00 2001 From: Trenton H Date: Wed, 5 Oct 2022 12:19:07 -0700 Subject: [PATCH] Adds step to bare metal setup regarding downloading the required NLTK data --- Pipfile.lock | 2 +- docs/setup.rst | 7 +++++++ 2 files changed, 8 insertions(+), 1 deletion(-) diff --git a/Pipfile.lock b/Pipfile.lock index 4e87ca968..d594bf62f 100644 --- a/Pipfile.lock +++ b/Pipfile.lock @@ -1,7 +1,7 @@ { "_meta": { "hash": { - "sha256": "79ef8a0dae2a57c93935fa6ee7c591b53a64cf8c6925d16dc95aa8f8a937f9c7" + "sha256": "d73f1cfcc2ea4741e109317a991b271db292e708c119c560c523b0c74401d5fb" }, "pipfile-spec": 6, "requires": {}, diff --git a/docs/setup.rst b/docs/setup.rst index 8a4adabe0..15f16d193 100644 --- a/docs/setup.rst +++ b/docs/setup.rst @@ -520,6 +520,13 @@ writing. Windows is not and will never be supported. to compile this by yourself, because this software has been patented until around 2017 and binary packages are not available for most distributions. +15. Optional: If using the NLTK machine learning processing (see ``PAPERLESS_ENABLE_NLTK`` in + :ref:`configuration` for details), download the NLTK data for the Snowball Stemmer, Stopwords + and Punkt tokenizer to your ``PAPERLESS_DATA_DIR/nltk``. Refer to + the `NLTK instructions <https://www.nltk.org/data.html>`_ for details on how to + download the data. + + Migrating to Paperless-ngx ##########################