Updates the pre-processing of document content to be much more robust by adding tokenization, stemming, and stop-word removal

This commit is contained in:
Trenton Holmes
2022-09-15 08:39:47 -07:00
committed by Trenton H
parent 77a3f8ed60
commit 66884ea035
4 changed files with 76 additions and 19 deletions

View File

@@ -56,6 +56,7 @@ mysqlclient = "*"
celery = {extras = ["redis"], version = "*"}
django-celery-results = "*"
setproctitle = "*"
nltk = "*"
[dev-packages]
coveralls = "*"