Fixes the download of the NLTK data and the usage of the downloaded data

This commit is contained in:
Trenton Holmes
2022-09-16 06:55:42 -07:00
committed by Trenton H
parent 3c12f13df2
commit 70b1988a55
4 changed files with 25 additions and 20 deletions

View File

@@ -306,6 +306,12 @@ class DocumentClassifier:
from nltk.corpus import stopwords
from nltk.stem import SnowballStemmer
import nltk
# Not really a hack, since nltk.data.path is public and documented:
# restrict the NLTK data search path to the single location the data should be in
nltk.data.path = [settings.NLTK_DIR]
if self.stemmer is None:
self.stemmer = SnowballStemmer("english")