Add unpaper as another pre-processing step

This commit is contained in:
Pit Kleyersburg
2016-02-16 10:49:55 +01:00
parent 0e2d8cc0d8
commit fb36a49c26
5 changed files with 53 additions and 36 deletions

View File

@@ -5,7 +5,7 @@ MAINTAINER Pit Kleyersburg <pitkley@googlemail.com>
# Install the system packages in a single layer: sudo, ghostscript,
# imagemagick, tesseract-ocr (plus the tesseract-ocr-eng package) and unpaper,
# which was added as another pre-processing step.
# The package list appears once only; the superseded line without unpaper
# duplicated every other entry and has been dropped.
# The apt package lists are removed in the same RUN so they do not persist in
# the resulting layer.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ghostscript \
        imagemagick \
        sudo \
        tesseract-ocr \
        tesseract-ocr-eng \
        unpaper \
    && rm -rf /var/lib/apt/lists/*
# Install python dependencies