mirror of
https://github.com/paperless-ngx/paperless-ngx.git
synced 2025-04-02 13:45:10 -05:00
fixes #794
This commit is contained in:
parent
27cb243a2f
commit
d26c46e034
@ -119,6 +119,8 @@ class RasterisedDocumentParser(DocumentParser):
|
||||
try:
|
||||
text = extract_text(pdf_file)
|
||||
stripped = strip_excess_whitespace(text)
|
||||
stripped = stripped.replace("\0", " ")
|
||||
|
||||
self.log("debug", f"Extracted text from PDF file {pdf_file}")
|
||||
return stripped
|
||||
except PDFException:
|
||||
|
Loading…
x
Reference in New Issue
Block a user