mirror of
https://github.com/paperless-ngx/paperless-ngx.git
synced 2025-04-02 13:45:10 -05:00
fixes #794
This commit is contained in:
parent
27cb243a2f
commit
d26c46e034
@ -119,6 +119,8 @@ class RasterisedDocumentParser(DocumentParser):
|
|||||||
try:
|
try:
|
||||||
text = extract_text(pdf_file)
|
text = extract_text(pdf_file)
|
||||||
stripped = strip_excess_whitespace(text)
|
stripped = strip_excess_whitespace(text)
|
||||||
|
stripped = stripped.replace("\0", " ")
|
||||||
|
|
||||||
self.log("debug", f"Extracted text from PDF file {pdf_file}")
|
self.log("debug", f"Extracted text from PDF file {pdf_file}")
|
||||||
return stripped
|
return stripped
|
||||||
except PDFException:
|
except PDFException:
|
||||||
|
Loading…
x
Reference in New Issue
Block a user