mirror of
				https://github.com/paperless-ngx/paperless-ngx.git
				synced 2025-11-03 03:16:10 -06:00 
			
		
		
		
	fixes #794
This commit is contained in:
		@@ -119,6 +119,8 @@ class RasterisedDocumentParser(DocumentParser):
 | 
				
			|||||||
        try:
 | 
					        try:
 | 
				
			||||||
            text = extract_text(pdf_file)
 | 
					            text = extract_text(pdf_file)
 | 
				
			||||||
            stripped = strip_excess_whitespace(text)
 | 
					            stripped = strip_excess_whitespace(text)
 | 
				
			||||||
 | 
					            stripped = stripped.replace("\0", " ")
 | 
				
			||||||
 | 
					
 | 
				
			||||||
            self.log("debug", f"Extracted text from PDF file {pdf_file}")
 | 
					            self.log("debug", f"Extracted text from PDF file {pdf_file}")
 | 
				
			||||||
            return stripped
 | 
					            return stripped
 | 
				
			||||||
        except PDFException:
 | 
					        except PDFException:
 | 
				
			||||||
 
 | 
				
			|||||||
		Reference in New Issue
	
	Block a user