mirror of
				https://github.com/paperless-ngx/paperless-ngx.git
				synced 2025-10-30 03:56:23 -05:00 
			
		
		
		
	Workaround for all PDFminer.six issues.
This commit is contained in:
		| @@ -121,7 +121,12 @@ class RasterisedDocumentParser(DocumentParser): | ||||
|  | ||||
|             self.log("debug", f"Extracted text from PDF file {pdf_file}") | ||||
|             return stripped | ||||
|         except PDFException: | ||||
|         except Exception: | ||||
|             # TODO catch all for various issues with PDFminer.six. | ||||
|             #  If PDFminer fails, fall back to OCR. | ||||
|             self.log("warn", | ||||
|                      "Error while getting text from PDF document with " | ||||
|                      "pdfminer.six", exc_info=True) | ||||
|             # probably not a PDF file. | ||||
|             return None | ||||
|  | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 jonaswinkler
					jonaswinkler