mirror of
				https://github.com/paperless-ngx/paperless-ngx.git
				synced 2025-10-28 03:46:06 -05:00 
			
		
		
		
	Merge pull request #421 from ddddavidmartin/clarify_forgiving_ocr_handling
Clarify forgiving OCR handling
This commit is contained in:
		| @@ -188,6 +188,11 @@ PAPERLESS_DEBUG="false" | |||||||
| #PAPERLESS_CONSUMER_LOOP_TIME=10 | #PAPERLESS_CONSUMER_LOOP_TIME=10 | ||||||
|  |  | ||||||
|  |  | ||||||
|  | # By default Paperless stops consuming a document if no language can be detected. | ||||||
|  | # Set to "true" to consume documents even if language detection fails. | ||||||
|  | #PAPERLESS_FORGIVING_OCR="false" | ||||||
|  |  | ||||||
|  |  | ||||||
| ############################################################################### | ############################################################################### | ||||||
| ####                            Interface                                  #### | ####                            Interface                                  #### | ||||||
| ############################################################################### | ############################################################################### | ||||||
|   | |||||||
| @@ -153,7 +153,10 @@ class RasterisedDocumentParser(DocumentParser): | |||||||
|                 ) |                 ) | ||||||
|                 raw_text = self._assemble_ocr_sections(imgs, middle, raw_text) |                 raw_text = self._assemble_ocr_sections(imgs, middle, raw_text) | ||||||
|                 return raw_text |                 return raw_text | ||||||
|             raise OCRError("Language detection failed") |             error_msg = ("Language detection failed. Set " | ||||||
|  |                          "PAPERLESS_FORGIVING_OCR in config file to continue " | ||||||
|  |                          "anyway.") | ||||||
|  |             raise OCRError(error_msg) | ||||||
|  |  | ||||||
|         if ISO639[guessed_language] == self.DEFAULT_OCR_LANGUAGE: |         if ISO639[guessed_language] == self.DEFAULT_OCR_LANGUAGE: | ||||||
|             raw_text = self._assemble_ocr_sections(imgs, middle, raw_text) |             raw_text = self._assemble_ocr_sections(imgs, middle, raw_text) | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user
	 Daniel Quinn
					Daniel Quinn