mirror of
https://github.com/paperless-ngx/paperless-ngx.git
synced 2025-04-02 13:45:10 -05:00
Enhancement: add timeout for Tika client (#8520)
Co-authored-by: shamoon <4887959+shamoon@users.noreply.github.com>
This commit is contained in:
parent
2bcbed31e9
commit
452ea2ccf9
@@ -33,7 +33,10 @@ class TikaDocumentParser(DocumentParser):
 
     def extract_metadata(self, document_path, mime_type):
         try:
-            with TikaClient(tika_url=settings.TIKA_ENDPOINT) as client:
+            with TikaClient(
+                tika_url=settings.TIKA_ENDPOINT,
+                timeout=settings.CELERY_TASK_TIME_LIMIT,
+            ) as client:
                 parsed = client.metadata.from_file(document_path, mime_type)
                 return [
                     {
@@ -54,7 +57,10 @@ class TikaDocumentParser(DocumentParser):
         self.log.info(f"Sending {document_path} to Tika server")
 
         try:
-            with TikaClient(tika_url=settings.TIKA_ENDPOINT) as client:
+            with TikaClient(
+                tika_url=settings.TIKA_ENDPOINT,
+                timeout=settings.CELERY_TASK_TIME_LIMIT,
+            ) as client:
                 try:
                     parsed = client.tika.as_text.from_file(document_path, mime_type)
                 except httpx.HTTPStatusError as err:
|
Loading…
x
Reference in New Issue
Block a user