From 47434dcb72ddbc4bec3e8ed40f20a06e5ef118d4 Mon Sep 17 00:00:00 2001
From: shamoon <4887959+shamoon@users.noreply.github.com>
Date: Wed, 30 Apr 2025 10:25:13 -0700
Subject: [PATCH] Truncate similar docs content

Cap each similar document's content at 1000 characters when building
the context. Apply the empty-string fallback before slicing so that a
missing (None) content still yields "" instead of raising TypeError.
---
 src/paperless_ai/ai_classifier.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/paperless_ai/ai_classifier.py b/src/paperless_ai/ai_classifier.py
index fd660763c..b75ceb1e5 100644
--- a/src/paperless_ai/ai_classifier.py
+++ b/src/paperless_ai/ai_classifier.py
@@ -90,7 +90,7 @@ def get_context_for_document(
     )[:max_docs]
     context_blocks = []
     for similar in similar_docs:
-        text = similar.content or ""
+        text = (similar.content or "")[:1000]
         title = similar.title or similar.filename or "Untitled"
         context_blocks.append(f"TITLE: {title}\n{text}")
     return "\n\n".join(context_blocks)