From: shamoon <4887959+shamoon@users.noreply.github.com> Date: Wed, 30 Apr 2025 17:25:13 +0000 (-0700) Subject: Truncate similar docs content X-Git-Url: http://git.ipfire.org/cgi-bin/gitweb.cgi?a=commitdiff_plain;h=90bd878cf2da995ae7be114605f756e16240e8d7;p=thirdparty%2Fpaperless-ngx.git Truncate similar docs content --- diff --git a/src/paperless_ai/ai_classifier.py b/src/paperless_ai/ai_classifier.py index fd660763c..b75ceb1e5 100644 --- a/src/paperless_ai/ai_classifier.py +++ b/src/paperless_ai/ai_classifier.py @@ -90,7 +90,7 @@ def get_context_for_document( )[:max_docs] context_blocks = [] for similar in similar_docs: - text = similar.content or "" + text = similar.content[:1000] or "" title = similar.title or similar.filename or "Untitled" context_blocks.append(f"TITLE: {title}\n{text}") return "\n\n".join(context_blocks)