Fix: skip fuzzy matching for empty document content (#10914)

This commit is contained in:
shamoon
2025-09-22 23:30:24 -07:00
committed by GitHub
parent 8d1f23e9d6
commit 6119c215e7
2 changed files with 29 additions and 0 deletions

View File

@@ -92,6 +92,9 @@ class Command(MultiProcessMixin, ProgressBarMixin, BaseCommand):
# Comparing a document against itself is obviously not useful
if first_doc.pk == second_doc.pk:
continue
# Skip empty documents (e.g. password-protected)
if first_doc.content.strip() == "" or second_doc.content.strip() == "":
continue
# Skip document pairs which have already been matched together
# doc 1 to doc 2 is the same as doc 2 to doc 1
doc_1_to_doc_2 = (first_doc.pk, second_doc.pk)