# doc to doc is obviously not useful
if first_doc.pk == second_doc.pk:
continue
+ # Skip empty documents (e.g. password-protected)
+ if first_doc.content.strip() == "" or second_doc.content.strip() == "":
+ continue
# Skip matching which have already been matched together
# doc 1 to doc 2 is the same as doc 2 to doc 1
doc_1_to_doc_2 = (first_doc.pk, second_doc.pk)
self.assertEqual(Document.objects.count(), 2)
self.assertIsNotNone(Document.objects.get(pk=1))
self.assertIsNotNone(Document.objects.get(pk=2))
+
+ def test_empty_content(self):
+ """
+ GIVEN:
+ - 2 documents exist, both with empty content (e.g. password-protected)
+ WHEN:
+ - Command is called
+ THEN:
+ - Command output reports that no matches were found
+ """
+ Document.objects.create(
+ checksum="BEEFCAFE",
+ title="A",
+ content="",  # empty text, standing in for a password-protected file
+ mime_type="application/pdf",
+ filename="test.pdf",
+ )
+ Document.objects.create(
+ checksum="DEADBEAF",
+ title="A",
+ content="",  # empty as well, so neither document has text to compare
+ mime_type="application/pdf",
+ filename="other_test.pdf",
+ )
+ stdout, _ = self.call_command()  # second return value is not needed here
+ self.assertIn("No matches found", stdout)