]> git.ipfire.org Git - thirdparty/paperless-ngx.git/commitdiff
Chore: add headers for wikipedia CI tests (#11253)
authorshamoon <4887959+shamoon@users.noreply.github.com>
Sat, 1 Nov 2025 16:37:49 +0000 (09:37 -0700)
committerGitHub <noreply@github.com>
Sat, 1 Nov 2025 16:37:49 +0000 (09:37 -0700)
src/paperless_mail/tests/test_parsers_live.py

index e1febb1e5d2fd1e3af091de9faeb79a6ae585821..2c3ef262aa953515da0ff9bc716245e37f3df366 100644 (file)
@@ -53,6 +53,15 @@ class TestUrlCanary:
     Verify certain URLs are still available so testing is valid still
     """
 
+    # Wikimedia rejects requests without a browser-like User-Agent header and returns 403.
+    _WIKIMEDIA_HEADERS = {
+        "User-Agent": (
+            "Mozilla/5.0 (X11; Linux x86_64) "
+            "AppleWebKit/537.36 (KHTML, like Gecko) "
+            "Chrome/123.0.0.0 Safari/537.36"
+        ),
+    }
+
     def test_online_image_exception_on_not_available(self):
         """
         GIVEN:
@@ -70,6 +79,7 @@ class TestUrlCanary:
         with pytest.raises(httpx.HTTPStatusError) as exec_info:
             resp = httpx.get(
                 "https://upload.wikimedia.org/wikipedia/en/f/f7/nonexistent.png",
+                headers=self._WIKIMEDIA_HEADERS,
             )
             resp.raise_for_status()
 
@@ -90,7 +100,10 @@ class TestUrlCanary:
         """
 
         # Now check the URL used in samples/sample.html
-        resp = httpx.get("https://upload.wikimedia.org/wikipedia/en/f/f7/RickRoll.png")
+        resp = httpx.get(
+            "https://upload.wikimedia.org/wikipedia/en/f/f7/RickRoll.png",
+            headers=self._WIKIMEDIA_HEADERS,
+        )
         resp.raise_for_status()