To prevent dataset files from different sources from overwriting each
other, give each downloaded and extracted file a prefix derived from a
hash of its source URL. This ensures unique filenames across all
rulesets. This mostly matters for datasets: by the time datasets are
processed we are working with a merged set of filenames, unlike rules,
which are parsed much earlier while we still have a per-source list of
files.
Not the most elegant solution, but saves a rather large refactor.
Bug: #6833
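
For illustration only (not part of the change itself; the helper name
and example URLs below are hypothetical), a minimal sketch of the
hash-prefix scheme:

    import hashlib

    def unique_key(url, filename):
        # Hypothetical helper: prefix a filename with the MD5 hash of
        # its source URL so files with the same name from different
        # sources do not collide.
        prefix = hashlib.md5(url.encode()).hexdigest()
        return "{}/{}".format(prefix, filename)

    # Two sources that both contain a file named "example.lst" end up
    # with distinct keys, so neither clobbers the other.
    key_a = unique_key("https://example.com/ruleset-a.tar.gz", "example.lst")
    key_b = unique_key("https://example.com/ruleset-b.tar.gz", "example.lst")
    assert key_a != key_b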
- Don't base dataset filenames on the contents of the file, but
instead the filename path:
https://redmine.openinfosecfoundation.org/issues/6763
+- Give each file in a source a unique filename by prefixing the files
+ with a hash of the URL to prevent duplicate filenames from
+ clobbering each other, in particular dataset files:
+ https://redmine.openinfosecfoundation.org/issues/6833
## 1.3.0 - 2023-07-07
# Now download each URL.
files = []
for url in urls:
+
+    # To de-duplicate filenames, add a prefix that is a hash of the URL.
+    prefix = hashlib.md5(url[0].encode()).hexdigest()
    source_files = Fetch().run(url)
    for key in source_files:
-        files.append(SourceFile(key, source_files[key]))
+        content = source_files[key]
+        key = "{}/{}".format(prefix, key)
+        files.append(SourceFile(key, content))
# Now load local rules.
if config.get("local") is not None: