git.ipfire.org Git - thirdparty/Python/cpython.git/commitdiff
bpo-40330: Fix utf-8 size check in ShareableList (GH-19606)
author Antoine Pitrou <antoine@python.org>
Mon, 20 Apr 2020 18:54:55 +0000 (20:54 +0200)
committer GitHub <noreply@github.com>
Mon, 20 Apr 2020 18:54:55 +0000 (11:54 -0700)
The item size must be checked after encoding to bytes, not before.

Automerge-Triggered-By: @pitrou
Lib/multiprocessing/shared_memory.py
Lib/test/_test_multiprocessing.py
Misc/NEWS.d/next/Library/2020-04-19-17-31-29.bpo-40330.DGjoIS.rst [new file with mode: 0644]

index 87e46cfbe526d9cca1c8cecfedbaa995a12d7592..a3a5fcf4aba1e7d76fa1cc66baaf011de65d0a6a 100644 (file)
@@ -445,11 +445,14 @@ class ShareableList:
 
         if not isinstance(value, (str, bytes)):
             new_format = self._types_mapping[type(value)]
+            encoded_value = value
         else:
             allocated_length = self._allocated_offsets[position + 1] - item_offset
 
-            if len(value) > allocated_length:
-                raise ValueError("exceeds available storage for existing str")
+            encoded_value = (value.encode(_encoding)
+                             if isinstance(value, str) else value)
+            if len(encoded_value) > allocated_length:
+                raise ValueError("bytes/str item exceeds available storage")
             if current_format[-1] == "s":
                 new_format = current_format
             else:
@@ -462,8 +465,7 @@ class ShareableList:
             new_format,
             value
         )
-        value = value.encode(_encoding) if isinstance(value, str) else value
-        struct.pack_into(new_format, self.shm.buf, offset, value)
+        struct.pack_into(new_format, self.shm.buf, offset, encoded_value)
 
     def __reduce__(self):
         return partial(self.__class__, name=self.shm.name), ()
index d00e928c17790585c6889cb778989f608b14a680..d633e02d016fc240bd57c6d4a36ef620aa3583e3 100644 (file)
@@ -3995,9 +3995,21 @@ class _TestSharedMemory(BaseTestCase):
         sl[4] = 'some'  # Change type at a given position.
         self.assertEqual(sl[4], 'some')
         self.assertEqual(sl.format, '8s8sdq8sxxxxxxx?q')
-        with self.assertRaises(ValueError):
-            sl[4] = 'far too many'  # Exceeds available storage.
+        with self.assertRaisesRegex(ValueError,
+                                    "exceeds available storage"):
+            sl[4] = 'far too many'
         self.assertEqual(sl[4], 'some')
+        sl[0] = 'encodés'  # Exactly 8 bytes of UTF-8 data
+        self.assertEqual(sl[0], 'encodés')
+        self.assertEqual(sl[1], b'HoWdY')  # no spillage
+        with self.assertRaisesRegex(ValueError,
+                                    "exceeds available storage"):
+            sl[0] = 'encodées'  # Exactly 9 bytes of UTF-8 data
+        self.assertEqual(sl[1], b'HoWdY')
+        with self.assertRaisesRegex(ValueError,
+                                    "exceeds available storage"):
+            sl[1] = b'123456789'
+        self.assertEqual(sl[1], b'HoWdY')
 
         # Exercise count().
         with warnings.catch_warnings():
diff --git a/Misc/NEWS.d/next/Library/2020-04-19-17-31-29.bpo-40330.DGjoIS.rst b/Misc/NEWS.d/next/Library/2020-04-19-17-31-29.bpo-40330.DGjoIS.rst
new file mode 100644 (file)
index 0000000..98cb62f
--- /dev/null
@@ -0,0 +1,2 @@
+In :meth:`ShareableList.__setitem__`, check the size of a new string item
+after encoding it to utf-8, not before.