bpo-36502: Correct documentation of str.isspace() (GH-15019) (GH-15296)

author Miss Islington (bot) <31488909+miss-islington@users.noreply.github.com>

Mon, 19 Aug 2019 10:10:14 +0000 (03:10 -0700)

committer GitHub <noreply@github.com>

Mon, 19 Aug 2019 10:10:14 +0000 (03:10 -0700)
author Miss Islington (bot) <31488909+miss-islington@users.noreply.github.com>
Mon, 19 Aug 2019 10:10:14 +0000 (03:10 -0700)
committer GitHub <noreply@github.com>
Mon, 19 Aug 2019 10:10:14 +0000 (03:10 -0700)
diff --git a/Doc/library/stdtypes.rst b/Doc/library/stdtypes.rst

index d35c171aba39c02f2db746a9965f96c4feb06c82..b9581ce1c9ae80d9a1236bf1ee3af93da315a765 100644 (file)
--- a/Doc/library/stdtypes.rst
+++ b/Doc/library/stdtypes.rst
@@ -1731,9 +1731,13 @@ expression support in the :mod:`re` module).
  .. method:: str.isspace()
  
     Return true if there are only whitespace characters in the string and there is
-   at least one character, false otherwise.  Whitespace characters  are those
-   characters defined in the Unicode character database as "Other" or "Separator"
-   and those with bidirectional property being one of "WS", "B", or "S".
+   at least one character, false otherwise.
+
+   A character is *whitespace* if in the Unicode character database
+   (see :mod:`unicodedata`), either its general category is ``Zs``
+   ("Separator, space"), or its bidirectional class is one of ``WS``,
+   ``B``, or ``S``.
+
  
  .. method:: str.istitle()
  
diff --git a/Lib/test/test_unicode.py b/Lib/test/test_unicode.py

index 1aad9334074c5cc22af16414826d8db67292e0f5..4ebd82d3e0c2f131d74ffd132c4bf7ecad7706b0 100644 (file)
--- a/Lib/test/test_unicode.py
+++ b/Lib/test/test_unicode.py
@@ -11,6 +11,7 @@ import itertools
  import operator
  import struct
  import sys
+import unicodedata
  import unittest
  import warnings
  from test import support, string_tests
@@ -615,11 +616,21 @@ class UnicodeTest(string_tests.CommonTest,
          self.checkequalnofix(True, '\u2000', 'isspace')
          self.checkequalnofix(True, '\u200a', 'isspace')
          self.checkequalnofix(False, '\u2014', 'isspace')
-        # apparently there are no non-BMP spaces chars in Unicode 6
+        # There are no non-BMP whitespace chars as of Unicode 12.
          for ch in ['\U00010401', '\U00010427', '\U00010429', '\U0001044E',
                     '\U0001F40D', '\U0001F46F']:
              self.assertFalse(ch.isspace(), '{!a} is not space.'.format(ch))
  
+    @support.requires_resource('cpu')
+    def test_isspace_invariant(self):
+        for codepoint in range(sys.maxunicode + 1):
+            char = chr(codepoint)
+            bidirectional = unicodedata.bidirectional(char)
+            category = unicodedata.category(char)
+            self.assertEqual(char.isspace(),
+                             (bidirectional in ('WS', 'B', 'S')
+                              or category == 'Zs'))
+
      def test_isalnum(self):
          super().test_isalnum()
          for ch in ['\U00010401', '\U00010427', '\U00010429', '\U0001044E',
author	Miss Islington (bot) <31488909+miss-islington@users.noreply.github.com>
	Mon, 19 Aug 2019 10:10:14 +0000 (03:10 -0700)
committer	GitHub <noreply@github.com>
	Mon, 19 Aug 2019 10:10:14 +0000 (03:10 -0700)
Doc/library/stdtypes.rst		patch | blob | blame | history
Lib/test/test_unicode.py		patch | blob | blame | history