Issue #19405: Fixed outdated comments in the _sre module.

author Serhiy Storchaka <storchaka@gmail.com>

Sun, 27 Oct 2013 06:04:58 +0000 (08:04 +0200)

committer Serhiy Storchaka <storchaka@gmail.com>

Sun, 27 Oct 2013 06:04:58 +0000 (08:04 +0200)
author Serhiy Storchaka <storchaka@gmail.com>
Sun, 27 Oct 2013 06:04:58 +0000 (08:04 +0200)
committer Serhiy Storchaka <storchaka@gmail.com>
Sun, 27 Oct 2013 06:04:58 +0000 (08:04 +0200)
diff --git a/Lib/sre_compile.py b/Lib/sre_compile.py

index a80c74dc6005725be99aded605b99ae2a4161f9c..b984a54b037e82e0a218035459e3dbedf2d34a55 100644 (file)
--- a/Lib/sre_compile.py
+++ b/Lib/sre_compile.py
@@ -276,10 +276,10 @@ def _mk_bitmap(bits):
  # set is constructed. Then, this bitmap is sliced into chunks of 256
  # characters, duplicate chunks are eliminated, and each chunk is
  # given a number. In the compiled expression, the charset is
-# represented by a 16-bit word sequence, consisting of one word for
-# the number of different chunks, a sequence of 256 bytes (128 words)
+# represented by a 32-bit word sequence, consisting of one word for
+# the number of different chunks, a sequence of 256 bytes (64 words)
  # of chunk numbers indexed by their original chunk position, and a
-# sequence of chunks (16 words each).
+# sequence of 256-bit chunks (8 words each).
  
  # Compression is normally good: in a typical charset, large ranges of
  # Unicode will be either completely excluded (e.g. if only cyrillic
@@ -292,9 +292,9 @@ def _mk_bitmap(bits):
  # less significant byte is a bit index in the chunk (just like the
  # CHARSET matching).
  
-# In UCS-4 mode, the BIGCHARSET opcode still supports only subsets
+# The BIGCHARSET opcode still supports only subsets
  # of the basic multilingual plane; an efficient representation
-# for all of UTF-16 has not yet been developed. This means,
+# for all of Unicode has not yet been developed. This means,
  # in particular, that negated charsets cannot be represented as
  # bigcharsets.
  
diff --git a/Modules/_sre.c b/Modules/_sre.c

index 787809fd0f51aac602930241b0412c009b93fb6d..1c76d24dbd31a09518a5c71d73af8f448a07438c 100644 (file)
--- a/Modules/_sre.c
+++ b/Modules/_sre.c
@@ -2749,8 +2749,7 @@ _compile(PyObject* self_, PyObject* args)
      \_________\_____/        /
                 \____________/
  
-   It also helps that SRE_CODE is always an unsigned type, either 2 bytes or 4
-   bytes wide (the latter if Python is compiled for "wide" unicode support).
+   It also helps that SRE_CODE is always an unsigned type.
  */
  
  /* Defining this one enables tracing of the validator */
author	Serhiy Storchaka <storchaka@gmail.com>
	Sun, 27 Oct 2013 06:04:58 +0000 (08:04 +0200)
committer	Serhiy Storchaka <storchaka@gmail.com>
	Sun, 27 Oct 2013 06:04:58 +0000 (08:04 +0200)
Lib/sre_compile.py		patch \| blob \| blame \| history
Modules/_sre.c		patch \| blob \| blame \| history