do a backport of r75928

author Benjamin Peterson <benjamin@python.org>

Thu, 29 Oct 2009 01:49:07 +0000 (01:49 +0000)

committer Benjamin Peterson <benjamin@python.org>

Thu, 29 Oct 2009 01:49:07 +0000 (01:49 +0000)
author Benjamin Peterson <benjamin@python.org>
Thu, 29 Oct 2009 01:49:07 +0000 (01:49 +0000)
committer Benjamin Peterson <benjamin@python.org>
Thu, 29 Oct 2009 01:49:07 +0000 (01:49 +0000)
diff --git a/Lib/test/test_pep263.py b/Lib/test/test_pep263.py

index b7bb5a2965995edc60381e1266550b8811f8bdad..e4faa9ff56afb3dc953e1c8b6d5fbcd245f47613 100644 (file)
--- a/Lib/test/test_pep263.py
+++ b/Lib/test/test_pep263.py
@@ -23,6 +23,13 @@ class PEP263Test(unittest.TestCase):
          self.assertEqual(d['u'], u'\xf3')
  
  
+    def test_issue3297(self):
+        c = compile("a, b = '\U0001010F', '\\U0001010F'", "dummy", "exec")
+        d = {}
+        exec(c, d)
+        self.assertEqual(d['a'], d['b'])
+        self.assertEqual(len(d['a']), len(d['b']))
+
  def test_main():
      test_support.run_unittest(PEP263Test)
  
diff --git a/Python/ast.c b/Python/ast.c

index 347da2aa95669ad368874c772a63f701d635a2a4..7f379a5957b01eda6d512ffdfff3a140ba452617 100644 (file)
--- a/Python/ast.c
+++ b/Python/ast.c
@@ -3289,10 +3289,11 @@ decode_unicode(struct compiling *c, const char *s, size_t len, int rawmode, cons
                  u = NULL;
          } else {
                  /* check for integer overflow */
-                if (len > PY_SIZE_MAX / 4)
+                if (len > PY_SIZE_MAX / 6)
                          return NULL;
-                /* "\XX" may become "\u005c\uHHLL" (12 bytes) */
-                u = PyString_FromStringAndSize((char *)NULL, len * 4);
+               /* "<C3><A4>" (2 bytes) may become "\U000000E4" (10 bytes), or 1:5
+                  "\ä" (3 bytes) may become "\u005c\U000000E4" (16 bytes), or ~1:6 */
+                u = PyString_FromStringAndSize((char *)NULL, len * 6);
                  if (u == NULL)
                          return NULL;
                  p = buf = PyString_AsString(u);
@@ -3309,19 +3310,21 @@ decode_unicode(struct compiling *c, const char *s, size_t len, int rawmode, cons
                                  PyObject *w;
                                  char *r;
                                  Py_ssize_t rn, i;
-                                w = decode_utf8(c, &s, end, "utf-16-be");
+                                w = decode_utf8(c, &s, end, "utf-32-be");
                                  if (w == NULL) {
                                          Py_DECREF(u);
                                          return NULL;
                                  }
                                  r = PyString_AsString(w);
                                  rn = PyString_Size(w);
-                                assert(rn % 2 == 0);
-                                for (i = 0; i < rn; i += 2) {
-                                        sprintf(p, "\\u%02x%02x",
+                                assert(rn % 4 == 0);
+                                for (i = 0; i < rn; i += 4) {
+                                        sprintf(p, "\\U%02x%02x%02x%02x",
                                                  r[i + 0] & 0xFF,
-                                                r[i + 1] & 0xFF);
-                                        p += 6;
+                                                r[i + 1] & 0xFF,
+                                               r[i + 2] & 0xFF,
+                                               r[i + 3] & 0xFF);
+                                        p += 10;
                                  }
                                  Py_DECREF(w);
                          } else {
author	Benjamin Peterson <benjamin@python.org>
	Thu, 29 Oct 2009 01:49:07 +0000 (01:49 +0000)
committer	Benjamin Peterson <benjamin@python.org>
	Thu, 29 Oct 2009 01:49:07 +0000 (01:49 +0000)
Lib/test/test_pep263.py		patch \| blob \| blame \| history
Python/ast.c		patch \| blob \| blame \| history