From: Serhiy Storchaka Date: Fri, 22 Apr 2022 18:08:49 +0000 (+0300) Subject: [3.10] gh-90568: Fix exception type for \N with a named sequence in RE (GH-91665... X-Git-Tag: v3.10.5~153 X-Git-Url: http://git.ipfire.org/gitweb.cgi?a=commitdiff_plain;h=9c18d783c38fca57a63b61aa778d8a8d18945d95;p=thirdparty%2FPython%2Fcpython.git [3.10] gh-90568: Fix exception type for \N with a named sequence in RE (GH-91665) (GH-91830) re.error is now raised instead of TypeError. (cherry picked from commit 6ccfa31421393910b52936e0447625db06f2a655) --- diff --git a/Lib/sre_parse.py b/Lib/sre_parse.py index 53706676e9f7..d3ff196032b3 100644 --- a/Lib/sre_parse.py +++ b/Lib/sre_parse.py @@ -330,7 +330,7 @@ def _class_escape(source, escape): charname = source.getuntil('}', 'character name') try: c = ord(unicodedata.lookup(charname)) - except KeyError: + except (KeyError, TypeError): raise source.error("undefined character name %r" % charname, len(charname) + len(r'\N{}')) return LITERAL, c @@ -390,7 +390,7 @@ def _escape(source, escape, state): charname = source.getuntil('}', 'character name') try: c = ord(unicodedata.lookup(charname)) - except KeyError: + except (KeyError, TypeError): raise source.error("undefined character name %r" % charname, len(charname) + len(r'\N{}')) return LITERAL, c diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py index 9e5223a125b0..305ec8eef326 100644 --- a/Lib/test/test_re.py +++ b/Lib/test/test_re.py @@ -754,6 +754,10 @@ class ReTests(unittest.TestCase): "undefined character name 'SPAM'", 0) self.checkPatternError(r'[\N{SPAM}]', "undefined character name 'SPAM'", 1) + self.checkPatternError(r'\N{KEYCAP NUMBER SIGN}', + "undefined character name 'KEYCAP NUMBER SIGN'", 0) + self.checkPatternError(r'[\N{KEYCAP NUMBER SIGN}]', + "undefined character name 'KEYCAP NUMBER SIGN'", 1) self.checkPatternError(br'\N{LESS-THAN SIGN}', r'bad escape \N', 0) self.checkPatternError(br'[\N{LESS-THAN SIGN}]', r'bad escape \N', 1) diff --git a/Misc/NEWS.d/next/Library/2022-04-18-16-31-33.gh-issue-90568.9kiU7o.rst b/Misc/NEWS.d/next/Library/2022-04-18-16-31-33.gh-issue-90568.9kiU7o.rst new file mode 100644 index 000000000000..4411c715830e --- /dev/null +++ b/Misc/NEWS.d/next/Library/2022-04-18-16-31-33.gh-issue-90568.9kiU7o.rst @@ -0,0 +1,3 @@ +Parsing ``\N`` escapes of Unicode Named Character Sequences in a +:mod:`regular expression ` raises now :exc:`re.error` instead of +``TypeError``.