git.ipfire.org Git - thirdparty/Python/cpython.git/commitdiff
gh-95731: Fix module docstring extraction in pygettext (GH-95732)
author Miss Islington (bot) <31488909+miss-islington@users.noreply.github.com>
Sat, 15 Oct 2022 15:33:19 +0000 (08:33 -0700)
committer GitHub <noreply@github.com>
Sat, 15 Oct 2022 15:33:19 +0000 (08:33 -0700)
(cherry picked from commit 120b4ab2b68aebf96ce0de243eab89a25fc2d282)

Co-authored-by: Jakub Kuczys <me@jacken.men>
Lib/test/test_tools/test_i18n.py
Misc/NEWS.d/next/Tools-Demos/2022-08-05-23-25-59.gh-issue-95731.N2KohU.rst [new file with mode: 0644]
Tools/i18n/pygettext.py

diff --git a/Lib/test/test_tools/test_i18n.py b/Lib/test/test_tools/test_i18n.py
index 12f778dbf8405d01ce03f33f3e6361e473a67185..985e2262c7c62e70253d8865e986419dbd3223fc 100644 (file)
@@ -155,6 +155,26 @@ class Test_pygettext(unittest.TestCase):
         '''))
         self.assertFalse([msgid for msgid in msgids if 'doc' in msgid])
 
+    def test_moduledocstring(self):
+        for doc in ('"""doc"""', "r'''doc'''", "R'doc'", 'u"doc"'):
+            with self.subTest(doc):
+                msgids = self.extract_docstrings_from_str(dedent('''\
+                %s
+                ''' % doc))
+                self.assertIn('doc', msgids)
+
+    def test_moduledocstring_bytes(self):
+        msgids = self.extract_docstrings_from_str(dedent('''\
+        b"""doc"""
+        '''))
+        self.assertFalse([msgid for msgid in msgids if 'doc' in msgid])
+
+    def test_moduledocstring_fstring(self):
+        msgids = self.extract_docstrings_from_str(dedent('''\
+        f"""doc"""
+        '''))
+        self.assertFalse([msgid for msgid in msgids if 'doc' in msgid])
+
     def test_msgid(self):
         msgids = self.extract_docstrings_from_str(
                 '''_("""doc""" r'str' u"ing")''')
diff --git a/Misc/NEWS.d/next/Tools-Demos/2022-08-05-23-25-59.gh-issue-95731.N2KohU.rst b/Misc/NEWS.d/next/Tools-Demos/2022-08-05-23-25-59.gh-issue-95731.N2KohU.rst
new file mode 100644 (file)
index 0000000..6b21461
--- /dev/null
@@ -0,0 +1 @@
+Fix handling of module docstrings in :file:`Tools/i18n/pygettext.py`.
diff --git a/Tools/i18n/pygettext.py b/Tools/i18n/pygettext.py
index 6f889adffe6c7a260e9626dd5a36a00fd15a950e..7ada79105db1cad46db22b597cb71e74d06361ca 100755 (executable)
@@ -335,9 +335,10 @@ class TokenEater:
                 if ttype == tokenize.STRING and is_literal_string(tstring):
                     self.__addentry(safe_eval(tstring), lineno, isdocstring=1)
                     self.__freshmodule = 0
-                elif ttype not in (tokenize.COMMENT, tokenize.NL):
-                    self.__freshmodule = 0
-                return
+                    return
+                if ttype in (tokenize.COMMENT, tokenize.NL, tokenize.ENCODING):
+                    return
+                self.__freshmodule = 0
             # class or func/method docstring?
             if ttype == tokenize.NAME and tstring in ('class', 'def'):
                 self.__state = self.__suiteseen