[3.11] gh-108303: Move tokenize-related data to Lib/test/tokenizedata (GH-109265...

author Victor Stinner <vstinner@python.org>

Thu, 21 Sep 2023 19:46:05 +0000 (21:46 +0200)

committer GitHub <noreply@github.com>

Thu, 21 Sep 2023 19:46:05 +0000 (21:46 +0200)
author Victor Stinner <vstinner@python.org>
Thu, 21 Sep 2023 19:46:05 +0000 (21:46 +0200)
committer GitHub <noreply@github.com>
Thu, 21 Sep 2023 19:46:05 +0000 (21:46 +0200)
diff --git a/.gitattributes b/.gitattributes

index 6da587a4c6ea5aeddebf3d7661e2c7b5e983aaaa..1479ca074cda129612a22bc523cab58f241825f3 100644 (file)
--- a/.gitattributes
+++ b/.gitattributes
@@ -25,7 +25,7 @@ PC/classicAppCompat.* binary
  [attr]noeol -text
  
  Lib/test/cjkencodings/*                    noeol
-Lib/test/coding20731.py                    noeol
+Lib/test/tokenizedata/coding20731.py       noeol
  Lib/test/decimaltestdata/*.decTest         noeol
  Lib/test/test_email/data/*.txt             noeol
  Lib/test/test_importlib/data01/*           noeol
diff --git a/Lib/test/test_py_compile.py b/Lib/test/test_py_compile.py

index a4a52b180dbb550b075965c54f3378c6378d89c9..6a54d48eb16e93036043a2db717ce4b71ae7ff47 100644 (file)
--- a/Lib/test/test_py_compile.py
+++ b/Lib/test/test_py_compile.py
@@ -132,7 +132,9 @@ class PyCompileTestsBase:
              os.chmod(self.directory, mode.st_mode)
  
      def test_bad_coding(self):
-        bad_coding = os.path.join(os.path.dirname(__file__), 'bad_coding2.py')
+        bad_coding = os.path.join(os.path.dirname(__file__),
+                                  'tokenizedata',
+                                  'bad_coding2.py')
          with support.captured_stderr():
              self.assertIsNone(py_compile.compile(bad_coding, doraise=False))
          self.assertFalse(os.path.exists(
@@ -195,7 +197,9 @@ class PyCompileTestsBase:
          self.assertEqual(flags, 0b1)
  
      def test_quiet(self):
-        bad_coding = os.path.join(os.path.dirname(__file__), 'bad_coding2.py')
+        bad_coding = os.path.join(os.path.dirname(__file__),
+                                  'tokenizedata',
+                                  'bad_coding2.py')
          with support.captured_stderr() as stderr:
              self.assertIsNone(py_compile.compile(bad_coding, doraise=False, quiet=2))
              self.assertIsNone(py_compile.compile(bad_coding, doraise=True, quiet=2))
@@ -259,14 +263,18 @@ class PyCompileCLITestCase(unittest.TestCase):
          self.assertTrue(os.path.exists(self.cache_path))
  
      def test_bad_syntax(self):
-        bad_syntax = os.path.join(os.path.dirname(__file__), 'badsyntax_3131.py')
+        bad_syntax = os.path.join(os.path.dirname(__file__),
+                                  'tokenizedata',
+                                  'badsyntax_3131.py')
          rc, stdout, stderr = self.pycompilecmd_failure(bad_syntax)
          self.assertEqual(rc, 1)
          self.assertEqual(stdout, b'')
          self.assertIn(b'SyntaxError', stderr)
  
      def test_bad_syntax_with_quiet(self):
-        bad_syntax = os.path.join(os.path.dirname(__file__), 'badsyntax_3131.py')
+        bad_syntax = os.path.join(os.path.dirname(__file__),
+                                  'tokenizedata',
+                                  'badsyntax_3131.py')
          rc, stdout, stderr = self.pycompilecmd_failure('-q', bad_syntax)
          self.assertEqual(rc, 1)
          self.assertEqual(stdout, b'')
diff --git a/Lib/test/test_source_encoding.py b/Lib/test/test_source_encoding.py

index ae680c516400a3586115c4e0330a51731a821393..0c7f8ee861cfe21efca9d15546f8d01ed65ebda3 100644 (file)
--- a/Lib/test/test_source_encoding.py
+++ b/Lib/test/test_source_encoding.py
@@ -69,6 +69,7 @@ class MiscSourceEncodingTest(unittest.TestCase):
      def test_20731(self):
          sub = subprocess.Popen([sys.executable,
                          os.path.join(os.path.dirname(__file__),
+                                     'tokenizedata',
                                       'coding20731.py')],
                          stderr=subprocess.PIPE)
          err = sub.communicate()[1]
@@ -101,10 +102,10 @@ class MiscSourceEncodingTest(unittest.TestCase):
          self.verify_bad_module(module_name)
  
      def verify_bad_module(self, module_name):
-        self.assertRaises(SyntaxError, __import__, 'test.' + module_name)
+        self.assertRaises(SyntaxError, __import__, 'test.tokenizedata.' + module_name)
  
          path = os.path.dirname(__file__)
-        filename = os.path.join(path, module_name + '.py')
+        filename = os.path.join(path, 'tokenizedata', module_name + '.py')
          with open(filename, "rb") as fp:
              bytes = fp.read()
          self.assertRaises(SyntaxError, compile, bytes, filename, 'exec')
diff --git a/Lib/test/test_tarfile.py b/Lib/test/test_tarfile.py

index 13a75f39f9ba525b28626436c6ce816409a189e8..623452d50ce84238522d206123702523301dee6f 100644 (file)
--- a/Lib/test/test_tarfile.py
+++ b/Lib/test/test_tarfile.py
@@ -2493,16 +2493,17 @@ class CommandLineTest(unittest.TestCase):
          return script_helper.assert_python_failure('-m', 'tarfile', *args)
  
      def make_simple_tarfile(self, tar_name):
-        files = [support.findfile('tokenize_tests.txt'),
+        files = [support.findfile('tokenize_tests.txt',
+                                  subdir='tokenizedata'),
                   support.findfile('tokenize_tests-no-coding-cookie-'
-                                  'and-utf8-bom-sig-only.txt')]
+                                  'and-utf8-bom-sig-only.txt',
+                                  subdir='tokenizedata')]
          self.addCleanup(os_helper.unlink, tar_name)
          with tarfile.open(tar_name, 'w') as tf:
              for tardata in files:
                  tf.add(tardata, arcname=os.path.basename(tardata))
  
      def make_evil_tarfile(self, tar_name):
-        files = [support.findfile('tokenize_tests.txt')]
          self.addCleanup(os_helper.unlink, tar_name)
          with tarfile.open(tar_name, 'w') as tf:
              benign = tarfile.TarInfo('benign')
@@ -2583,9 +2584,11 @@ class CommandLineTest(unittest.TestCase):
          self.assertEqual(rc, 1)
  
      def test_create_command(self):
-        files = [support.findfile('tokenize_tests.txt'),
+        files = [support.findfile('tokenize_tests.txt',
+                                  subdir='tokenizedata'),
                   support.findfile('tokenize_tests-no-coding-cookie-'
-                                  'and-utf8-bom-sig-only.txt')]
+                                  'and-utf8-bom-sig-only.txt',
+                                  subdir='tokenizedata')]
          for opt in '-c', '--create':
              try:
                  out = self.tarfilecmd(opt, tmpname, *files)
@@ -2596,9 +2599,11 @@ class CommandLineTest(unittest.TestCase):
                  os_helper.unlink(tmpname)
  
      def test_create_command_verbose(self):
-        files = [support.findfile('tokenize_tests.txt'),
+        files = [support.findfile('tokenize_tests.txt',
+                                  subdir='tokenizedata'),
                   support.findfile('tokenize_tests-no-coding-cookie-'
-                                  'and-utf8-bom-sig-only.txt')]
+                                  'and-utf8-bom-sig-only.txt',
+                                  subdir='tokenizedata')]
          for opt in '-v', '--verbose':
              try:
                  out = self.tarfilecmd(opt, '-c', tmpname, *files,
@@ -2610,7 +2615,7 @@ class CommandLineTest(unittest.TestCase):
                  os_helper.unlink(tmpname)
  
      def test_create_command_dotless_filename(self):
-        files = [support.findfile('tokenize_tests.txt')]
+        files = [support.findfile('tokenize_tests.txt', subdir='tokenizedata')]
          try:
              out = self.tarfilecmd('-c', dotlessname, *files)
              self.assertEqual(out, b'')
@@ -2621,7 +2626,7 @@ class CommandLineTest(unittest.TestCase):
  
      def test_create_command_dot_started_filename(self):
          tar_name = os.path.join(TEMPDIR, ".testtar")
-        files = [support.findfile('tokenize_tests.txt')]
+        files = [support.findfile('tokenize_tests.txt', subdir='tokenizedata')]
          try:
              out = self.tarfilecmd('-c', tar_name, *files)
              self.assertEqual(out, b'')
@@ -2631,9 +2636,11 @@ class CommandLineTest(unittest.TestCase):
              os_helper.unlink(tar_name)
  
      def test_create_command_compressed(self):
-        files = [support.findfile('tokenize_tests.txt'),
+        files = [support.findfile('tokenize_tests.txt',
+                                  subdir='tokenizedata'),
                   support.findfile('tokenize_tests-no-coding-cookie-'
-                                  'and-utf8-bom-sig-only.txt')]
+                                  'and-utf8-bom-sig-only.txt',
+                                  subdir='tokenizedata')]
          for filetype in (GzipTest, Bz2Test, LzmaTest):
              if not filetype.open:
                  continue
diff --git a/Lib/test/test_tokenize.py b/Lib/test/test_tokenize.py

index 63c2501cfe2338d7040a0e390c2473ee163924b8..62f152fe431d5beacc8b1daeca9ff3f8a1d77539 100644 (file)
--- a/Lib/test/test_tokenize.py
+++ b/Lib/test/test_tokenize.py
@@ -999,7 +999,7 @@ class TestTokenizerAdheresToPep0263(TestCase):
      """
  
      def _testFile(self, filename):
-        path = os.path.join(os.path.dirname(__file__), filename)
+        path = os.path.join(os.path.dirname(__file__), 'tokenizedata', filename)
          TestRoundtrip.check_roundtrip(self, open(path, 'rb'))
  
      def test_utf8_coding_cookie_and_no_utf8_bom(self):
@@ -1560,7 +1560,7 @@ class TestRoundtrip(TestCase):
  
          self.check_roundtrip("if x == 1 : \n"
                               "  print(x)\n")
-        fn = support.findfile("tokenize_tests.txt")
+        fn = support.findfile("tokenize_tests.txt", subdir="tokenizedata")
          with open(fn, 'rb') as f:
              self.check_roundtrip(f)
          self.check_roundtrip("if x == 1:\n"
@@ -1615,8 +1615,7 @@ class TestRoundtrip(TestCase):
          # pass the '-ucpu' option to process the full directory.
  
          import glob, random
-        fn = support.findfile("tokenize_tests.txt")
-        tempdir = os.path.dirname(fn) or os.curdir
+        tempdir = os.path.dirname(__file__) or os.curdir
          testfiles = glob.glob(os.path.join(glob.escape(tempdir), "test*.py"))
  
          # Tokenize is broken on test_pep3131.py because regular expressions are
diff --git a/Lib/test/test_tools/test_reindent.py b/Lib/test/test_tools/test_reindent.py

index 34df0c5d5119047dee35300b746144618f33572d..3aa09130a5c5eb7b4e061474b17a638eb53bb839 100644 (file)
--- a/Lib/test/test_tools/test_reindent.py
+++ b/Lib/test/test_tools/test_reindent.py
@@ -25,7 +25,7 @@ class ReindentTests(unittest.TestCase):
          self.assertGreater(err, b'')
  
      def test_reindent_file_with_bad_encoding(self):
-        bad_coding_path = findfile('bad_coding.py')
+        bad_coding_path = findfile('bad_coding.py', subdir='tokenizedata')
          rc, out, err = assert_python_ok(self.script, '-r', bad_coding_path)
          self.assertEqual(out, b'')
          self.assertNotEqual(err, b'')
diff --git a/Lib/test/test_unicode_identifiers.py b/Lib/test/test_unicode_identifiers.py

index 5b9ced5d1cb837f3f3874bb1b605f30373dadebc..63c6c055824b20f1428bea3a066984271c64b031 100644 (file)
--- a/Lib/test/test_unicode_identifiers.py
+++ b/Lib/test/test_unicode_identifiers.py
@@ -19,7 +19,7 @@ class PEP3131Test(unittest.TestCase):
  
      def test_invalid(self):
          try:
-            from test import badsyntax_3131
+            from test.tokenizedata import badsyntax_3131
          except SyntaxError as err:
              self.assertEqual(str(err),
                "invalid character '€' (U+20AC) (badsyntax_3131.py, line 2)")
diff --git a/Lib/test/tokenizedata/__init__.py b/Lib/test/tokenizedata/__init__.py

new file mode 100644 (file)

index 0000000..e69de29
diff --git a/Lib/test/bad_coding.py b/Lib/test/tokenizedata/bad_coding.py

similarity index 100%

rename from Lib/test/bad_coding.py

rename to Lib/test/tokenizedata/bad_coding.py
diff --git a/Lib/test/bad_coding2.py b/Lib/test/tokenizedata/bad_coding2.py

similarity index 100%

rename from Lib/test/bad_coding2.py

rename to Lib/test/tokenizedata/bad_coding2.py
diff --git a/Lib/test/badsyntax_3131.py b/Lib/test/tokenizedata/badsyntax_3131.py

similarity index 100%

rename from Lib/test/badsyntax_3131.py

rename to Lib/test/tokenizedata/badsyntax_3131.py
diff --git a/Lib/test/coding20731.py b/Lib/test/tokenizedata/coding20731.py

similarity index 100%

rename from Lib/test/coding20731.py

rename to Lib/test/tokenizedata/coding20731.py
diff --git a/Lib/test/tokenize_tests-latin1-coding-cookie-and-utf8-bom-sig.txt b/Lib/test/tokenizedata/tokenize_tests-latin1-coding-cookie-and-utf8-bom-sig.txt

similarity index 100%

rename from Lib/test/tokenize_tests-latin1-coding-cookie-and-utf8-bom-sig.txt

rename to Lib/test/tokenizedata/tokenize_tests-latin1-coding-cookie-and-utf8-bom-sig.txt
diff --git a/Lib/test/tokenize_tests-no-coding-cookie-and-utf8-bom-sig-only.txt b/Lib/test/tokenizedata/tokenize_tests-no-coding-cookie-and-utf8-bom-sig-only.txt

similarity index 100%

rename from Lib/test/tokenize_tests-no-coding-cookie-and-utf8-bom-sig-only.txt

rename to Lib/test/tokenizedata/tokenize_tests-no-coding-cookie-and-utf8-bom-sig-only.txt
diff --git a/Lib/test/tokenize_tests-utf8-coding-cookie-and-no-utf8-bom-sig.txt b/Lib/test/tokenizedata/tokenize_tests-utf8-coding-cookie-and-no-utf8-bom-sig.txt

similarity index 100%

rename from Lib/test/tokenize_tests-utf8-coding-cookie-and-no-utf8-bom-sig.txt

rename to Lib/test/tokenizedata/tokenize_tests-utf8-coding-cookie-and-no-utf8-bom-sig.txt
diff --git a/Lib/test/tokenize_tests-utf8-coding-cookie-and-utf8-bom-sig.txt b/Lib/test/tokenizedata/tokenize_tests-utf8-coding-cookie-and-utf8-bom-sig.txt

similarity index 100%

rename from Lib/test/tokenize_tests-utf8-coding-cookie-and-utf8-bom-sig.txt

rename to Lib/test/tokenizedata/tokenize_tests-utf8-coding-cookie-and-utf8-bom-sig.txt
diff --git a/Lib/test/tokenize_tests.txt b/Lib/test/tokenizedata/tokenize_tests.txt

similarity index 100%

rename from Lib/test/tokenize_tests.txt

rename to Lib/test/tokenizedata/tokenize_tests.txt
diff --git a/Makefile.pre.in b/Makefile.pre.in

index 254820a2509bd7b74ec1ef70c5f5253108ea9516..0d0ac1315bdc7d50a758af3922dc26c29afd4606 100644 (file)
--- a/Makefile.pre.in
+++ b/Makefile.pre.in
@@ -2043,6 +2043,7 @@ TESTSUBDIRS=      ctypes/test \
                 test/test_warnings/data \
                 test/test_zoneinfo \
                 test/test_zoneinfo/data \
+               test/tokenizedata \
                 test/tracedmodules \
                 test/typinganndata \
                 test/xmltestdata \
author	Victor Stinner <vstinner@python.org>
	Thu, 21 Sep 2023 19:46:05 +0000 (21:46 +0200)
committer	GitHub <noreply@github.com>
	Thu, 21 Sep 2023 19:46:05 +0000 (21:46 +0200)
.gitattributes		patch \| blob \| blame \| history
Lib/test/test_py_compile.py		patch \| blob \| blame \| history
Lib/test/test_source_encoding.py		patch \| blob \| blame \| history
Lib/test/test_tarfile.py		patch \| blob \| blame \| history
Lib/test/test_tokenize.py		patch \| blob \| blame \| history
Lib/test/test_tools/test_reindent.py		patch \| blob \| blame \| history
Lib/test/test_unicode_identifiers.py		patch \| blob \| blame \| history
Lib/test/tokenizedata/__init__.py	[new file with mode: 0644]	patch \| blob
Lib/test/tokenizedata/bad_coding.py	[moved from Lib/test/bad_coding.py with 100% similarity]	patch \| blob \| blame \| history
Lib/test/tokenizedata/bad_coding2.py	[moved from Lib/test/bad_coding2.py with 100% similarity]	patch \| blob \| blame \| history
Lib/test/tokenizedata/badsyntax_3131.py	[moved from Lib/test/badsyntax_3131.py with 100% similarity]	patch \| blob \| blame \| history
Lib/test/tokenizedata/coding20731.py	[moved from Lib/test/coding20731.py with 100% similarity]	patch \| blob \| blame \| history
Lib/test/tokenizedata/tokenize_tests-latin1-coding-cookie-and-utf8-bom-sig.txt	[moved from Lib/test/tokenize_tests-latin1-coding-cookie-and-utf8-bom-sig.txt with 100% similarity]	patch \| blob \| blame \| history
Lib/test/tokenizedata/tokenize_tests-no-coding-cookie-and-utf8-bom-sig-only.txt	[moved from Lib/test/tokenize_tests-no-coding-cookie-and-utf8-bom-sig-only.txt with 100% similarity]	patch \| blob \| blame \| history
Lib/test/tokenizedata/tokenize_tests-utf8-coding-cookie-and-no-utf8-bom-sig.txt	[moved from Lib/test/tokenize_tests-utf8-coding-cookie-and-no-utf8-bom-sig.txt with 100% similarity]	patch \| blob \| blame \| history
Lib/test/tokenizedata/tokenize_tests-utf8-coding-cookie-and-utf8-bom-sig.txt	[moved from Lib/test/tokenize_tests-utf8-coding-cookie-and-utf8-bom-sig.txt with 100% similarity]	patch \| blob \| blame \| history
Lib/test/tokenizedata/tokenize_tests.txt	[moved from Lib/test/tokenize_tests.txt with 100% similarity]	patch \| blob \| blame \| history
Makefile.pre.in		patch \| blob \| blame \| history