gh-108834: regrtest reruns failed tests in subprocesses (#108839)
author Victor Stinner <vstinner@python.org>
Sun, 3 Sep 2023 21:37:15 +0000 (23:37 +0200)
committer GitHub <noreply@github.com>
Sun, 3 Sep 2023 21:37:15 +0000 (21:37 +0000)
When using the --rerun option, regrtest now re-runs failed tests
in verbose mode in fresh worker processes to get more
deterministic behavior, and it can now write its final report
even if a test killed a worker process.
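
A typical invocation (regrtest's standard entry point; test
selection omitted):

    $ ./python -m test --rerun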

Add a --fail-rerun option to regrtest: exit with a non-zero exit
code if a test failed but then passed when re-run in verbose mode
(in a fresh process). This option is more useful now that tests
can pass when re-run in a fresh worker process, whereas they
failed when run sequentially after other tests.
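
A minimal sketch of the resulting exit-code policy; the logic
mirrors the get_exitcode() method added in
Lib/test/libregrtest/main.py below (EXITCODE_NO_TESTS_RAN is 4 in
libregrtest; its value does not appear in this diff):

    EXITCODE_BAD_TEST = 2
    EXITCODE_ENV_CHANGED = 3
    EXITCODE_NO_TESTS_RAN = 4
    EXITCODE_INTERRUPTED = 130

    def get_exitcode(bad, interrupted, env_changed, no_tests_run,
                     rerun, *, fail_env_changed, fail_rerun):
        # With --fail-rerun, a test that failed and then passed on
        # re-run still fails the whole run.
        if bad:
            return EXITCODE_BAD_TEST
        if interrupted:
            return EXITCODE_INTERRUPTED
        if fail_env_changed and env_changed:
            return EXITCODE_ENV_CHANGED
        if no_tests_run:
            return EXITCODE_NO_TESTS_RAN
        if rerun and fail_rerun:
            return EXITCODE_BAD_TEST
        return 0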

Rename the --verbose2 option (-w) to --rerun. Keep --verbose2 as
a deprecated alias.
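
The alias works by pointing both options at the same argparse
destination; a self-contained sketch of the pattern used in
libregrtest/cmdline.py:

    import argparse

    parser = argparse.ArgumentParser()
    # -w/--rerun is the new spelling; --verbose2 stays usable as a
    # deprecated alias by sharing the same destination.
    parser.add_argument('-w', '--rerun', action='store_true',
                        help='re-run failed tests in verbose mode')
    parser.add_argument('--verbose2', action='store_true', dest='rerun',
                        help='deprecated alias to --rerun')

    ns = parser.parse_args(['--verbose2'])
    assert ns.rerun is True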

Changes:

* Fix and enhance statistics in regrtest summary. Add "(filtered)"
  when --match and/or --ignore options are used.
* Add RunTests class.
* Add TestResult.get_rerun_match_tests() method.
* Rewrite code to serialize/deserialize worker arguments as JSON
  using a new WorkerJob class (see the sketch after this list).
* Fix stats when a test is run with --forever --rerun.
* If failed test names cannot be parsed, log a warning and don't
  filter tests.
* test_regrtest.test_rerun_success() now uses a marker file, since
  the test is re-run in a separate process.
* Add tests on normalize_test_name() function.
* Add test_success() and test_skip() tests to test_regrtest.
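
A simplified, self-contained sketch of the JSON round-trip used for
worker arguments (the real code in runtest_mp.py also encodes the
full argparse Namespace the same way, with a second "__namespace__"
marker):

    import dataclasses
    import json

    @dataclasses.dataclass(slots=True)
    class WorkerJob:
        test_name: str
        rerun: bool = False
        match_tests: list[str] | None = None

    class _EncodeWorkerJob(json.JSONEncoder):
        def default(self, o):
            if isinstance(o, WorkerJob):
                # Tag the dict so the decoder knows which class to rebuild.
                return {**dataclasses.asdict(o), '__worker_job__': True}
            return super().default(o)

    def _decode_worker_job(d):
        if d.pop('__worker_job__', False):
            return WorkerJob(**d)
        return d

    job = WorkerJob('test_os', rerun=True, match_tests=['test_getcwd'])
    data = json.dumps(job, cls=_EncodeWorkerJob)
    assert json.loads(data, object_hook=_decode_worker_job) == job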

12 files changed:
Lib/test/bisect_cmd.py
Lib/test/libregrtest/cmdline.py
Lib/test/libregrtest/main.py
Lib/test/libregrtest/runtest.py
Lib/test/libregrtest/runtest_mp.py
Lib/test/libregrtest/utils.py
Lib/test/support/__init__.py
Lib/test/support/testresult.py
Lib/test/test_regrtest.py
Misc/NEWS.d/next/Tests/2023-09-03-02-01-55.gh-issue-108834.iAwXzj.rst [new file with mode: 0644]
Misc/NEWS.d/next/Tests/2023-09-03-06-17-12.gh-issue-108834.fjV-CJ.rst [new file with mode: 0644]
Misc/NEWS.d/next/Tests/2023-09-03-20-15-49.gh-issue-108834.Osvmhf.rst [new file with mode: 0644]

index 0bdd7a43c03f7bf818d4356460a92d7c7cdb5be9..5cb804bd469dc35176e94deb7032daaf6df4cab0 100755 (executable)
@@ -109,9 +109,10 @@ def parse_args():
 
 def main():
     args = parse_args()
-    if '-w' in args.test_args or '--verbose2' in args.test_args:
-        print("WARNING: -w/--verbose2 option should not be used to bisect!")
-        print()
+    for opt in ('-w', '--rerun', '--verbose2'):
+        if opt in args.test_args:
+            print(f"WARNING: {opt} option should not be used to bisect!")
+            print()
 
     if args.input:
         with open(args.input) as fp:
index ebe57920d9185cad8fa85b3871e9f534eb47c743..251fcacb1d14f77148607d497e06d28e6e4cafa6 100644 (file)
@@ -156,7 +156,7 @@ class Namespace(argparse.Namespace):
         self.coverdir = 'coverage'
         self.runleaks = False
         self.huntrleaks = False
-        self.verbose2 = False
+        self.rerun = False
         self.verbose3 = False
         self.print_slow = False
         self.random_seed = None
@@ -213,8 +213,10 @@ def _create_parser():
     group = parser.add_argument_group('Verbosity')
     group.add_argument('-v', '--verbose', action='count',
                        help='run tests in verbose mode with output to stdout')
-    group.add_argument('-w', '--verbose2', action='store_true',
+    group.add_argument('-w', '--rerun', action='store_true',
                        help='re-run failed tests in verbose mode')
+    group.add_argument('--verbose2', action='store_true', dest='rerun',
+                       help='deprecated alias to --rerun')
     group.add_argument('-W', '--verbose3', action='store_true',
                        help='display test output on failure')
     group.add_argument('-q', '--quiet', action='store_true',
@@ -309,6 +311,9 @@ def _create_parser():
     group.add_argument('--fail-env-changed', action='store_true',
                        help='if a test file alters the environment, mark '
                             'the test as failed')
+    group.add_argument('--fail-rerun', action='store_true',
+                       help='if a test failed and then passed when re-run, '
+                            'mark the tests as failed')
 
     group.add_argument('--junit-xml', dest='xmlpath', metavar='FILENAME',
                        help='writes JUnit-style XML results to the specified '
@@ -380,7 +385,7 @@ def _parse_args(args, **kwargs):
         ns.python = shlex.split(ns.python)
     if ns.failfast and not (ns.verbose or ns.verbose3):
         parser.error("-G/--failfast needs either -v or -W")
-    if ns.pgo and (ns.verbose or ns.verbose2 or ns.verbose3):
+    if ns.pgo and (ns.verbose or ns.rerun or ns.verbose3):
         parser.error("--pgo/-v don't go together!")
     if ns.pgo_extended:
         ns.pgo = True  # pgo_extended implies pgo
index 6e6423e156781bd2f955c29f6ae735db33887c0a..77a4090a826e069b0fc34791d06d269374cb3331 100644 (file)
@@ -11,11 +11,11 @@ import time
 import unittest
 from test.libregrtest.cmdline import _parse_args
 from test.libregrtest.runtest import (
-    findtests, split_test_packages, runtest, get_abs_module,
-    PROGRESS_MIN_TIME, State)
+    findtests, split_test_packages, runtest, abs_module_name,
+    PROGRESS_MIN_TIME, State, MatchTestsDict, RunTests)
 from test.libregrtest.setup import setup_tests
 from test.libregrtest.pgo import setup_pgo_tests
-from test.libregrtest.utils import (removepy, count, format_duration,
+from test.libregrtest.utils import (strip_py_suffix, count, format_duration,
                                     printlist, get_build_info)
 from test import support
 from test.support import TestStats
@@ -28,14 +28,6 @@ from test.support import threading_helper
 # Must be smaller than buildbot "1200 seconds without output" limit.
 EXIT_TIMEOUT = 120.0
 
-# gh-90681: When rerunning tests, we might need to rerun the whole
-# class or module suite if some its life-cycle hooks fail.
-# Test level hooks are not affected.
-_TEST_LIFECYCLE_HOOKS = frozenset((
-    'setUpClass', 'tearDownClass',
-    'setUpModule', 'tearDownModule',
-))
-
 EXITCODE_BAD_TEST = 2
 EXITCODE_INTERRUPTED = 130
 EXITCODE_ENV_CHANGED = 3
@@ -72,19 +64,22 @@ class Regrtest:
         # tests
         self.tests = []
         self.selected = []
+        self.all_runtests: list[RunTests] = []
 
         # test results
-        self.good = []
-        self.bad = []
-        self.skipped = []
-        self.resource_denied = []
-        self.environment_changed = []
-        self.run_no_tests = []
-        self.need_rerun = []
-        self.rerun = []
-        self.first_result = None
+        self.good: list[str] = []
+        self.bad: list[str] = []
+        self.rerun_bad: list[str] = []
+        self.skipped: list[str] = []
+        self.resource_denied: list[str] = []
+        self.environment_changed: list[str] = []
+        self.run_no_tests: list[str] = []
+        self.rerun: list[str] = []
+
+        self.need_rerun: list[TestResult] = []
+        self.first_state: str | None = None
         self.interrupted = False
-        self.stats_dict: dict[str, TestStats] = {}
+        self.total_stats = TestStats()
 
         # used by --slow
         self.test_times = []
@@ -94,7 +89,7 @@ class Regrtest:
 
         # used to display the progress bar "[ 3/100]"
         self.start_time = time.perf_counter()
-        self.test_count = ''
+        self.test_count_text = ''
         self.test_count_width = 1
 
         # used by --single
@@ -107,7 +102,6 @@ class Regrtest:
         # misc
         self.win_load_tracker = None
         self.tmp_dir = None
-        self.worker_test_name = None
 
     def get_executed(self):
         return (set(self.good) | set(self.bad) | set(self.skipped)
@@ -115,11 +109,9 @@ class Regrtest:
                 | set(self.run_no_tests))
 
     def accumulate_result(self, result, rerun=False):
+        fail_env_changed = self.ns.fail_env_changed
         test_name = result.test_name
 
-        if result.has_meaningful_duration() and not rerun:
-            self.test_times.append((result.duration, test_name))
-
         match result.state:
             case State.PASSED:
                 self.good.append(test_name)
@@ -128,25 +120,24 @@ class Regrtest:
             case State.SKIPPED:
                 self.skipped.append(test_name)
             case State.RESOURCE_DENIED:
-                self.skipped.append(test_name)
                 self.resource_denied.append(test_name)
             case State.INTERRUPTED:
                 self.interrupted = True
             case State.DID_NOT_RUN:
                 self.run_no_tests.append(test_name)
             case _:
-                if result.is_failed(self.ns.fail_env_changed):
-                    if not rerun:
-                        self.bad.append(test_name)
-                        self.need_rerun.append(result)
+                if result.is_failed(fail_env_changed):
+                    self.bad.append(test_name)
+                    self.need_rerun.append(result)
                 else:
-                    raise ValueError(f"invalid test state: {state!r}")
+                    raise ValueError(f"invalid test state: {result.state!r}")
 
+        if result.has_meaningful_duration() and not rerun:
+            self.test_times.append((result.duration, test_name))
         if result.stats is not None:
-            self.stats_dict[result.test_name] = result.stats
-
-        if rerun and not(result.is_failed(False) or result.state == State.INTERRUPTED):
-            self.bad.remove(test_name)
+            self.total_stats.accumulate(result.stats)
+        if rerun:
+            self.rerun.append(test_name)
 
         xml_data = result.xml_data
         if xml_data:
@@ -180,13 +171,15 @@ class Regrtest:
         print(line, flush=True)
 
     def display_progress(self, test_index, text):
-        if self.ns.quiet:
+        quiet = self.ns.quiet
+        pgo = self.ns.pgo
+        if quiet:
             return
 
         # "[ 51/405/1] test_tcl passed"
-        line = f"{test_index:{self.test_count_width}}{self.test_count}"
+        line = f"{test_index:{self.test_count_width}}{self.test_count_text}"
         fails = len(self.bad) + len(self.environment_changed)
-        if fails and not self.ns.pgo:
+        if fails and not pgo:
             line = f"{line}/{fails}"
         self.log(f"[{line}] {text}")
 
@@ -196,15 +189,7 @@ class Regrtest:
         if ns.xmlpath:
             support.junit_xml_list = self.testsuite_xml = []
 
-        worker_args = ns.worker_args
-        if worker_args is not None:
-            from test.libregrtest.runtest_mp import parse_worker_args
-            ns, test_name = parse_worker_args(ns.worker_args)
-            ns.worker_args = worker_args
-            self.worker_test_name = test_name
-
-        # Strip .py extensions.
-        removepy(ns.args)
+        strip_py_suffix(ns.args)
 
         if ns.huntrleaks:
             warmup, repetitions, _ = ns.huntrleaks
@@ -221,9 +206,18 @@ class Regrtest:
         self.ns = ns
 
     def find_tests(self, tests):
+        ns = self.ns
+        single = ns.single
+        fromfile = ns.fromfile
+        pgo = ns.pgo
+        exclude = ns.exclude
+        test_dir = ns.testdir
+        starting_test = ns.start
+        randomize = ns.randomize
+
         self.tests = tests
 
-        if self.ns.single:
+        if single:
             self.next_single_filename = os.path.join(self.tmp_dir, 'pynexttest')
             try:
                 with open(self.next_single_filename, 'r') as fp:
@@ -232,12 +226,12 @@ class Regrtest:
             except OSError:
                 pass
 
-        if self.ns.fromfile:
+        if fromfile:
             self.tests = []
             # regex to match 'test_builtin' in line:
             # '0:00:00 [  4/400] test_builtin -- test_dict took 1 sec'
             regex = re.compile(r'\btest_[a-zA-Z0-9_]+\b')
-            with open(os.path.join(os_helper.SAVEDCWD, self.ns.fromfile)) as fp:
+            with open(os.path.join(os_helper.SAVEDCWD, fromfile)) as fp:
                 for line in fp:
                     line = line.split('#', 1)[0]
                     line = line.strip()
@@ -245,22 +239,22 @@ class Regrtest:
                     if match is not None:
                         self.tests.append(match.group())
 
-        removepy(self.tests)
+        strip_py_suffix(self.tests)
 
-        if self.ns.pgo:
+        if pgo:
             # add default PGO tests if no tests are specified
-            setup_pgo_tests(self.ns)
+            setup_pgo_tests(ns)
 
-        exclude = set()
-        if self.ns.exclude:
-            for arg in self.ns.args:
-                exclude.add(arg)
-            self.ns.args = []
+        exclude_tests = set()
+        if exclude:
+            for arg in ns.args:
+                exclude_tests.add(arg)
+            ns.args = []
 
-        alltests = findtests(testdir=self.ns.testdir, exclude=exclude)
+        alltests = findtests(testdir=test_dir, exclude=exclude_tests)
 
-        if not self.ns.fromfile:
-            self.selected = self.tests or self.ns.args
+        if not fromfile:
+            self.selected = self.tests or ns.args
             if self.selected:
                 self.selected = split_test_packages(self.selected)
             else:
@@ -268,7 +262,7 @@ class Regrtest:
         else:
             self.selected = self.tests
 
-        if self.ns.single:
+        if single:
             self.selected = self.selected[:1]
             try:
                 pos = alltests.index(self.selected[0])
@@ -277,17 +271,17 @@ class Regrtest:
                 pass
 
         # Remove all the selected tests that precede start if it's set.
-        if self.ns.start:
+        if starting_test:
             try:
-                del self.selected[:self.selected.index(self.ns.start)]
+                del self.selected[:self.selected.index(starting_test)]
             except ValueError:
-                print("Couldn't find starting test (%s), using all tests"
-                      % self.ns.start, file=sys.stderr)
+                print(f"Cannot find starting test: {starting_test}")
+                sys.exit(1)
 
-        if self.ns.randomize:
-            if self.ns.random_seed is None:
-                self.ns.random_seed = random.randrange(10000000)
-            random.seed(self.ns.random_seed)
+        if randomize:
+            if ns.random_seed is None:
+                ns.random_seed = random.randrange(10000000)
+            random.seed(ns.random_seed)
             random.shuffle(self.selected)
 
     def list_tests(self):
@@ -305,25 +299,63 @@ class Regrtest:
                     print(test.id())
 
     def list_cases(self):
+        ns = self.ns
+        test_dir = ns.testdir
         support.verbose = False
-        support.set_match_tests(self.ns.match_tests, self.ns.ignore_tests)
+        support.set_match_tests(ns.match_tests, ns.ignore_tests)
 
+        skipped = []
         for test_name in self.selected:
-            abstest = get_abs_module(self.ns, test_name)
+            module_name = abs_module_name(test_name, test_dir)
             try:
-                suite = unittest.defaultTestLoader.loadTestsFromName(abstest)
+                suite = unittest.defaultTestLoader.loadTestsFromName(module_name)
                 self._list_cases(suite)
             except unittest.SkipTest:
-                self.skipped.append(test_name)
+                skipped.append(test_name)
 
-        if self.skipped:
-            print(file=sys.stderr)
-            print(count(len(self.skipped), "test"), "skipped:", file=sys.stderr)
-            printlist(self.skipped, file=sys.stderr)
+        if skipped:
+            sys.stdout.flush()
+            stderr = sys.stderr
+            print(file=stderr)
+            print(count(len(skipped), "test"), "skipped:", file=stderr)
+            printlist(skipped, file=stderr)
 
-    def rerun_failed_tests(self):
-        self.log()
+    def get_rerun_match(self, rerun_list) -> MatchTestsDict:
+        rerun_match_tests = {}
+        for result in rerun_list:
+            match_tests = result.get_rerun_match_tests()
+            # ignore empty match list
+            if match_tests:
+                rerun_match_tests[result.test_name] = match_tests
+        return rerun_match_tests
+
+    def _rerun_failed_tests(self, need_rerun):
+        # Configure the runner to re-run tests
+        ns = self.ns
+        ns.verbose = True
+        ns.failfast = False
+        ns.verbose3 = False
+        ns.forever = False
+        if ns.use_mp is None:
+            ns.use_mp = 1
+
+        # Get tests to re-run
+        tests = [result.test_name for result in need_rerun]
+        match_tests = self.get_rerun_match(need_rerun)
+        self.set_tests(tests)
+
+        # Clear previously failed tests
+        self.rerun_bad.extend(self.bad)
+        self.bad.clear()
+        self.need_rerun.clear()
+
+        # Re-run failed tests
+        self.log(f"Re-running {len(tests)} failed tests in verbose mode in subprocesses")
+        runtests = RunTests(tests, match_tests=match_tests, rerun=True)
+        self.all_runtests.append(runtests)
+        self._run_tests_mp(runtests)
 
+    def rerun_failed_tests(self, need_rerun):
         if self.ns.python:
             # Temp patch for https://github.com/python/cpython/issues/94052
             self.log(
@@ -332,45 +364,10 @@ class Regrtest:
             )
             return
 
-        self.ns.verbose = True
-        self.ns.failfast = False
-        self.ns.verbose3 = False
-
-        self.first_result = self.get_tests_result()
-
-        self.log("Re-running failed tests in verbose mode")
-        rerun_list = list(self.need_rerun)
-        self.need_rerun.clear()
-        for result in rerun_list:
-            test_name = result.test_name
-            self.rerun.append(test_name)
+        self.first_state = self.get_tests_state()
 
-            errors = result.errors or []
-            failures = result.failures or []
-            error_names = [
-                self.normalize_test_name(test_full_name, is_error=True)
-                for (test_full_name, *_) in errors]
-            failure_names = [
-                self.normalize_test_name(test_full_name)
-                for (test_full_name, *_) in failures]
-            self.ns.verbose = True
-            orig_match_tests = self.ns.match_tests
-            if errors or failures:
-                if self.ns.match_tests is None:
-                    self.ns.match_tests = []
-                self.ns.match_tests.extend(error_names)
-                self.ns.match_tests.extend(failure_names)
-                matching = "matching: " + ", ".join(self.ns.match_tests)
-                self.log(f"Re-running {test_name} in verbose mode ({matching})")
-            else:
-                self.log(f"Re-running {test_name} in verbose mode")
-            result = runtest(self.ns, test_name)
-            self.ns.match_tests = orig_match_tests
-
-            self.accumulate_result(result, rerun=True)
-
-            if result.state == State.INTERRUPTED:
-                break
+        print()
+        self._rerun_failed_tests(need_rerun)
 
         if self.bad:
             print(count(len(self.bad), 'test'), "failed again:")
@@ -378,28 +375,17 @@ class Regrtest:
 
         self.display_result()
 
-    def normalize_test_name(self, test_full_name, *, is_error=False):
-        short_name = test_full_name.split(" ")[0]
-        if is_error and short_name in _TEST_LIFECYCLE_HOOKS:
-            # This means that we have a failure in a life-cycle hook,
-            # we need to rerun the whole module or class suite.
-            # Basically the error looks like this:
-            #    ERROR: setUpClass (test.test_reg_ex.RegTest)
-            # or
-            #    ERROR: setUpModule (test.test_reg_ex)
-            # So, we need to parse the class / module name.
-            lpar = test_full_name.index('(')
-            rpar = test_full_name.index(')')
-            return test_full_name[lpar + 1: rpar].split('.')[-1]
-        return short_name
-
     def display_result(self):
+        pgo = self.ns.pgo
+        quiet = self.ns.quiet
+        print_slow = self.ns.print_slow
+
         # If running the test suite for PGO then no one cares about results.
-        if self.ns.pgo:
+        if pgo:
             return
 
         print()
-        print("== Tests result: %s ==" % self.get_tests_result())
+        print("== Tests result: %s ==" % self.get_tests_state())
 
         if self.interrupted:
             print("Test suite interrupted by signal SIGINT.")
@@ -410,7 +396,7 @@ class Regrtest:
             print(count(len(omitted), "test"), "omitted:")
             printlist(omitted)
 
-        if self.good and not self.ns.quiet:
+        if self.good and not quiet:
             print()
             if (not self.bad
                 and not self.skipped
@@ -419,7 +405,7 @@ class Regrtest:
                 print("All", end=' ')
             print(count(len(self.good), "test"), "OK.")
 
-        if self.ns.print_slow:
+        if print_slow:
             self.test_times.sort(reverse=True)
             print()
             print("10 slowest tests:")
@@ -437,11 +423,16 @@ class Regrtest:
                      count(len(self.environment_changed), "test")))
             printlist(self.environment_changed)
 
-        if self.skipped and not self.ns.quiet:
+        if self.skipped and not quiet:
             print()
             print(count(len(self.skipped), "test"), "skipped:")
             printlist(self.skipped)
 
+        if self.resource_denied and not quiet:
+            print()
+            print(count(len(self.resource_denied), "test"), "skipped (resource denied):")
+            printlist(self.resource_denied)
+
         if self.rerun:
             print()
             print("%s:" % count(len(self.rerun), "re-run test"))
@@ -452,40 +443,58 @@ class Regrtest:
             print(count(len(self.run_no_tests), "test"), "run no tests:")
             printlist(self.run_no_tests)
 
-    def run_tests_sequential(self):
-        if self.ns.trace:
+    def run_test(self, test_index, test_name, previous_test, save_modules):
+        text = test_name
+        if previous_test:
+            text = '%s -- %s' % (text, previous_test)
+        self.display_progress(test_index, text)
+
+        if self.tracer:
+            # If we're tracing code coverage, then we don't exit with status
+            # if on a false return value from main.
+            cmd = ('result = runtest(self.ns, test_name); '
+                   'self.accumulate_result(result)')
+            ns = dict(locals())
+            self.tracer.runctx(cmd, globals=globals(), locals=ns)
+            result = ns['result']
+        else:
+            result = runtest(self.ns, test_name)
+            self.accumulate_result(result)
+
+        # Unload the newly imported modules (best effort finalization)
+        for module in sys.modules.keys():
+            if module not in save_modules and module.startswith("test."):
+                support.unload(module)
+
+        return result
+
+    def run_tests_sequentially(self, runtests):
+        ns = self.ns
+        coverage = ns.trace
+        fail_fast = ns.failfast
+        fail_env_changed = ns.fail_env_changed
+        timeout = ns.timeout
+
+        if coverage:
             import trace
             self.tracer = trace.Trace(trace=False, count=True)
 
         save_modules = sys.modules.keys()
 
         msg = "Run tests sequentially"
-        if self.ns.timeout:
-            msg += " (timeout: %s)" % format_duration(self.ns.timeout)
+        if timeout:
+            msg += " (timeout: %s)" % format_duration(timeout)
         self.log(msg)
 
         previous_test = None
-        for test_index, test_name in enumerate(self.tests, 1):
+        tests_iter = runtests.iter_tests()
+        for test_index, test_name in enumerate(tests_iter, 1):
             start_time = time.perf_counter()
 
-            text = test_name
-            if previous_test:
-                text = '%s -- %s' % (text, previous_test)
-            self.display_progress(test_index, text)
-
-            if self.tracer:
-                # If we're tracing code coverage, then we don't exit with status
-                # if on a false return value from main.
-                cmd = ('result = runtest(self.ns, test_name); '
-                       'self.accumulate_result(result)')
-                ns = dict(locals())
-                self.tracer.runctx(cmd, globals=globals(), locals=ns)
-                result = ns['result']
-            else:
-                result = runtest(self.ns, test_name)
-                self.accumulate_result(result)
+            result = self.run_test(test_index, test_name,
+                                   previous_test, save_modules)
 
-            if result.state == State.INTERRUPTED:
+            if result.must_stop(fail_fast, fail_env_changed):
                 break
 
             previous_test = str(result)
@@ -496,26 +505,9 @@ class Regrtest:
                 # be quiet: say nothing if the test passed shortly
                 previous_test = None
 
-            # Unload the newly imported modules (best effort finalization)
-            for module in sys.modules.keys():
-                if module not in save_modules and module.startswith("test."):
-                    support.unload(module)
-
-            if self.ns.failfast and result.is_failed(self.ns.fail_env_changed):
-                break
-
         if previous_test:
             print(previous_test)
 
-    def _test_forever(self, tests):
-        while True:
-            for test_name in tests:
-                yield test_name
-                if self.bad:
-                    return
-                if self.ns.fail_env_changed and self.environment_changed:
-                    return
-
     def display_header(self):
         # Print basic platform information
         print("==", platform.python_implementation(), *sys.version.split())
@@ -560,11 +552,13 @@ class Regrtest:
         return not any((self.good, self.bad, self.skipped, self.interrupted,
                         self.environment_changed))
 
-    def get_tests_result(self):
+    def get_tests_state(self):
+        fail_env_changed = self.ns.fail_env_changed
+
         result = []
         if self.bad:
             result.append("FAILURE")
-        elif self.ns.fail_env_changed and self.environment_changed:
+        elif fail_env_changed and self.environment_changed:
             result.append("ENV CHANGED")
         elif self.no_tests_run():
             result.append("NO TESTS RAN")
@@ -576,10 +570,40 @@ class Regrtest:
             result.append("SUCCESS")
 
         result = ', '.join(result)
-        if self.first_result:
-            result = '%s then %s' % (self.first_result, result)
+        if self.first_state:
+            result = '%s then %s' % (self.first_state, result)
         return result
 
+    def _run_tests_mp(self, runtests: RunTests) -> None:
+        from test.libregrtest.runtest_mp import run_tests_multiprocess
+        # If we're on windows and this is the parent runner (not a worker),
+        # track the load average.
+        if sys.platform == 'win32':
+            from test.libregrtest.win_utils import WindowsLoadTracker
+
+            try:
+                self.win_load_tracker = WindowsLoadTracker()
+            except PermissionError as error:
+                # Standard accounts may not have access to the performance
+                # counters.
+                print(f'Failed to create WindowsLoadTracker: {error}')
+
+        try:
+            run_tests_multiprocess(self, runtests)
+        finally:
+            if self.win_load_tracker is not None:
+                self.win_load_tracker.close()
+                self.win_load_tracker = None
+
+    def set_tests(self, tests):
+        self.tests = tests
+        if self.ns.forever:
+            self.test_count_text = ''
+            self.test_count_width = 3
+        else:
+            self.test_count_text = '/{}'.format(len(self.tests))
+            self.test_count_width = len(self.test_count_text) - 1
+
     def run_tests(self):
         # For a partial run, we do not need to clutter the output.
         if (self.ns.header
@@ -597,37 +621,14 @@ class Regrtest:
         if self.ns.randomize:
             print("Using random seed", self.ns.random_seed)
 
-        if self.ns.forever:
-            self.tests = self._test_forever(list(self.selected))
-            self.test_count = ''
-            self.test_count_width = 3
-        else:
-            self.tests = iter(self.selected)
-            self.test_count = '/{}'.format(len(self.selected))
-            self.test_count_width = len(self.test_count) - 1
-
+        tests = self.selected
+        self.set_tests(tests)
+        runtests = RunTests(tests, forever=self.ns.forever)
+        self.all_runtests.append(runtests)
         if self.ns.use_mp:
-            from test.libregrtest.runtest_mp import run_tests_multiprocess
-            # If we're on windows and this is the parent runner (not a worker),
-            # track the load average.
-            if sys.platform == 'win32' and self.worker_test_name is None:
-                from test.libregrtest.win_utils import WindowsLoadTracker
-
-                try:
-                    self.win_load_tracker = WindowsLoadTracker()
-                except PermissionError as error:
-                    # Standard accounts may not have access to the performance
-                    # counters.
-                    print(f'Failed to create WindowsLoadTracker: {error}')
-
-            try:
-                run_tests_multiprocess(self)
-            finally:
-                if self.win_load_tracker is not None:
-                    self.win_load_tracker.close()
-                    self.win_load_tracker = None
+            self._run_tests_mp(runtests)
         else:
-            self.run_tests_sequential()
+            self.run_tests_sequentially(runtests)
 
     def finalize(self):
         if self.next_single_filename:
@@ -642,23 +643,29 @@ class Regrtest:
             r.write_results(show_missing=True, summary=True,
                             coverdir=self.ns.coverdir)
 
-        print()
-        self.display_summary()
-
         if self.ns.runleaks:
             os.system("leaks %d" % os.getpid())
 
+        self.save_xml_result()
+
     def display_summary(self):
         duration = time.perf_counter() - self.start_time
+        first_runtests = self.all_runtests[0]
+        # the second runtests (re-run failed tests) disables forever,
+        # use the first runtests
+        forever = first_runtests.forever
+        filtered = bool(self.ns.match_tests) or bool(self.ns.ignore_tests)
 
         # Total duration
+        print()
         print("Total duration: %s" % format_duration(duration))
 
         # Total tests
-        total = TestStats()
-        for stats in self.stats_dict.values():
-            total.accumulate(stats)
-        stats = [f'run={total.tests_run:,}']
+        total = self.total_stats
+        text = f'run={total.tests_run:,}'
+        if filtered:
+            text = f"{text} (filtered)"
+        stats = [text]
         if total.failures:
             stats.append(f'failures={total.failures:,}')
         if total.skipped:
@@ -666,23 +673,31 @@ class Regrtest:
         print(f"Total tests: {' '.join(stats)}")
 
         # Total test files
-        report = [f'success={len(self.good)}']
-        if self.bad:
-            report.append(f'failed={len(self.bad)}')
-        if self.environment_changed:
-            report.append(f'env_changed={len(self.environment_changed)}')
-        if self.skipped:
-            report.append(f'skipped={len(self.skipped)}')
-        if self.resource_denied:
-            report.append(f'resource_denied={len(self.resource_denied)}')
-        if self.rerun:
-            report.append(f'rerun={len(self.rerun)}')
-        if self.run_no_tests:
-            report.append(f'run_no_tests={len(self.run_no_tests)}')
+        all_tests = [self.good, self.bad, self.rerun,
+                     self.skipped,
+                     self.environment_changed, self.run_no_tests]
+        run = sum(map(len, all_tests))
+        text = f'run={run}'
+        if not forever:
+            ntest = len(first_runtests.tests)
+            text = f"{text}/{ntest}"
+        if filtered:
+            text = f"{text} (filtered)"
+        report = [text]
+        for name, tests in (
+            ('failed', self.bad),
+            ('env_changed', self.environment_changed),
+            ('skipped', self.skipped),
+            ('resource_denied', self.resource_denied),
+            ('rerun', self.rerun),
+            ('run_no_tests', self.run_no_tests),
+        ):
+            if tests:
+                report.append(f'{name}={len(tests)}')
         print(f"Total test files: {' '.join(report)}")
 
         # Result
-        result = self.get_tests_result()
+        result = self.get_tests_state()
         print(f"Result: {result}")
 
     def save_xml_result(self):
@@ -742,6 +757,9 @@ class Regrtest:
 
         self.tmp_dir = os.path.abspath(self.tmp_dir)
 
+    def is_worker(self):
+        return (self.ns.worker_args is not None)
+
     def create_temp_dir(self):
         os.makedirs(self.tmp_dir, exist_ok=True)
 
@@ -754,7 +772,8 @@ class Regrtest:
             nounce = random.randint(0, 1_000_000)
         else:
             nounce = os.getpid()
-        if self.worker_test_name is not None:
+
+        if self.is_worker():
             test_cwd = 'test_python_worker_{}'.format(nounce)
         else:
             test_cwd = 'test_python_{}'.format(nounce)
@@ -817,48 +836,53 @@ class Regrtest:
 
         return None
 
+    def get_exitcode(self):
+        exitcode = 0
+        if self.bad:
+            exitcode = EXITCODE_BAD_TEST
+        elif self.interrupted:
+            exitcode = EXITCODE_INTERRUPTED
+        elif self.ns.fail_env_changed and self.environment_changed:
+            exitcode = EXITCODE_ENV_CHANGED
+        elif self.no_tests_run():
+            exitcode = EXITCODE_NO_TESTS_RAN
+        elif self.rerun and self.ns.fail_rerun:
+            exitcode = EXITCODE_BAD_TEST
+        return exitcode
+
+    def action_run_tests(self):
+        self.run_tests()
+        self.display_result()
+
+        need_rerun = self.need_rerun
+        if self.ns.rerun and need_rerun:
+            self.rerun_failed_tests(need_rerun)
+
+        self.display_summary()
+        self.finalize()
+
     def _main(self, tests, kwargs):
-        if self.worker_test_name is not None:
+        if self.is_worker():
             from test.libregrtest.runtest_mp import run_tests_worker
-            run_tests_worker(self.ns, self.worker_test_name)
+            run_tests_worker(self.ns.worker_args)
+            return
 
         if self.ns.wait:
             input("Press any key to continue...")
 
-        support.PGO = self.ns.pgo
-        support.PGO_EXTENDED = self.ns.pgo_extended
-
         setup_tests(self.ns)
-
         self.find_tests(tests)
 
+        exitcode = 0
         if self.ns.list_tests:
             self.list_tests()
-            sys.exit(0)
-
-        if self.ns.list_cases:
+        elif self.ns.list_cases:
             self.list_cases()
-            sys.exit(0)
-
-        self.run_tests()
-        self.display_result()
-
-        if self.ns.verbose2 and self.bad:
-            self.rerun_failed_tests()
-
-        self.finalize()
-
-        self.save_xml_result()
+        else:
+            self.action_run_tests()
+            exitcode = self.get_exitcode()
 
-        if self.bad:
-            sys.exit(EXITCODE_BAD_TEST)
-        if self.interrupted:
-            sys.exit(EXITCODE_INTERRUPTED)
-        if self.ns.fail_env_changed and self.environment_changed:
-            sys.exit(EXITCODE_ENV_CHANGED)
-        if self.no_tests_run():
-            sys.exit(EXITCODE_NO_TESTS_RAN)
-        sys.exit(0)
+        sys.exit(exitcode)
 
 
 def main(tests=None, **kwargs):
index 6fa60697371b728a2ba6c689322ba6c5697988e8..6e3fab1a88318f79ebffe30c63eb9009123518e9 100644 (file)
@@ -1,7 +1,6 @@
 import dataclasses
 import doctest
 import faulthandler
-import functools
 import gc
 import importlib
 import io
@@ -20,6 +19,10 @@ from test.libregrtest.save_env import saved_test_environment
 from test.libregrtest.utils import clear_caches, format_duration, print_warning
 
 
+MatchTests = list[str]
+MatchTestsDict = dict[str, MatchTests]
+
+
 # Avoid enum.Enum to reduce the number of imports when tests are run
 class State:
     PASSED = "PASSED"
@@ -56,6 +59,41 @@ class State:
             State.MULTIPROCESSING_ERROR,
             State.DID_NOT_RUN}
 
+    @staticmethod
+    def must_stop(state):
+        return state in {
+            State.INTERRUPTED,
+            State.MULTIPROCESSING_ERROR}
+
+
+# gh-90681: When rerunning tests, we might need to rerun the whole
+# class or module suite if some of its life-cycle hooks fail.
+# Test level hooks are not affected.
+_TEST_LIFECYCLE_HOOKS = frozenset((
+    'setUpClass', 'tearDownClass',
+    'setUpModule', 'tearDownModule',
+))
+
+def normalize_test_name(test_full_name, *, is_error=False):
+    short_name = test_full_name.split(" ")[0]
+    if is_error and short_name in _TEST_LIFECYCLE_HOOKS:
+        if test_full_name.startswith(('setUpModule (', 'tearDownModule (')):
+            # If setUpModule() or tearDownModule() failed, re-run the
+            # whole test file without any test-name filter.
+            return None
+
+        # This means that we have a failure in a life-cycle hook,
+        # we need to rerun the whole module or class suite.
+        # Basically the error looks like this:
+        #    ERROR: setUpClass (test.test_reg_ex.RegTest)
+        # or
+        #    ERROR: setUpModule (test.test_reg_ex)
+        # So, we need to parse the class / module name.
+        lpar = test_full_name.index('(')
+        rpar = test_full_name.index(')')
+        return test_full_name[lpar + 1: rpar].split('.')[-1]
+    return short_name
+
 
 @dataclasses.dataclass(slots=True)
 class TestResult:
@@ -129,6 +167,58 @@ class TestResult:
         if self.state is None or self.state == State.PASSED:
             self.state = State.ENV_CHANGED
 
+    def must_stop(self, fail_fast: bool, fail_env_changed: bool) -> bool:
+        if State.must_stop(self.state):
+            return True
+        if fail_fast and self.is_failed(fail_env_changed):
+            return True
+        return False
+
+    def get_rerun_match_tests(self):
+        match_tests = []
+
+        errors = self.errors or []
+        failures = self.failures or []
+        for error_list, is_error in (
+            (errors, True),
+            (failures, False),
+        ):
+            for full_name, *_ in error_list:
+                match_name = normalize_test_name(full_name, is_error=is_error)
+                if match_name is None:
+                    # 'setUpModule (test.test_sys)': don't filter tests
+                    return None
+                if not match_name:
+                    error_type = "ERROR" if is_error else "FAIL"
+                    print_warning(f"rerun failed to parse {error_type} test name: "
+                                  f"{full_name!r}: don't filter tests")
+                    return None
+                match_tests.append(match_name)
+
+        return match_tests
+
+
+@dataclasses.dataclass(slots=True, frozen=True)
+class RunTests:
+    tests: list[str]
+    match_tests: MatchTestsDict | None = None
+    rerun: bool = False
+    forever: bool = False
+
+    def get_match_tests(self, test_name) -> MatchTests | None:
+        if self.match_tests is not None:
+            return self.match_tests.get(test_name, None)
+        else:
+            return None
+
+    def iter_tests(self):
+        tests = tuple(self.tests)
+        if self.forever:
+            while True:
+                yield from tests
+        else:
+            yield from tests
+
 
 # Minimum duration of a test to display its duration or to mention that
 # the test is running in background
@@ -147,9 +237,6 @@ SPLITTESTDIRS = {
     "test_multiprocessing_spawn",
 }
 
-# Storage of uncollectable objects
-FOUND_GARBAGE = []
-
 
 def findtestdir(path=None):
     return path or os.path.dirname(os.path.dirname(__file__)) or os.curdir
@@ -189,31 +276,41 @@ def split_test_packages(tests, *, testdir=None, exclude=(),
     return splitted
 
 
-def get_abs_module(ns: Namespace, test_name: str) -> str:
-    if test_name.startswith('test.') or ns.testdir:
+def abs_module_name(test_name: str, test_dir: str | None) -> str:
+    if test_name.startswith('test.') or test_dir:
         return test_name
     else:
         # Import it from the test package
         return 'test.' + test_name
 
 
-def _runtest_capture_output_timeout_junit(result: TestResult, ns: Namespace) -> None:
+def setup_support(ns: Namespace):
+    support.PGO = ns.pgo
+    support.PGO_EXTENDED = ns.pgo_extended
+    support.set_match_tests(ns.match_tests, ns.ignore_tests)
+    support.failfast = ns.failfast
+    support.verbose = ns.verbose
+    if ns.xmlpath:
+        support.junit_xml_list = []
+    else:
+        support.junit_xml_list = None
+
+
+def _runtest(result: TestResult, ns: Namespace) -> None:
     # Capture stdout and stderr, set faulthandler timeout,
     # and create JUnit XML report.
-
+    verbose = ns.verbose
     output_on_failure = ns.verbose3
+    timeout = ns.timeout
 
     use_timeout = (
-        ns.timeout is not None and threading_helper.can_start_thread
+        timeout is not None and threading_helper.can_start_thread
     )
     if use_timeout:
-        faulthandler.dump_traceback_later(ns.timeout, exit=True)
+        faulthandler.dump_traceback_later(timeout, exit=True)
 
     try:
-        support.set_match_tests(ns.match_tests, ns.ignore_tests)
-        support.junit_xml_list = xml_list = [] if ns.xmlpath else None
-        if ns.failfast:
-            support.failfast = True
+        setup_support(ns)
 
         if output_on_failure:
             support.verbose = True
@@ -247,11 +344,10 @@ def _runtest_capture_output_timeout_junit(result: TestResult, ns: Namespace) ->
                 sys.stderr.flush()
         else:
             # Tell tests to be moderately quiet
-            support.verbose = ns.verbose
-
-            _runtest_env_changed_exc(result, ns,
-                                     display_failure=not ns.verbose)
+            support.verbose = verbose
+            _runtest_env_changed_exc(result, ns, display_failure=not verbose)
 
+        xml_list = support.junit_xml_list
         if xml_list:
             import xml.etree.ElementTree as ET
             result.xml_data = [ET.tostring(x).decode('us-ascii')
@@ -276,7 +372,7 @@ def runtest(ns: Namespace, test_name: str) -> TestResult:
     start_time = time.perf_counter()
     result = TestResult(test_name)
     try:
-        _runtest_capture_output_timeout_junit(result, ns)
+        _runtest(result, ns)
     except:
         if not ns.pgo:
             msg = traceback.format_exc()
@@ -287,9 +383,9 @@ def runtest(ns: Namespace, test_name: str) -> TestResult:
     return result
 
 
-def _test_module(the_module):
+def run_unittest(test_mod):
     loader = unittest.TestLoader()
-    tests = loader.loadTestsFromModule(the_module)
+    tests = loader.loadTestsFromModule(test_mod)
     for error in loader.errors:
         print(error, file=sys.stderr)
     if loader.errors:
@@ -304,7 +400,6 @@ def save_env(ns: Namespace, test_name: str):
 def regrtest_runner(result, test_func, ns) -> None:
     # Run test_func(), collect statistics, and detect reference and memory
     # leaks.
-
     if ns.huntrleaks:
         from test.libregrtest.refleak import dash_R
         refleak, test_result = dash_R(ns, result.test_name, test_func)
@@ -332,24 +427,27 @@ def regrtest_runner(result, test_func, ns) -> None:
     result.stats = stats
 
 
+# Storage of uncollectable objects
+FOUND_GARBAGE = []
+
+
 def _load_run_test(result: TestResult, ns: Namespace) -> None:
     # Load the test function, run the test function.
+    module_name = abs_module_name(result.test_name, ns.testdir)
 
-    abstest = get_abs_module(ns, result.test_name)
-
-    # remove the module from sys.module to reload it if it was already imported
-    try:
-        del sys.modules[abstest]
-    except KeyError:
-        pass
+    # Remove the module from sys.module to reload it if it was already imported
+    sys.modules.pop(module_name, None)
 
-    the_module = importlib.import_module(abstest)
+    test_mod = importlib.import_module(module_name)
 
     # If the test has a test_main, that will run the appropriate
-    # tests.  If not, use normal unittest test loading.
-    test_func = getattr(the_module, "test_main", None)
-    if test_func is None:
-        test_func = functools.partial(_test_module, the_module)
+    # tests.  If not, use normal unittest test runner.
+    test_main = getattr(test_mod, "test_main", None)
+    if test_main is not None:
+        test_func = test_main
+    else:
+        def test_func():
+            return run_unittest(test_mod)
 
     try:
         with save_env(ns, result.test_name):
@@ -361,12 +459,12 @@ def _load_run_test(result: TestResult, ns: Namespace) -> None:
         # failures.
         support.gc_collect()
 
-        cleanup_test_droppings(result.test_name, ns.verbose)
+        remove_testfn(result.test_name, ns.verbose)
 
     if gc.garbage:
         support.environment_altered = True
         print_warning(f"{result.test_name} created {len(gc.garbage)} "
-                      f"uncollectable object(s).")
+                      f"uncollectable object(s)")
 
         # move the uncollectable objects somewhere,
         # so we don't see them again
@@ -444,35 +542,37 @@ def _runtest_env_changed_exc(result: TestResult, ns: Namespace,
         result.state = State.PASSED
 
 
-def cleanup_test_droppings(test_name: str, verbose: int) -> None:
-    # Try to clean up junk commonly left behind.  While tests shouldn't leave
-    # any files or directories behind, when a test fails that can be tedious
-    # for it to arrange.  The consequences can be especially nasty on Windows,
-    # since if a test leaves a file open, it cannot be deleted by name (while
-    # there's nothing we can do about that here either, we can display the
-    # name of the offending test, which is a real help).
-    for name in (os_helper.TESTFN,):
-        if not os.path.exists(name):
-            continue
+def remove_testfn(test_name: str, verbose: int) -> None:
+    # Try to clean up os_helper.TESTFN if left behind.
+    #
+    # While tests shouldn't leave any files or directories behind, when a test
+    # fails that can be tedious for it to arrange.  The consequences can be
+    # especially nasty on Windows, since if a test leaves a file open, it
+    # cannot be deleted by name (while there's nothing we can do about that
+    # here either, we can display the name of the offending test, which is a
+    # real help).
+    name = os_helper.TESTFN
+    if not os.path.exists(name):
+        return
 
-        if os.path.isdir(name):
-            import shutil
-            kind, nuker = "directory", shutil.rmtree
-        elif os.path.isfile(name):
-            kind, nuker = "file", os.unlink
-        else:
-            raise RuntimeError(f"os.path says {name!r} exists but is neither "
-                               f"directory nor file")
-
-        if verbose:
-            print_warning(f"{test_name} left behind {kind} {name!r}")
-            support.environment_altered = True
-
-        try:
-            import stat
-            # fix possible permissions problems that might prevent cleanup
-            os.chmod(name, stat.S_IRWXU | stat.S_IRWXG | stat.S_IRWXO)
-            nuker(name)
-        except Exception as exc:
-            print_warning(f"{test_name} left behind {kind} {name!r} "
-                          f"and it couldn't be removed: {exc}")
+    if os.path.isdir(name):
+        import shutil
+        kind, nuker = "directory", shutil.rmtree
+    elif os.path.isfile(name):
+        kind, nuker = "file", os.unlink
+    else:
+        raise RuntimeError(f"os.path says {name!r} exists but is neither "
+                           f"directory nor file")
+
+    if verbose:
+        print_warning(f"{test_name} left behind {kind} {name!r}")
+        support.environment_altered = True
+
+    try:
+        import stat
+        # fix possible permissions problems that might prevent cleanup
+        os.chmod(name, stat.S_IRWXU | stat.S_IRWXG | stat.S_IRWXO)
+        nuker(name)
+    except Exception as exc:
+        print_warning(f"{test_name} left behind {kind} {name!r} "
+                      f"and it couldn't be removed: {exc}")
index fb1f80b0c054e3334286731c73ec607d7feadbfe..60089554cab5dd047571cb1b77b40cc2aeebcb13 100644 (file)
@@ -19,8 +19,8 @@ from test.support import TestStats
 from test.libregrtest.cmdline import Namespace
 from test.libregrtest.main import Regrtest
 from test.libregrtest.runtest import (
-    runtest, TestResult, State,
-    PROGRESS_MIN_TIME)
+    runtest, TestResult, State, PROGRESS_MIN_TIME,
+    MatchTests, RunTests)
 from test.libregrtest.setup import setup_tests
 from test.libregrtest.utils import format_duration, print_warning
 
@@ -44,26 +44,54 @@ JOIN_TIMEOUT = 30.0   # seconds
 USE_PROCESS_GROUP = (hasattr(os, "setsid") and hasattr(os, "killpg"))
 
 
-def must_stop(result: TestResult, ns: Namespace) -> bool:
-    if result.state == State.INTERRUPTED:
-        return True
-    if ns.failfast and result.is_failed(ns.fail_env_changed):
-        return True
-    return False
+@dataclasses.dataclass(slots=True)
+class WorkerJob:
+    test_name: str
+    namespace: Namespace
+    rerun: bool = False
+    match_tests: MatchTests | None = None
 
 
-def parse_worker_args(worker_args) -> tuple[Namespace, str]:
-    ns_dict, test_name = json.loads(worker_args)
-    ns = Namespace(**ns_dict)
-    return (ns, test_name)
+class _EncodeWorkerJob(json.JSONEncoder):
+    def default(self, o: Any) -> dict[str, Any]:
+        match o:
+            case WorkerJob():
+                result = dataclasses.asdict(o)
+                result["__worker_job__"] = True
+                return result
+            case Namespace():
+                result = vars(o)
+                result["__namespace__"] = True
+                return result
+            case _:
+                return super().default(o)
+
+
+def _decode_worker_job(d: dict[str, Any]) -> WorkerJob | dict[str, Any]:
+    if "__worker_job__" in d:
+        d.pop('__worker_job__')
+        return WorkerJob(**d)
+    if "__namespace__" in d:
+        d.pop('__namespace__')
+        return Namespace(**d)
+    else:
+        return d
+
+
+def _parse_worker_args(worker_json: str) -> tuple[Namespace, str]:
+    return json.loads(worker_json,
+                      object_hook=_decode_worker_job)
 
 
-def run_test_in_subprocess(testname: str, ns: Namespace, tmp_dir: str, stdout_fh: TextIO) -> subprocess.Popen:
-    ns_dict = vars(ns)
-    worker_args = (ns_dict, testname)
-    worker_args = json.dumps(worker_args)
-    if ns.python is not None:
-        executable = ns.python
+def run_test_in_subprocess(worker_job: WorkerJob,
+                           output_file: TextIO,
+                           tmp_dir: str | None = None) -> subprocess.Popen:
+    ns = worker_job.namespace
+    python = ns.python
+    worker_args = json.dumps(worker_job, cls=_EncodeWorkerJob)
+
+    if python is not None:
+        executable = python
     else:
         executable = [sys.executable]
     cmd = [*executable, *support.args_from_interpreter_flags(),
@@ -82,9 +110,9 @@ def run_test_in_subprocess(testname: str, ns: Namespace, tmp_dir: str, stdout_fh
     # sysconfig.is_python_build() is true. See issue 15300.
     kw = dict(
         env=env,
-        stdout=stdout_fh,
+        stdout=output_file,
         # bpo-45410: Write stderr into stdout to keep messages order
-        stderr=stdout_fh,
+        stderr=output_file,
         text=True,
         close_fds=(os.name != 'nt'),
         cwd=os_helper.SAVEDCWD,
@@ -94,11 +122,27 @@ def run_test_in_subprocess(testname: str, ns: Namespace, tmp_dir: str, stdout_fh
     return subprocess.Popen(cmd, **kw)
 
 
-def run_tests_worker(ns: Namespace, test_name: str) -> NoReturn:
+def run_tests_worker(worker_json: str) -> NoReturn:
+    worker_job = _parse_worker_args(worker_json)
+    ns = worker_job.namespace
+    test_name = worker_job.test_name
+    rerun = worker_job.rerun
+    match_tests = worker_job.match_tests
+
     setup_tests(ns)
 
-    result = runtest(ns, test_name)
+    if rerun:
+        if match_tests:
+            matching = "matching: " + ", ".join(match_tests)
+            print(f"Re-running {test_name} in verbose mode ({matching})", flush=True)
+        else:
+            print(f"Re-running {test_name} in verbose mode", flush=True)
+        ns.verbose = True
 
+    if match_tests is not None:
+        ns.match_tests = match_tests
+
+    result = runtest(ns, test_name)
     print()   # Force a newline (just in case)
 
     # Serialize TestResult as dict in JSON
@@ -148,11 +192,13 @@ class TestWorkerProcess(threading.Thread):
     def __init__(self, worker_id: int, runner: "MultiprocessTestRunner") -> None:
         super().__init__()
         self.worker_id = worker_id
+        self.runtests = runner.runtests
         self.pending = runner.pending
         self.output = runner.output
         self.ns = runner.ns
         self.timeout = runner.worker_timeout
         self.regrtest = runner.regrtest
+        self.rerun = runner.rerun
         self.current_test_name = None
         self.start_time = None
         self._popen = None
@@ -216,10 +262,11 @@ class TestWorkerProcess(threading.Thread):
     ) -> MultiprocessResult:
         return MultiprocessResult(test_result, stdout, err_msg)
 
-    def _run_process(self, test_name: str, tmp_dir: str, stdout_fh: TextIO) -> int:
-        self.current_test_name = test_name
+    def _run_process(self, worker_job, output_file: TextIO,
+                     tmp_dir: str | None = None) -> int:
+        self.current_test_name = worker_job.test_name
         try:
-            popen = run_test_in_subprocess(test_name, self.ns, tmp_dir, stdout_fh)
+            popen = run_test_in_subprocess(worker_job, output_file, tmp_dir)
 
             self._killed = False
             self._popen = popen
@@ -277,9 +324,15 @@ class TestWorkerProcess(threading.Thread):
         else:
             encoding = sys.stdout.encoding
 
+        match_tests = self.runtests.get_match_tests(test_name)
+
         # gh-94026: Write stdout+stderr to a tempfile as workaround for
         # non-blocking pipes on Emscripten with NodeJS.
-        with tempfile.TemporaryFile('w+', encoding=encoding) as stdout_fh:
+        with tempfile.TemporaryFile('w+', encoding=encoding) as stdout_file:
+            worker_job = WorkerJob(test_name,
+                                   namespace=self.ns,
+                                   rerun=self.rerun,
+                                   match_tests=match_tests)
             # gh-93353: Check for leaked temporary files in the parent process,
             # since the deletion of temporary files can happen late during
             # Python finalization: too late for libregrtest.
@@ -290,17 +343,17 @@ class TestWorkerProcess(threading.Thread):
                 tmp_dir = tempfile.mkdtemp(prefix="test_python_")
                 tmp_dir = os.path.abspath(tmp_dir)
                 try:
-                    retcode = self._run_process(test_name, tmp_dir, stdout_fh)
+                    retcode = self._run_process(worker_job, stdout_file, tmp_dir)
                 finally:
                     tmp_files = os.listdir(tmp_dir)
                     os_helper.rmtree(tmp_dir)
             else:
-                retcode = self._run_process(test_name, None, stdout_fh)
+                retcode = self._run_process(worker_job, stdout_file)
                 tmp_files = ()
-            stdout_fh.seek(0)
+            stdout_file.seek(0)
 
             try:
-                stdout = stdout_fh.read().strip()
+                stdout = stdout_file.read().strip()
             except Exception as exc:
                 # gh-101634: Catch UnicodeDecodeError if stdout cannot be
                 # decoded from encoding
@@ -342,6 +395,8 @@ class TestWorkerProcess(threading.Thread):
         return MultiprocessResult(result, stdout)
 
     def run(self) -> None:
+        fail_fast = self.ns.failfast
+        fail_env_changed = self.ns.fail_env_changed
         while not self._stopped:
             try:
                 try:
@@ -354,7 +409,7 @@ class TestWorkerProcess(threading.Thread):
                 mp_result.result.duration = time.monotonic() - self.start_time
                 self.output.put((False, mp_result))
 
-                if must_stop(mp_result.result, self.ns):
+                if mp_result.result.must_stop(fail_fast, fail_env_changed):
                     break
             except ExitThread:
                 break
@@ -410,29 +465,36 @@ def get_running(workers: list[TestWorkerProcess]) -> list[TestWorkerProcess]:
 
 
 class MultiprocessTestRunner:
-    def __init__(self, regrtest: Regrtest) -> None:
+    def __init__(self, regrtest: Regrtest, runtests: RunTests) -> None:
+        ns = regrtest.ns
+        timeout = ns.timeout
+
         self.regrtest = regrtest
+        self.runtests = runtests
+        self.rerun = runtests.rerun
         self.log = self.regrtest.log
-        self.ns = regrtest.ns
+        self.ns = ns
         self.output: queue.Queue[QueueOutput] = queue.Queue()
-        self.pending = MultiprocessIterator(self.regrtest.tests)
-        if self.ns.timeout is not None:
+        tests_iter = runtests.iter_tests()
+        self.pending = MultiprocessIterator(tests_iter)
+        if timeout is not None:
             # Rely on faulthandler to kill a worker process. This timeout is
             # used when faulthandler fails to kill a worker process. Give a
             # maximum of 5 minutes to faulthandler to kill the worker.
-            self.worker_timeout = min(self.ns.timeout * 1.5,
-                                      self.ns.timeout + 5 * 60)
+            self.worker_timeout = min(timeout * 1.5, timeout + 5 * 60)
         else:
             self.worker_timeout = None
         self.workers = None
 
     def start_workers(self) -> None:
+        use_mp = self.ns.use_mp
+        timeout = self.ns.timeout
         self.workers = [TestWorkerProcess(index, self)
-                        for index in range(1, self.ns.use_mp + 1)]
+                        for index in range(1, use_mp + 1)]
         msg = f"Run tests in parallel using {len(self.workers)} child processes"
-        if self.ns.timeout:
+        if timeout:
             msg += (" (timeout: %s, worker timeout: %s)"
-                    % (format_duration(self.ns.timeout),
+                    % (format_duration(timeout),
                        format_duration(self.worker_timeout)))
         self.log(msg)
         for worker in self.workers:
@@ -446,6 +508,7 @@ class MultiprocessTestRunner:
             worker.wait_stopped(start_time)
 
     def _get_result(self) -> QueueOutput | None:
+        pgo = self.ns.pgo
         use_faulthandler = (self.ns.timeout is not None)
         timeout = PROGRESS_UPDATE
 
@@ -464,7 +527,7 @@ class MultiprocessTestRunner:
 
             # display progress
             running = get_running(self.workers)
-            if running and not self.ns.pgo:
+            if running and not pgo:
                 self.log('running: %s' % ', '.join(running))
 
         # all worker threads are done: consume pending results
@@ -475,42 +538,46 @@ class MultiprocessTestRunner:
 
     def display_result(self, mp_result: MultiprocessResult) -> None:
         result = mp_result.result
+        pgo = self.ns.pgo
 
         text = str(result)
         if mp_result.err_msg:
             # MULTIPROCESSING_ERROR
             text += ' (%s)' % mp_result.err_msg
-        elif (result.duration >= PROGRESS_MIN_TIME and not self.ns.pgo):
+        elif (result.duration >= PROGRESS_MIN_TIME and not pgo):
             text += ' (%s)' % format_duration(result.duration)
         running = get_running(self.workers)
-        if running and not self.ns.pgo:
+        if running and not pgo:
             text += ' -- running: %s' % ', '.join(running)
         self.regrtest.display_progress(self.test_index, text)
 
-    def _process_result(self, item: QueueOutput) -> bool:
-        """Returns True if test runner must stop."""
+    def _process_result(self, item: QueueOutput) -> TestResult:
+        """Process a worker result and return it as a TestResult."""
+        rerun = self.runtests.rerun
         if item[0]:
             # Thread got an exception
             format_exc = item[1]
             print_warning(f"regrtest worker thread failed: {format_exc}")
             result = TestResult("<regrtest worker>", state=State.MULTIPROCESSING_ERROR)
-            self.regrtest.accumulate_result(result)
-            return True
+            self.regrtest.accumulate_result(result, rerun=rerun)
+            return result
 
         self.test_index += 1
         mp_result = item[1]
-        self.regrtest.accumulate_result(mp_result.result)
+        result = mp_result.result
+        self.regrtest.accumulate_result(result, rerun=rerun)
         self.display_result(mp_result)
 
         if mp_result.worker_stdout:
             print(mp_result.worker_stdout, flush=True)
 
-        if must_stop(mp_result.result, self.ns):
-            return True
-
-        return False
+        return result
 
     def run_tests(self) -> None:
+        fail_fast = self.ns.failfast
+        fail_env_changed = self.ns.fail_env_changed
+        timeout = self.ns.timeout
+
         self.start_workers()
 
         self.test_index = 0
@@ -520,14 +587,14 @@ class MultiprocessTestRunner:
                 if item is None:
                     break
 
-                stop = self._process_result(item)
-                if stop:
+                result = self._process_result(item)
+                if result.must_stop(fail_fast, fail_env_changed):
                     break
         except KeyboardInterrupt:
             print()
             self.regrtest.interrupted = True
         finally:
-            if self.ns.timeout is not None:
+            if timeout is not None:
                 faulthandler.cancel_dump_traceback_later()
 
             # Always ensure that all worker processes are no longer
@@ -536,8 +603,8 @@ class MultiprocessTestRunner:
             self.stop_workers()
 
 
-def run_tests_multiprocess(regrtest: Regrtest) -> None:
-    MultiprocessTestRunner(regrtest).run_tests()
+def run_tests_multiprocess(regrtest: Regrtest, runtests: RunTests) -> None:
+    MultiprocessTestRunner(regrtest, runtests).run_tests()
 
 
 class EncodeTestResult(json.JSONEncoder):
@@ -552,7 +619,7 @@ class EncodeTestResult(json.JSONEncoder):
         return super().default(o)
 
 
-def decode_test_result(d: dict[str, Any]) -> TestResult | TestStats | dict[str, Any]:
+def decode_test_result(d: dict[str, Any]) -> TestResult | dict[str, Any]:
     """Decode a TestResult (sub)class object from a JSON dict."""
 
     if "__test_result__" not in d:
index 89a149ec5d6b366693a528e12ac72ae09d3f729f..9a60a3d40b4c2cb12f0d2796c96f600fcd1b6bd7 100644 (file)
@@ -31,7 +31,7 @@ def format_duration(seconds):
     return ' '.join(parts)
 
 
-def removepy(names):
+def strip_py_suffix(names: list[str]):
     if not names:
         return
     for idx, name in enumerate(names):
index f28a3a2632c1c5233dc77a8f53a921a3db48915a..7bac1160fd8e0a02ccae945748cfa5fd5db05d43 100644 (file)
@@ -1189,7 +1189,6 @@ def _is_full_match_test(pattern):
 def set_match_tests(accept_patterns=None, ignore_patterns=None):
     global _match_test_func, _accept_test_patterns, _ignore_test_patterns
 
-
     if accept_patterns is None:
         accept_patterns = ()
     if ignore_patterns is None:
index 14474be222dc4b30e2a526dc4c921113395210af..de23fdd59ded957736f0ce63e1c43acaf7eb7f49 100644 (file)
@@ -8,6 +8,7 @@ import sys
 import time
 import traceback
 import unittest
+from test import support
 
 class RegressionTestResult(unittest.TextTestResult):
     USE_XML = False
@@ -112,6 +113,8 @@ class RegressionTestResult(unittest.TextTestResult):
     def addFailure(self, test, err):
         self._add_result(test, True, failure=self.__makeErrorDict(*err))
         super().addFailure(test, err)
+        if support.failfast:
+            self.stop()
 
     def addSkip(self, test, reason):
         self._add_result(test, skipped=reason)
index 1c02d802c0b061c01cb62f3c2637eb2cfe6393dd..eb321c4ca05f1a839eb9ba97cb16905e8bf08017 100644 (file)
@@ -5,6 +5,7 @@ Note: test_regrtest cannot be run twice in parallel.
 """
 
 import contextlib
+import dataclasses
 import glob
 import io
 import locale
@@ -21,6 +22,7 @@ from test import libregrtest
 from test import support
 from test.support import os_helper, TestStats
 from test.libregrtest import utils, setup
+from test.libregrtest.runtest import normalize_test_name
 
 if not support.has_subprocess_support:
     raise unittest.SkipTest("test module requires subprocess")
@@ -96,11 +98,11 @@ class ParseArgsTestCase(unittest.TestCase):
         ns = libregrtest._parse_args([])
         self.assertEqual(ns.verbose, 0)
 
-    def test_verbose2(self):
-        for opt in '-w', '--verbose2':
+    def test_rerun(self):
+        for opt in '-w', '--rerun', '--verbose2':
             with self.subTest(opt=opt):
                 ns = libregrtest._parse_args([opt])
-                self.assertTrue(ns.verbose2)
+                self.assertTrue(ns.rerun)
 
     def test_verbose3(self):
         for opt in '-W', '--verbose3':
@@ -362,6 +364,13 @@ class ParseArgsTestCase(unittest.TestCase):
                         'unrecognized arguments: --unknown-option')
 
 
+@dataclasses.dataclass(slots=True)
+class Rerun:
+    name: str
+    match: str | None
+    success: bool
+
+
 class BaseTestCase(unittest.TestCase):
     TEST_UNIQUE_ID = 1
     TESTNAME_PREFIX = 'test_regrtest_'
@@ -423,11 +432,11 @@ class BaseTestCase(unittest.TestCase):
 
     def check_executed_tests(self, output, tests, skipped=(), failed=(),
                              env_changed=(), omitted=(),
-                             rerun={}, run_no_tests=(),
+                             rerun=None, run_no_tests=(),
                              resource_denied=(),
                              randomize=False, interrupted=False,
                              fail_env_changed=False,
-                             *, stats):
+                             *, stats, forever=False, filtered=False):
         if isinstance(tests, str):
             tests = [tests]
         if isinstance(skipped, str):
@@ -445,11 +454,20 @@ class BaseTestCase(unittest.TestCase):
         if isinstance(stats, int):
             stats = TestStats(stats)
 
+        rerun_failed = []
+        if rerun is not None:
+            failed = [rerun.name]
+            if not rerun.success:
+                rerun_failed.append(rerun.name)
+
         executed = self.parse_executed_tests(output)
+        total_tests = list(tests)
+        if rerun is not None:
+            total_tests.append(rerun.name)
         if randomize:
-            self.assertEqual(set(executed), set(tests), output)
+            self.assertEqual(set(executed), set(total_tests), output)
         else:
-            self.assertEqual(executed, tests, output)
+            self.assertEqual(executed, total_tests, output)
 
         def plural(count):
             return 's' if count != 1 else ''
@@ -465,6 +483,10 @@ class BaseTestCase(unittest.TestCase):
             regex = list_regex('%s test%s skipped', skipped)
             self.check_line(output, regex)
 
+        if resource_denied:
+            regex = list_regex(r'%s test%s skipped \(resource denied\)', resource_denied)
+            self.check_line(output, regex)
+
         if failed:
             regex = list_regex('%s test%s failed', failed)
             self.check_line(output, regex)
@@ -478,32 +500,36 @@ class BaseTestCase(unittest.TestCase):
             regex = list_regex('%s test%s omitted', omitted)
             self.check_line(output, regex)
 
-        if rerun:
-            regex = list_regex('%s re-run test%s', rerun.keys())
+        if rerun is not None:
+            regex = list_regex('%s re-run test%s', [rerun.name])
             self.check_line(output, regex)
-            regex = LOG_PREFIX + r"Re-running failed tests in verbose mode"
+            regex = LOG_PREFIX + r"Re-running 1 failed tests in verbose mode"
+            self.check_line(output, regex)
+            regex = fr"Re-running {rerun.name} in verbose mode"
+            if rerun.match:
+                regex = fr"{regex} \(matching: {rerun.match}\)"
             self.check_line(output, regex)
-            for name, match in rerun.items():
-                regex = LOG_PREFIX + f"Re-running {name} in verbose mode \\(matching: {match}\\)"
-                self.check_line(output, regex)
 
         if run_no_tests:
             regex = list_regex('%s test%s run no tests', run_no_tests)
             self.check_line(output, regex)
 
-        good = (len(tests) - len(skipped) - len(failed)
+        good = (len(tests) - len(skipped) - len(resource_denied) - len(failed)
                 - len(omitted) - len(env_changed) - len(run_no_tests))
         if good:
-            regex = r'%s test%s OK\.$' % (good, plural(good))
-            if not skipped and not failed and good > 1:
+            regex = r'%s test%s OK\.' % (good, plural(good))
+            if not skipped and not failed and (rerun is None or rerun.success) and good > 1:
                 regex = 'All %s' % regex
-            self.check_line(output, regex)
+            self.check_line(output, regex, full=True)
 
         if interrupted:
             self.check_line(output, 'Test suite interrupted by signal SIGINT.')
 
         # Total tests
-        parts = [f'run={stats.tests_run:,}']
+        text = f'run={stats.tests_run:,}'
+        if filtered:
+            text = fr'{text} \(filtered\)'
+        parts = [text]
         if stats.failures:
             parts.append(f'failures={stats.failures:,}')
         if stats.skipped:
@@ -512,39 +538,52 @@ class BaseTestCase(unittest.TestCase):
         self.check_line(output, line, full=True)
 
         # Total test files
-        report = [f'success={good}']
-        if failed:
-            report.append(f'failed={len(failed)}')
-        if env_changed:
-            report.append(f'env_changed={len(env_changed)}')
-        if skipped:
-            report.append(f'skipped={len(skipped)}')
-        if resource_denied:
-            report.append(f'resource_denied={len(resource_denied)}')
-        if rerun:
-            report.append(f'rerun={len(rerun)}')
-        if run_no_tests:
-            report.append(f'run_no_tests={len(run_no_tests)}')
+        run = len(total_tests) - len(resource_denied)
+        if rerun is not None:
+            total_failed = len(rerun_failed)
+            total_rerun = 1
+        else:
+            total_failed = len(failed)
+            total_rerun = 0
+        if interrupted:
+            run = 0
+        text = f'run={run}'
+        if not forever:
+            text = f'{text}/{len(tests)}'
+        if filtered:
+            text = fr'{text} \(filtered\)'
+        report = [text]
+        for name, ntest in (
+            ('failed', total_failed),
+            ('env_changed', len(env_changed)),
+            ('skipped', len(skipped)),
+            ('resource_denied', len(resource_denied)),
+            ('rerun', total_rerun),
+            ('run_no_tests', len(run_no_tests)),
+        ):
+            if ntest:
+                report.append(f'{name}={ntest}')
         line = fr'Total test files: {" ".join(report)}'
         self.check_line(output, line, full=True)
 
         # Result
-        result = []
+        state = []
         if failed:
-            result.append('FAILURE')
+            state.append('FAILURE')
         elif fail_env_changed and env_changed:
-            result.append('ENV CHANGED')
+            state.append('ENV CHANGED')
         if interrupted:
-            result.append('INTERRUPTED')
-        if not any((good, result, failed, interrupted, skipped,
+            state.append('INTERRUPTED')
+        if not any((good, failed, interrupted, skipped,
                     env_changed, fail_env_changed)):
-            result.append("NO TESTS RAN")
-        elif not result:
-            result.append('SUCCESS')
-        result = ', '.join(result)
-        if rerun:
-            result = 'FAILURE then %s' % result
-        self.check_line(output, f'Result: {result}', full=True)
+            state.append("NO TESTS RAN")
+        elif not state:
+            state.append('SUCCESS')
+        state = ', '.join(state)
+        if rerun is not None:
+            new_state = 'SUCCESS' if rerun.success else 'FAILURE'
+            state = 'FAILURE then ' + new_state
+        self.check_line(output, f'Result: {state}', full=True)
 
     def parse_random_seed(self, output):
         match = self.regex_search(r'Using random seed ([0-9]+)', output)
@@ -563,13 +602,13 @@ class BaseTestCase(unittest.TestCase):
                               stdout=subprocess.PIPE,
                               **kw)
         if proc.returncode != exitcode:
-            msg = ("Command %s failed with exit code %s\n"
+            msg = ("Command %s failed with exit code %s, but exit code %s expected!\n"
                    "\n"
                    "stdout:\n"
                    "---\n"
                    "%s\n"
                    "---\n"
-                   % (str(args), proc.returncode, proc.stdout))
+                   % (str(args), proc.returncode, exitcode, proc.stdout))
             if proc.stderr:
                 msg += ("\n"
                         "stderr:\n"
@@ -738,6 +777,40 @@ class ArgsTestCase(BaseTestCase):
         cmdargs = ['-m', 'test', '--testdir=%s' % self.tmptestdir, *testargs]
         return self.run_python(cmdargs, **kw)
 
+    def test_success(self):
+        code = textwrap.dedent("""
+            import unittest
+
+            class PassingTests(unittest.TestCase):
+                def test_test1(self):
+                    pass
+
+                def test_test2(self):
+                    pass
+
+                def test_test3(self):
+                    pass
+        """)
+        tests = [self.create_test(f'ok{i}', code=code) for i in range(1, 6)]
+
+        output = self.run_tests(*tests)
+        self.check_executed_tests(output, tests,
+                                  stats=3 * len(tests))
+
+    def test_skip(self):
+        code = textwrap.dedent("""
+            import unittest
+            raise unittest.SkipTest("nope")
+        """)
+        test_ok = self.create_test('ok')
+        test_skip = self.create_test('skip', code=code)
+        tests = [test_ok, test_skip]
+
+        output = self.run_tests(*tests)
+        self.check_executed_tests(output, tests,
+                                  skipped=[test_skip],
+                                  stats=1)
+
     def test_failing_test(self):
         # test a failing test
         code = textwrap.dedent("""
@@ -777,14 +850,12 @@ class ArgsTestCase(BaseTestCase):
         # -u audio: 1 resource enabled
         output = self.run_tests('-uaudio', *test_names)
         self.check_executed_tests(output, test_names,
-                                  skipped=tests['network'],
                                   resource_denied=tests['network'],
                                   stats=1)
 
         # no option: 0 resources enabled
-        output = self.run_tests(*test_names)
+        output = self.run_tests(*test_names, exitcode=EXITCODE_NO_TESTS_RAN)
         self.check_executed_tests(output, test_names,
-                                  skipped=test_names,
                                   resource_denied=test_names,
                                   stats=0)
 
@@ -930,9 +1001,21 @@ class ArgsTestCase(BaseTestCase):
                         builtins.__dict__['RUN'] = 1
         """)
         test = self.create_test('forever', code=code)
+
+        # --forever
         output = self.run_tests('--forever', test, exitcode=EXITCODE_BAD_TEST)
         self.check_executed_tests(output, [test]*3, failed=test,
-                                  stats=TestStats(1, 1))
+                                  stats=TestStats(3, 1),
+                                  forever=True)
+
+        # --forever --rerun
+        output = self.run_tests('--forever', '--rerun', test, exitcode=0)
+        self.check_executed_tests(output, [test]*3,
+                                  rerun=Rerun(test,
+                                              match='test_run',
+                                              success=True),
+                                  stats=TestStats(4, 1),
+                                  forever=True)
 
     def check_leak(self, code, what):
         test = self.create_test('huntrleaks', code=code)
@@ -1143,33 +1226,55 @@ class ArgsTestCase(BaseTestCase):
         """)
         testname = self.create_test(code=code)
 
-        output = self.run_tests("-w", testname, exitcode=EXITCODE_BAD_TEST)
+        output = self.run_tests("--rerun", testname, exitcode=EXITCODE_BAD_TEST)
         self.check_executed_tests(output, [testname],
-                                  failed=testname,
-                                  rerun={testname: "test_fail_always"},
-                                  stats=TestStats(1, 1))
+                                  rerun=Rerun(testname,
+                                              "test_fail_always",
+                                              success=False),
+                                  stats=TestStats(3, 2))
 
     def test_rerun_success(self):
         # FAILURE then SUCCESS
-        code = textwrap.dedent("""
-            import builtins
+        marker_filename = os.path.abspath("regrtest_marker_filename")
+        self.addCleanup(os_helper.unlink, marker_filename)
+        self.assertFalse(os.path.exists(marker_filename))
+
+        code = textwrap.dedent(f"""
+            import os.path
             import unittest
 
+            marker_filename = {marker_filename!r}
+
             class Tests(unittest.TestCase):
                 def test_succeed(self):
                     return
 
                 def test_fail_once(self):
-                    if not hasattr(builtins, '_test_failed'):
-                        builtins._test_failed = True
+                    if not os.path.exists(marker_filename):
+                        open(marker_filename, "w").close()
                         self.fail("bug")
         """)
         testname = self.create_test(code=code)
 
-        output = self.run_tests("-w", testname, exitcode=0)
+        # FAILURE then SUCCESS => exit code 0
+        output = self.run_tests("--rerun", testname, exitcode=0)
         self.check_executed_tests(output, [testname],
-                                  rerun={testname: "test_fail_once"},
-                                  stats=1)
+                                  rerun=Rerun(testname,
+                                              match="test_fail_once",
+                                              success=True),
+                                  stats=TestStats(3, 1))
+        os_helper.unlink(marker_filename)
+
+        # with --fail-rerun, exit code EXITCODE_BAD_TEST
+        # on "FAILURE then SUCCESS" state.
+        output = self.run_tests("--rerun", "--fail-rerun", testname,
+                                exitcode=EXITCODE_BAD_TEST)
+        self.check_executed_tests(output, [testname],
+                                  rerun=Rerun(testname,
+                                              match="test_fail_once",
+                                              success=True),
+                                  stats=TestStats(3, 1))
+        os_helper.unlink(marker_filename)
 
     def test_rerun_setup_class_hook_failure(self):
         # FAILURE then FAILURE
@@ -1186,10 +1291,12 @@ class ArgsTestCase(BaseTestCase):
         """)
         testname = self.create_test(code=code)
 
-        output = self.run_tests("-w", testname, exitcode=EXITCODE_BAD_TEST)
+        output = self.run_tests("--rerun", testname, exitcode=EXITCODE_BAD_TEST)
         self.check_executed_tests(output, testname,
                                   failed=[testname],
-                                  rerun={testname: "ExampleTests"},
+                                  rerun=Rerun(testname,
+                                              match="ExampleTests",
+                                              success=False),
                                   stats=0)
 
     def test_rerun_teardown_class_hook_failure(self):
@@ -1207,11 +1314,13 @@ class ArgsTestCase(BaseTestCase):
         """)
         testname = self.create_test(code=code)
 
-        output = self.run_tests("-w", testname, exitcode=EXITCODE_BAD_TEST)
+        output = self.run_tests("--rerun", testname, exitcode=EXITCODE_BAD_TEST)
         self.check_executed_tests(output, testname,
                                   failed=[testname],
-                                  rerun={testname: "ExampleTests"},
-                                  stats=1)
+                                  rerun=Rerun(testname,
+                                              match="ExampleTests",
+                                              success=False),
+                                  stats=2)
 
     def test_rerun_setup_module_hook_failure(self):
         # FAILURE then FAILURE
@@ -1227,10 +1336,12 @@ class ArgsTestCase(BaseTestCase):
         """)
         testname = self.create_test(code=code)
 
-        output = self.run_tests("-w", testname, exitcode=EXITCODE_BAD_TEST)
+        output = self.run_tests("--rerun", testname, exitcode=EXITCODE_BAD_TEST)
         self.check_executed_tests(output, testname,
                                   failed=[testname],
-                                  rerun={testname: testname},
+                                  rerun=Rerun(testname,
+                                              match=None,
+                                              success=False),
                                   stats=0)
 
     def test_rerun_teardown_module_hook_failure(self):
@@ -1247,11 +1358,13 @@ class ArgsTestCase(BaseTestCase):
         """)
         testname = self.create_test(code=code)
 
-        output = self.run_tests("-w", testname, exitcode=EXITCODE_BAD_TEST)
-        self.check_executed_tests(output, testname,
+        output = self.run_tests("--rerun", testname, exitcode=EXITCODE_BAD_TEST)
+        self.check_executed_tests(output, [testname],
                                   failed=[testname],
-                                  rerun={testname: testname},
-                                  stats=1)
+                                  rerun=Rerun(testname,
+                                              match=None,
+                                              success=False),
+                                  stats=2)
 
     def test_rerun_setup_hook_failure(self):
         # FAILURE then FAILURE
@@ -1267,11 +1380,13 @@ class ArgsTestCase(BaseTestCase):
         """)
         testname = self.create_test(code=code)
 
-        output = self.run_tests("-w", testname, exitcode=EXITCODE_BAD_TEST)
+        output = self.run_tests("--rerun", testname, exitcode=EXITCODE_BAD_TEST)
         self.check_executed_tests(output, testname,
                                   failed=[testname],
-                                  rerun={testname: "test_success"},
-                                  stats=1)
+                                  rerun=Rerun(testname,
+                                              match="test_success",
+                                              success=False),
+                                  stats=2)
 
     def test_rerun_teardown_hook_failure(self):
         # FAILURE then FAILURE
@@ -1287,11 +1402,13 @@ class ArgsTestCase(BaseTestCase):
         """)
         testname = self.create_test(code=code)
 
-        output = self.run_tests("-w", testname, exitcode=EXITCODE_BAD_TEST)
+        output = self.run_tests("--rerun", testname, exitcode=EXITCODE_BAD_TEST)
         self.check_executed_tests(output, testname,
                                   failed=[testname],
-                                  rerun={testname: "test_success"},
-                                  stats=1)
+                                  rerun=Rerun(testname,
+                                              match="test_success",
+                                              success=False),
+                                  stats=2)
 
     def test_rerun_async_setup_hook_failure(self):
         # FAILURE then FAILURE
@@ -1307,11 +1424,12 @@ class ArgsTestCase(BaseTestCase):
         """)
         testname = self.create_test(code=code)
 
-        output = self.run_tests("-w", testname, exitcode=EXITCODE_BAD_TEST)
+        output = self.run_tests("--rerun", testname, exitcode=EXITCODE_BAD_TEST)
         self.check_executed_tests(output, testname,
-                                  failed=[testname],
-                                  rerun={testname: "test_success"},
-                                  stats=1)
+                                  rerun=Rerun(testname,
+                                              match="test_success",
+                                              success=False),
+                                  stats=2)
 
     def test_rerun_async_teardown_hook_failure(self):
         # FAILURE then FAILURE
@@ -1327,11 +1445,13 @@ class ArgsTestCase(BaseTestCase):
         """)
         testname = self.create_test(code=code)
 
-        output = self.run_tests("-w", testname, exitcode=EXITCODE_BAD_TEST)
+        output = self.run_tests("--rerun", testname, exitcode=EXITCODE_BAD_TEST)
         self.check_executed_tests(output, testname,
                                   failed=[testname],
-                                  rerun={testname: "test_success"},
-                                  stats=1)
+                                  rerun=Rerun(testname,
+                                              match="test_success",
+                                              success=False),
+                                  stats=2)
 
     def test_no_tests_ran(self):
         code = textwrap.dedent("""
@@ -1347,7 +1467,7 @@ class ArgsTestCase(BaseTestCase):
                                 exitcode=EXITCODE_NO_TESTS_RAN)
         self.check_executed_tests(output, [testname],
                                   run_no_tests=testname,
-                                  stats=0)
+                                  stats=0, filtered=True)
 
     def test_no_tests_ran_skip(self):
         code = textwrap.dedent("""
@@ -1378,7 +1498,7 @@ class ArgsTestCase(BaseTestCase):
                                 exitcode=EXITCODE_NO_TESTS_RAN)
         self.check_executed_tests(output, [testname, testname2],
                                   run_no_tests=[testname, testname2],
-                                  stats=0)
+                                  stats=0, filtered=True)
 
     def test_no_test_ran_some_test_exist_some_not(self):
         code = textwrap.dedent("""
@@ -1402,7 +1522,7 @@ class ArgsTestCase(BaseTestCase):
                                 "-m", "test_other_bug", exitcode=0)
         self.check_executed_tests(output, [testname, testname2],
                                   run_no_tests=[testname],
-                                  stats=1)
+                                  stats=1, filtered=True)
 
     @support.cpython_only
     def test_uncollectable(self):
@@ -1719,6 +1839,17 @@ class TestUtils(unittest.TestCase):
         self.assertEqual(utils.format_duration(3 * 3600 + 1),
                          '3 hour 1 sec')
 
+    def test_normalize_test_name(self):
+        normalize = normalize_test_name
+        self.assertEqual(normalize('test_access (test.test_os.FileTests.test_access)'),
+                         'test_access')
+        self.assertEqual(normalize('setUpClass (test.test_os.ChownFileTests)', is_error=True),
+                         'ChownFileTests')
+        self.assertEqual(normalize('test_success (test.test_bug.ExampleTests.test_success)', is_error=True),
+                         'test_success')
+        self.assertIsNone(normalize('setUpModule (test.test_x)', is_error=True))
+        self.assertIsNone(normalize('tearDownModule (test.test_module)', is_error=True))
+
 
 if __name__ == '__main__':
     unittest.main()
diff --git a/Misc/NEWS.d/next/Tests/2023-09-03-02-01-55.gh-issue-108834.iAwXzj.rst b/Misc/NEWS.d/next/Tests/2023-09-03-02-01-55.gh-issue-108834.iAwXzj.rst
new file mode 100644 (file)
index 0000000..43b9948
--- /dev/null
@@ -0,0 +1,6 @@
+When regrtest reruns failed tests in verbose mode (``./python -m test
+--rerun``), tests are now rerun in fresh worker processes rather than being
+executed in the main process. If a test crashes or is killed by a timeout,
+the main process can detect and handle the dead worker process. Tests are
+rerun in parallel if the ``-jN`` option is used.
+Patch by Victor Stinner.
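
A minimal sketch of the mechanism this entry describes -- the helper name and
the timeout handling are illustrative assumptions, not the actual libregrtest
code; only ``python -m test -v <test_name>`` mirrors the real command line.
Re-running the failed test in a fresh child interpreter means a crash or hang
only takes down the child, and the parent can still write its final report:

    import subprocess
    import sys

    def rerun_in_fresh_process(test_name: str,
                               timeout: float | None = None) -> int:
        # Spawn a fresh interpreter that runs only the failed test in
        # verbose mode; the parent survives even if this child crashes.
        try:
            proc = subprocess.run(
                [sys.executable, '-m', 'test', '-v', test_name],
                timeout=timeout,
            )
        except subprocess.TimeoutExpired:
            return 1  # treat a hung child as a failure and keep reporting
        return proc.returncode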
diff --git a/Misc/NEWS.d/next/Tests/2023-09-03-06-17-12.gh-issue-108834.fjV-CJ.rst b/Misc/NEWS.d/next/Tests/2023-09-03-06-17-12.gh-issue-108834.fjV-CJ.rst
new file mode 100644 (file)
index 0000000..734cc66
--- /dev/null
@@ -0,0 +1,2 @@
+Rename regrtest ``--verbose2`` option (``-w``) to ``--rerun``. Keep
+``--verbose2`` as a deprecated alias. Patch by Victor Stinner.
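
As a sketch of how a renamed flag can keep its old spelling usable (plain
argparse; the wiring below is an assumption, not the actual cmdline.py
change): both option strings can write to the same destination, with the
deprecated alias suppressed from ``--help``.

    import argparse

    parser = argparse.ArgumentParser()
    parser.add_argument('-w', '--rerun', action='store_true',
                        help='re-run failed tests in verbose mode')
    # Deprecated alias: stores into the same "rerun" destination but is
    # hidden from the --help output.
    parser.add_argument('--verbose2', action='store_true', dest='rerun',
                        help=argparse.SUPPRESS)

    ns = parser.parse_args(['--verbose2'])
    assert ns.rerun is True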
diff --git a/Misc/NEWS.d/next/Tests/2023-09-03-20-15-49.gh-issue-108834.Osvmhf.rst b/Misc/NEWS.d/next/Tests/2023-09-03-20-15-49.gh-issue-108834.Osvmhf.rst
new file mode 100644 (file)
index 0000000..098861f
--- /dev/null
@@ -0,0 +1,3 @@
+Add ``--fail-rerun`` option to regrtest: if a test failed then passed when
+rerun in verbose mode, exit the process with exit code 2 (error) instead
+of exit code 0 (success). Patch by Victor Stinner.
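
A tiny sketch of the exit-code rule above (the function and its parameters
are hypothetical; ``EXITCODE_BAD_TEST`` is the constant for exit code 2 that
the tests in this change assert against):

    EXITCODE_BAD_TEST = 2

    def final_exit_code(still_failed: int, rerun_passed: int,
                        fail_rerun: bool) -> int:
        # A test that still fails after the rerun always means exit code 2.
        if still_failed:
            return EXITCODE_BAD_TEST
        # With --fail-rerun, "FAILURE then SUCCESS" is reported as an error
        # instead of exit code 0.
        if fail_rerun and rerun_passed:
            return EXITCODE_BAD_TEST
        return 0

    assert final_exit_code(0, rerun_passed=1, fail_rerun=True) == 2
    assert final_exit_code(0, rerun_passed=1, fail_rerun=False) == 0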