runtests: add retry option to reduce flakiness

author Viktor Szakats <commit@vsz.me>

Thu, 17 Apr 2025 14:25:37 +0000 (16:25 +0200)

committer Viktor Szakats <commit@vsz.me>

Sat, 19 Apr 2025 08:41:58 +0000 (10:41 +0200)
author Viktor Szakats <commit@vsz.me>
Thu, 17 Apr 2025 14:25:37 +0000 (16:25 +0200)
committer Viktor Szakats <commit@vsz.me>
Sat, 19 Apr 2025 08:41:58 +0000 (10:41 +0200)
diff --git a/tests/CMakeLists.txt b/tests/CMakeLists.txt

index 12ed61275f234b1acaf591571f0e219325644408..5fb7b764b014919259e06e6f21a3150839ce1e6d 100644 (file)
--- a/tests/CMakeLists.txt
+++ b/tests/CMakeLists.txt
@@ -103,7 +103,7 @@ curl_add_runtests(test-am        "-a -am")
  curl_add_runtests(test-full      "-a -p -r")
  # ~flaky means that it ignores results of tests using the flaky keyword
  curl_add_runtests(test-nonflaky  "-a -p ~flaky ~timing-dependent")
-curl_add_runtests(test-ci        "-a -p ~flaky ~timing-dependent -r -j20")
+curl_add_runtests(test-ci        "-a -p ~flaky ~timing-dependent -r --retry=5 -j20")
  curl_add_runtests(test-torture   "-a -t -j20")
  curl_add_runtests(test-event     "-a -e")
  
diff --git a/tests/Makefile.am b/tests/Makefile.am

index b885a7edd08a209738648cf76d9aa450f29b6387..8c40bc3a1a52fcfd32fc2fea3263f121838f71a4 100644 (file)
--- a/tests/Makefile.am
+++ b/tests/Makefile.am
@@ -142,7 +142,7 @@ TEST_E = -a -e
  TEST_NF = -a -p ~flaky ~timing-dependent
  
  # special CI target derived from nonflaky with CI-specific flags
-TEST_CI = $(TEST_NF) -r -j20
+TEST_CI = $(TEST_NF) -r --retry=5 -j20
  
  PYTEST = pytest
  endif
diff --git a/tests/runtests.md b/tests/runtests.md

index 60b1c293812dd69bd2c0017d3e24917a4872deb6..346ce5aca1f268c1dae00f873b9cb5055064a2ac 100644 (file)
--- a/tests/runtests.md
+++ b/tests/runtests.md
@@ -228,6 +228,10 @@ sequence at the end of the initially given one.
  If **-R** option is also used, the scrambling is done after the repeats have
  extended the test sequence.
  
+## `--retry=[num]`
+
+Number of attempts for the whole test run to retry failed tests.
+
  ## `-s`
  
  Shorter output. Speaks less than default.
diff --git a/tests/runtests.pl b/tests/runtests.pl

index a3c6c2d8b20dde0cedcc5aecd63fc97f6637ee81..fde25538eedde73397508c1475ed4e99741dbc02 100755 (executable)
--- a/tests/runtests.pl
+++ b/tests/runtests.pl
@@ -123,6 +123,7 @@ my $TESTCASES="all";
  
  my $libtool;
  my $repeat = 0;
+my $retry = 0;
  
  my $start;          # time at which testing started
  my $args;           # command-line arguments
@@ -2353,6 +2354,10 @@ while(@ARGV) {
          # Repeat-run the given tests this many times
          $repeat = $1;
      }
+    elsif($ARGV[0] =~ /--retry=(\d+)/) {
+        # Number of attempts for the whole test run to retry failed tests
+        $retry = $1;
+    }
      elsif($ARGV[0] =~ /--seed=(\d+)/) {
          # Set a fixed random seed (used for -R and --shallow)
          $randseed = $1;
@@ -2461,6 +2466,7 @@ Usage: runtests.pl [options] [test selection(s)]
    -r       run time statistics
    -rf      full run time statistics
    --repeat=[num] run the given tests this many times
+  --retry=[num] number of attempts for the whole test run to retry failed tests
    -s       short output
    --seed=[num] set the random seed to a fixed number
    --shallow=[num] randomly makes the torture tests "thinner"
@@ -2875,9 +2881,12 @@ sub displaylogs {
  
  my $failed;
  my $failedign;
+my $failedre;
  my $ok=0;
  my $ign=0;
  my $total=0;
+my $executed=0;
+my $retry_done=0;
  my $lasttest=0;
  my @at = split(" ", $TESTCASES);
  my $count=0;
@@ -2925,6 +2934,16 @@ createrunners($numrunners);
  
  # run through each candidate test and execute it
  my $runner_wait_cnt = 0;
+
+# number of retry attempts for the whole test run
+my $retry_left;
+if($torture) {
+    $retry_left = 0;  # No use of retrying torture tests
+}
+else {
+    $retry_left = $retry;
+}
+
  while () {
      # check the abort flag
      if($globalabort) {
@@ -3014,6 +3033,7 @@ while () {
                      }
  
                      $total++; # number of tests we've run
+                    $executed++;
  
                      if($error>0) {
                          if($error==2) {
@@ -3021,7 +3041,17 @@ while () {
                              $failedign .= "$testnum ";
                          }
                          else {
-                            $failed.= "$testnum ";
+                            # make another attempt to counteract flaky failures
+                            if($retry_left > 0) {
+                                $retry_left--;
+                                $retry_done++;
+                                $total--;
+                                push(@runtests, $testnum);
+                                $failedre .= "$testnum ";
+                            }
+                            else {
+                                $failed.= "$testnum ";
+                            }
                          }
                          if($postmortem) {
                              # display all files in $LOGDIR/ in a nice way
@@ -3176,7 +3206,15 @@ sub testnumdetails {
      }
  }
  
-if($total) {
+if($executed) {
+    if($failedre) {
+        my $sorted = numsortwords($failedre);
+        logmsg "::group::Failed Retried Test details\n";
+        testnumdetails("FAIL-RETRIED", $sorted);
+        logmsg "RETRIED: failed tests: $sorted\n";
+        logmsg "::endgroup::\n";
+    }
+
      if($passedign) {
          my $sorted = numsortwords($passedign);
          logmsg "::group::Passed Ignored Test details\n";
author	Viktor Szakats <commit@vsz.me>
	Thu, 17 Apr 2025 14:25:37 +0000 (16:25 +0200)
committer	Viktor Szakats <commit@vsz.me>
	Sat, 19 Apr 2025 08:41:58 +0000 (10:41 +0200)
tests/CMakeLists.txt		patch \| blob \| blame \| history
tests/Makefile.am		patch \| blob \| blame \| history
tests/runtests.md		patch \| blob \| blame \| history
tests/runtests.pl		patch \| blob \| blame \| history