libgomp: Enforce tasks executed lexically after scheduled

author Matthew Malcolmson <mmalcolmson@nvidia.com>

Tue, 20 Jan 2026 03:29:04 +0000 (03:29 +0000)

committer Prathamesh Kulkarni <prathameshk@nvidia.com>

Tue, 20 Jan 2026 03:29:04 +0000 (03:29 +0000)
author Matthew Malcolmson <mmalcolmson@nvidia.com>
Tue, 20 Jan 2026 03:29:04 +0000 (03:29 +0000)
committer Prathamesh Kulkarni <prathameshk@nvidia.com>
Tue, 20 Jan 2026 03:29:04 +0000 (03:29 +0000)
diff --git a/libgomp/config/gcn/bar.c b/libgomp/config/gcn/bar.c

index a655015f612db03e97838208ae4e0622318519e6..10c3f5d13623a2cbbef216e02248ada692b02982 100644 (file)
--- a/libgomp/config/gcn/bar.c
+++ b/libgomp/config/gcn/bar.c
@@ -128,7 +128,7 @@ gomp_team_barrier_wait_end (gomp_barrier_t *bar, gomp_barrier_state_t state)
           gen = __atomic_load_n (&bar->generation, MEMMODEL_ACQUIRE);
         }
      }
-  while (gen != state + BAR_INCR);
+  while (!gomp_barrier_state_is_incremented (gen, state));
  }
  
  void
@@ -207,7 +207,7 @@ gomp_team_barrier_wait_cancel_end (gomp_barrier_t *bar,
           gen = __atomic_load_n (&bar->generation, MEMMODEL_RELAXED);
         }
      }
-  while (gen != state + BAR_INCR);
+  while (!gomp_barrier_state_is_incremented (gen, state));
  
    return false;
  }
diff --git a/libgomp/config/gcn/bar.h b/libgomp/config/gcn/bar.h

index 4df46960470e37592dbbdb93113152c7bbfc66fa..0507efb7d2d1320154aac22731a4784a23ea69ae 100644 (file)
--- a/libgomp/config/gcn/bar.h
+++ b/libgomp/config/gcn/bar.h
@@ -165,4 +165,20 @@ gomp_team_barrier_done (gomp_barrier_t *bar, gomp_barrier_state_t state)
    bar->generation = (state & -BAR_INCR) + BAR_INCR;
  }
  
+static inline bool
+gomp_barrier_state_is_incremented (gomp_barrier_state_t gen,
+                                  gomp_barrier_state_t state)
+{
+  unsigned next_state = (state & -BAR_INCR) + BAR_INCR;
+  return next_state > state ? gen >= next_state : gen < state;
+}
+
+static inline bool
+gomp_barrier_has_completed (gomp_barrier_state_t state, gomp_barrier_t *bar)
+{
+  /* Handling overflow in the generation.  The "next" state could be less than
+     or greater than the current one.  */
+  return gomp_barrier_state_is_incremented (bar->generation, state);
+}
+
  #endif /* GOMP_BARRIER_H */
diff --git a/libgomp/config/linux/bar.c b/libgomp/config/linux/bar.c

index e850cebb51f8ff500e60413fa92aa116e5b83d97..2a1b052b11e6ccd569ac2a936b636002366ebf1b 100644 (file)
--- a/libgomp/config/linux/bar.c
+++ b/libgomp/config/linux/bar.c
@@ -118,7 +118,7 @@ gomp_team_barrier_wait_end (gomp_barrier_t *bar, gomp_barrier_state_t state)
         }
        generation |= gen & BAR_WAITING_FOR_TASK;
      }
-  while (gen != state + BAR_INCR);
+  while (!gomp_barrier_state_is_incremented (gen, state));
  }
  
  void
@@ -185,7 +185,7 @@ gomp_team_barrier_wait_cancel_end (gomp_barrier_t *bar,
         }
        generation |= gen & BAR_WAITING_FOR_TASK;
      }
-  while (gen != state + BAR_INCR);
+  while (!gomp_barrier_state_is_incremented (gen, state));
  
    return false;
  }
diff --git a/libgomp/config/linux/bar.h b/libgomp/config/linux/bar.h

index 3ad3111f3ddb624f04bb0af88870dafb88025961..b1fff01105a71b79e4329a1fd74a597be26be122 100644 (file)
--- a/libgomp/config/linux/bar.h
+++ b/libgomp/config/linux/bar.h
@@ -165,4 +165,20 @@ gomp_team_barrier_done (gomp_barrier_t *bar, gomp_barrier_state_t state)
    bar->generation = (state & -BAR_INCR) + BAR_INCR;
  }
  
+static inline bool
+gomp_barrier_state_is_incremented (gomp_barrier_state_t gen,
+                                  gomp_barrier_state_t state)
+{
+  unsigned next_state = (state & -BAR_INCR) + BAR_INCR;
+  return next_state > state ? gen >= next_state : gen < state;
+}
+
+static inline bool
+gomp_barrier_has_completed (gomp_barrier_state_t state, gomp_barrier_t *bar)
+{
+  /* Handling overflow in the generation.  The "next" state could be less than
+     or greater than the current one.  */
+  return gomp_barrier_state_is_incremented (bar->generation, state);
+}
+
  #endif /* GOMP_BARRIER_H */
diff --git a/libgomp/config/nvptx/bar.h b/libgomp/config/nvptx/bar.h

index 2ec1eb0f39b3f59a3ae66995cf8107e86518c828..aa2592ba5b3f433358f693de846889e2a78c81bc 100644 (file)
--- a/libgomp/config/nvptx/bar.h
+++ b/libgomp/config/nvptx/bar.h
@@ -169,4 +169,20 @@ gomp_team_barrier_done (gomp_barrier_t *bar, gomp_barrier_state_t state)
    bar->generation = (state & -BAR_INCR) + BAR_INCR;
  }
  
+static inline bool
+gomp_barrier_state_is_incremented (gomp_barrier_state_t gen,
+                                  gomp_barrier_state_t state)
+{
+  unsigned next_state = (state & -BAR_INCR) + BAR_INCR;
+  return next_state > state ? gen >= next_state : gen < state;
+}
+
+static inline bool
+gomp_barrier_has_completed (gomp_barrier_state_t state, gomp_barrier_t *bar)
+{
+  /* Handling overflow in the generation.  The "next" state could be less than
+     or greater than the current one.  */
+  return gomp_barrier_state_is_incremented (bar->generation, state);
+}
+
  #endif /* GOMP_BARRIER_H */
diff --git a/libgomp/config/posix/bar.c b/libgomp/config/posix/bar.c

index 31451cd8bfa7033e9501d32fa0944f706b7359d1..ce69905ba6744c1e3b90fa36587fcdd6715608cf 100644 (file)
--- a/libgomp/config/posix/bar.c
+++ b/libgomp/config/posix/bar.c
@@ -156,7 +156,7 @@ gomp_team_barrier_wait_end (gomp_barrier_t *bar, gomp_barrier_state_t state)
               gen = __atomic_load_n (&bar->generation, MEMMODEL_ACQUIRE);
             }
         }
-      while (gen != state + BAR_INCR);
+      while (!gomp_barrier_state_is_incremented (gen, state));
  
  #ifdef HAVE_SYNC_BUILTINS
        n = __sync_add_and_fetch (&bar->arrived, -1);
@@ -228,7 +228,7 @@ gomp_team_barrier_wait_cancel_end (gomp_barrier_t *bar,
                 break;
             }
         }
-      while (gen != state + BAR_INCR);
+      while (!gomp_barrier_state_is_incremented (gen, state));
  
  #ifdef HAVE_SYNC_BUILTINS
        n = __sync_add_and_fetch (&bar->arrived, -1);
diff --git a/libgomp/config/posix/bar.h b/libgomp/config/posix/bar.h

index 33d25592daa2de8d31bb49f456f7269964c24ce4..5a175c228c260d37b0952b75fd5e0367cfc44041 100644 (file)
--- a/libgomp/config/posix/bar.h
+++ b/libgomp/config/posix/bar.h
@@ -155,4 +155,20 @@ gomp_team_barrier_done (gomp_barrier_t *bar, gomp_barrier_state_t state)
    bar->generation = (state & -BAR_INCR) + BAR_INCR;
  }
  
+static inline bool
+gomp_barrier_state_is_incremented (gomp_barrier_state_t gen,
+                                  gomp_barrier_state_t state)
+{
+  unsigned next_state = (state & -BAR_INCR) + BAR_INCR;
+  return next_state > state ? gen >= next_state : gen < state;
+}
+
+static inline bool
+gomp_barrier_has_completed (gomp_barrier_state_t state, gomp_barrier_t *bar)
+{
+  /* Handling overflow in the generation.  The "next" state could be less than
+     or greater than the current one.  */
+  return gomp_barrier_state_is_incremented (bar->generation, state);
+}
+
  #endif /* GOMP_BARRIER_H */
diff --git a/libgomp/config/rtems/bar.h b/libgomp/config/rtems/bar.h

index 27326db9c77cf205bb21a9cf849a0ff56acff6b5..61fa91f300f2e94999bc02b218c18a37997df15b 100644 (file)
--- a/libgomp/config/rtems/bar.h
+++ b/libgomp/config/rtems/bar.h
@@ -167,4 +167,20 @@ gomp_team_barrier_done (gomp_barrier_t *bar, gomp_barrier_state_t state)
    bar->generation = (state & -BAR_INCR) + BAR_INCR;
  }
  
+static inline bool
+gomp_barrier_state_is_incremented (gomp_barrier_state_t gen,
+                                  gomp_barrier_state_t state)
+{
+  unsigned next_state = (state & -BAR_INCR) + BAR_INCR;
+  return next_state > state ? gen >= next_state : gen < state;
+}
+
+static inline bool
+gomp_barrier_has_completed (gomp_barrier_state_t state, gomp_barrier_t *bar)
+{
+  /* Handling overflow in the generation.  The "next" state could be less than
+     or greater than the current one.  */
+  return gomp_barrier_state_is_incremented (bar->generation, state);
+}
+
  #endif /* GOMP_BARRIER_H */
diff --git a/libgomp/task.c b/libgomp/task.c

index a6f21b05687f66e57f4a1a36435f8996f1432693..554636aadd5c8b6e08cc7179fe4c17aad9c56722 100644 (file)
--- a/libgomp/task.c
+++ b/libgomp/task.c
@@ -1559,6 +1559,23 @@ gomp_barrier_handle_tasks (gomp_barrier_state_t state)
    int do_wake = 0;
  
    gomp_mutex_lock (&team->task_lock);
+  /* Avoid running tasks from next task scheduling region (PR122314).
+     N.b. we check that `team->task_count != 0` in order to avoid the
+     non-atomic read of `bar->generation` "conflicting" (in the C standard
+     sense) with the atomic write of `bar->generation` in
+     `gomp_team_barrier_wait_end`.  That conflict would otherwise be a
+     data-race and hence UB.  One alternate approach could have been to
+     atomically load `bar->generation` in `gomp_barrier_has_completed`.
+
+     When `task_count == 0` we're not going to perform tasks anyway, so the
+     problem of PR122314 is naturally avoided.  */
+  if (team->task_count != 0
+      && gomp_barrier_has_completed (state, &team->barrier))
+    {
+      gomp_mutex_unlock (&team->task_lock);
+      return;
+    }
+
    if (gomp_barrier_last_thread (state))
      {
        if (team->task_count == 0)
diff --git a/libgomp/testsuite/libgomp.c/pr122314.c b/libgomp/testsuite/libgomp.c/pr122314.c

new file mode 100644 (file)

index 0000000..bb9565d
--- /dev/null
+++ b/libgomp/testsuite/libgomp.c/pr122314.c
@@ -0,0 +1,42 @@
+#include <omp.h>
+
+void abort ();
+
+#define NUM_THREADS 8
+unsigned full_data[NUM_THREADS] = {0};
+#pragma omp declare target enter(full_data)
+
+void
+test ()
+{
+#pragma omp parallel num_threads(8)
+  {
+#pragma omp barrier
+    /* Initialise so that if tasks are performed on the previous barrier their
+       updates get overridden.  This is a key behaviour of this test.  */
+    full_data[omp_get_thread_num ()] = 0;
+#pragma omp for
+    for (int i = 0; i < 10; i++)
+#pragma omp task
+      {
+       full_data[omp_get_thread_num ()] += 1;
+      }
+  }
+
+  unsigned total = 0;
+  for (int i = 0; i < NUM_THREADS; i++)
+    total += full_data[i];
+
+  if (total != 10)
+    abort ();
+}
+#pragma omp declare target enter(test)
+
+int
+main ()
+{
+  test ();
+
+#pragma omp target
+  test ();
+}
author	Matthew Malcolmson <mmalcolmson@nvidia.com>
	Tue, 20 Jan 2026 03:29:04 +0000 (03:29 +0000)
committer	Prathamesh Kulkarni <prathameshk@nvidia.com>
	Tue, 20 Jan 2026 03:29:04 +0000 (03:29 +0000)
libgomp/config/gcn/bar.c		patch \| blob \| blame \| history
libgomp/config/gcn/bar.h		patch \| blob \| blame \| history
libgomp/config/linux/bar.c		patch \| blob \| blame \| history
libgomp/config/linux/bar.h		patch \| blob \| blame \| history
libgomp/config/nvptx/bar.h		patch \| blob \| blame \| history
libgomp/config/posix/bar.c		patch \| blob \| blame \| history
libgomp/config/posix/bar.h		patch \| blob \| blame \| history
libgomp/config/rtems/bar.h		patch \| blob \| blame \| history
libgomp/task.c		patch \| blob \| blame \| history
libgomp/testsuite/libgomp.c/pr122314.c	[new file with mode: 0644]	patch \| blob