openmp: allocate clause vs. *reduction array sections [PR97670]

author Jakub Jelinek <jakub@redhat.com>

Wed, 4 Nov 2020 08:37:22 +0000 (09:37 +0100)

committer Jakub Jelinek <jakub@redhat.com>

Wed, 4 Nov 2020 09:02:01 +0000 (10:02 +0100)
author Jakub Jelinek <jakub@redhat.com>
Wed, 4 Nov 2020 08:37:22 +0000 (09:37 +0100)
committer Jakub Jelinek <jakub@redhat.com>
Wed, 4 Nov 2020 09:02:01 +0000 (10:02 +0100)
diff --git a/gcc/c-family/c-omp.c b/gcc/c-family/c-omp.c

index bce2f8e076f46885f18eeaee948daac7cc4aa097..da5564be5badc6a8903a511f2fd87c6081181e81 100644 (file)
--- a/gcc/c-family/c-omp.c
+++ b/gcc/c-family/c-omp.c
@@ -2289,13 +2289,36 @@ c_omp_split_clauses (location_t loc, enum tree_code code,
             for (c = cclauses[i]; c; c = OMP_CLAUSE_CHAIN (c))
               switch (OMP_CLAUSE_CODE (c))
                 {
+               case OMP_CLAUSE_REDUCTION:
+               case OMP_CLAUSE_IN_REDUCTION:
+               case OMP_CLAUSE_TASK_REDUCTION:
+                 if (TREE_CODE (OMP_CLAUSE_DECL (c)) == MEM_REF)
+                   {
+                     tree t = TREE_OPERAND (OMP_CLAUSE_DECL (c), 0);
+                     if (TREE_CODE (t) == POINTER_PLUS_EXPR)
+                       t = TREE_OPERAND (t, 0);
+                     if (TREE_CODE (t) == ADDR_EXPR
+                         || TREE_CODE (t) == INDIRECT_REF)
+                       t = TREE_OPERAND (t, 0);
+                     if (DECL_P (t))
+                       bitmap_clear_bit (&allocate_head, DECL_UID (t));
+                     break;
+                   }
+                 else if (TREE_CODE (OMP_CLAUSE_DECL (c)) == TREE_LIST)
+                   {
+                     tree t;
+                     for (t = OMP_CLAUSE_DECL (c);
+                          TREE_CODE (t) == TREE_LIST; t = TREE_CHAIN (t))
+                       ;
+                     if (DECL_P (t))
+                       bitmap_clear_bit (&allocate_head, DECL_UID (t));
+                     break;
+                   }
+                 /* FALLTHRU */
                 case OMP_CLAUSE_PRIVATE:
                 case OMP_CLAUSE_FIRSTPRIVATE:
                 case OMP_CLAUSE_LASTPRIVATE:
                 case OMP_CLAUSE_LINEAR:
-               case OMP_CLAUSE_REDUCTION:
-               case OMP_CLAUSE_IN_REDUCTION:
-               case OMP_CLAUSE_TASK_REDUCTION:
                   if (DECL_P (OMP_CLAUSE_DECL (c)))
                     bitmap_clear_bit (&allocate_head,
                                       DECL_UID (OMP_CLAUSE_DECL (c)));
diff --git a/gcc/c/c-typeck.c b/gcc/c/c-typeck.c

index 0d75ed4f8b1f5fad39aab687aab15e76f87a737b..2bf46f44c6e379d74343395edb3fdd6ae6f646ff 100644 (file)
--- a/gcc/c/c-typeck.c
+++ b/gcc/c/c-typeck.c
@@ -15153,13 +15153,26 @@ c_finish_omp_clauses (tree clauses, enum c_omp_region_type ort)
         if (allocate_seen)
           switch (OMP_CLAUSE_CODE (c))
             {
+           case OMP_CLAUSE_REDUCTION:
+           case OMP_CLAUSE_IN_REDUCTION:
+           case OMP_CLAUSE_TASK_REDUCTION:
+             if (TREE_CODE (OMP_CLAUSE_DECL (c)) == MEM_REF)
+               {
+                 t = TREE_OPERAND (OMP_CLAUSE_DECL (c), 0);
+                 if (TREE_CODE (t) == POINTER_PLUS_EXPR)
+                   t = TREE_OPERAND (t, 0);
+                 if (TREE_CODE (t) == ADDR_EXPR
+                     || TREE_CODE (t) == INDIRECT_REF)
+                   t = TREE_OPERAND (t, 0);
+                 if (DECL_P (t))
+                   bitmap_clear_bit (&aligned_head, DECL_UID (t));
+                 break;
+               }
+             /* FALLTHRU */
             case OMP_CLAUSE_PRIVATE:
             case OMP_CLAUSE_FIRSTPRIVATE:
             case OMP_CLAUSE_LASTPRIVATE:
             case OMP_CLAUSE_LINEAR:
-           case OMP_CLAUSE_REDUCTION:
-           case OMP_CLAUSE_IN_REDUCTION:
-           case OMP_CLAUSE_TASK_REDUCTION:
               if (DECL_P (OMP_CLAUSE_DECL (c)))
                 bitmap_clear_bit (&aligned_head,
                                   DECL_UID (OMP_CLAUSE_DECL (c)));
diff --git a/gcc/cp/semantics.c b/gcc/cp/semantics.c

index 352ebe03436f23e574e748570c6dc724e79038b7..a550db694881714c080d30262ad55265f89345d2 100644 (file)
--- a/gcc/cp/semantics.c
+++ b/gcc/cp/semantics.c
@@ -8190,17 +8190,11 @@ finish_omp_clauses (tree clauses, enum c_omp_region_type ort)
         }
  
        t = OMP_CLAUSE_DECL (c);
-      if (processing_template_decl
-         && !VAR_P (t) && TREE_CODE (t) != PARM_DECL)
-       {
-         pc = &OMP_CLAUSE_CHAIN (c);
-         continue;
-       }
-
        switch (c_kind)
         {
         case OMP_CLAUSE_LASTPRIVATE:
-         if (!bitmap_bit_p (&firstprivate_head, DECL_UID (t)))
+         if (DECL_P (t)
+             && !bitmap_bit_p (&firstprivate_head, DECL_UID (t)))
             {
               need_default_ctor = true;
               need_dtor = true;
@@ -8210,6 +8204,34 @@ finish_omp_clauses (tree clauses, enum c_omp_region_type ort)
         case OMP_CLAUSE_REDUCTION:
         case OMP_CLAUSE_IN_REDUCTION:
         case OMP_CLAUSE_TASK_REDUCTION:
+         if (allocate_seen)
+           {
+             if (TREE_CODE (t) == MEM_REF)
+               {
+                 t = TREE_OPERAND (t, 0);
+                 if (TREE_CODE (t) == POINTER_PLUS_EXPR)
+                   t = TREE_OPERAND (t, 0);
+                 if (TREE_CODE (t) == ADDR_EXPR
+                     || TREE_CODE (t) == INDIRECT_REF)
+                   t = TREE_OPERAND (t, 0);
+                 if (DECL_P (t))
+                   bitmap_clear_bit (&aligned_head, DECL_UID (t));
+               }
+             else if (TREE_CODE (t) == TREE_LIST)
+               {
+                 while (TREE_CODE (t) == TREE_LIST)
+                   t = TREE_CHAIN (t);
+                 if (DECL_P (t))
+                   bitmap_clear_bit (&aligned_head, DECL_UID (t));
+                 t = OMP_CLAUSE_DECL (c);
+               }
+             else if (DECL_P (t))
+               bitmap_clear_bit (&aligned_head, DECL_UID (t));
+             t = OMP_CLAUSE_DECL (c);
+           }
+         if (processing_template_decl
+             && !VAR_P (t) && TREE_CODE (t) != PARM_DECL)
+           break;
           if (finish_omp_reduction_clause (c, &need_default_ctor,
                                            &need_dtor))
             remove = true;
@@ -8218,6 +8240,9 @@ finish_omp_clauses (tree clauses, enum c_omp_region_type ort)
           break;
  
         case OMP_CLAUSE_COPYIN:
+         if (processing_template_decl
+             && !VAR_P (t) && TREE_CODE (t) != PARM_DECL)
+           break;
           if (!VAR_P (t) || !CP_DECL_THREAD_LOCAL_P (t))
             {
               error_at (OMP_CLAUSE_LOCATION (c),
@@ -8230,6 +8255,13 @@ finish_omp_clauses (tree clauses, enum c_omp_region_type ort)
           break;
         }
  
+      if (processing_template_decl
+         && !VAR_P (t) && TREE_CODE (t) != PARM_DECL)
+       {
+         pc = &OMP_CLAUSE_CHAIN (c);
+         continue;
+       }
+
        if (need_complete_type || need_copy_assignment)
         {
           t = require_complete_type (t);
@@ -8247,8 +8279,7 @@ finish_omp_clauses (tree clauses, enum c_omp_region_type ort)
           if (allocate_seen
               && OMP_CLAUSE_CODE (c) != OMP_CLAUSE_SHARED
               && DECL_P (t))
-           bitmap_clear_bit (&aligned_head,
-                             DECL_UID (OMP_CLAUSE_DECL (c)));
+           bitmap_clear_bit (&aligned_head, DECL_UID (t));
             
           if (VAR_P (t) && CP_DECL_THREAD_LOCAL_P (t))
             share_name = "threadprivate";
@@ -8349,6 +8380,7 @@ finish_omp_clauses (tree clauses, enum c_omp_region_type ort)
         bool remove = false;
         if (OMP_CLAUSE_CODE (c) == OMP_CLAUSE_ALLOCATE
             && !OMP_CLAUSE_ALLOCATE_COMBINED (c)
+           && DECL_P (OMP_CLAUSE_DECL (c))
             && bitmap_bit_p (&aligned_head, DECL_UID (OMP_CLAUSE_DECL (c))))
           {
             error_at (OMP_CLAUSE_LOCATION (c),
diff --git a/gcc/testsuite/c-c++-common/gomp/allocate-4.c b/gcc/testsuite/c-c++-common/gomp/allocate-4.c

new file mode 100644 (file)

index 0000000..4e0f44a
--- /dev/null
+++ b/gcc/testsuite/c-c++-common/gomp/allocate-4.c
@@ -0,0 +1,39 @@
+void
+foo (void)
+{
+  int s[4] = { 0, 0, 0, 0 };
+  int *p = s;
+#pragma omp parallel reduction (+: s) allocate(s)
+  s[0]++;
+#pragma omp parallel reduction (+: s[0:3]) allocate(s)
+  s[0]++;
+#pragma omp parallel reduction (+: s[2:2]) allocate(s)
+  s[2]++;
+#pragma omp parallel reduction (+: p[:2]) allocate(p)
+  p[0]++;
+#pragma omp parallel reduction (+: p[2:2]) allocate(p)
+  p[2]++;
+}
+
+void
+bar (void)
+{
+  int s[4] = { 0, 0, 0, 0 };
+  int *p = s;
+  int i;
+#pragma omp teams distribute parallel for reduction (+: s) allocate(s)
+  for (i = 0; i < 64; i++)
+    s[0]++;
+#pragma omp teams distribute parallel for reduction (+: s[0:3]) allocate(s)
+  for (i = 0; i < 64; i++)
+    s[0]++;
+#pragma omp teams distribute parallel for reduction (+: s[2:2]) allocate(s)
+  for (i = 0; i < 64; i++)
+    s[2]++;
+#pragma omp teams distribute parallel for reduction (+: p[:2]) allocate(p)
+  for (i = 0; i < 64; i++)
+    p[0]++;
+#pragma omp teams distribute parallel for reduction (+: p[2:2]) allocate(p)
+  for (i = 0; i < 64; i++)
+    p[2]++;
+}
diff --git a/gcc/testsuite/g++.dg/gomp/allocate-2.C b/gcc/testsuite/g++.dg/gomp/allocate-2.C

new file mode 100644 (file)

index 0000000..b8cf480
--- /dev/null
+++ b/gcc/testsuite/g++.dg/gomp/allocate-2.C
@@ -0,0 +1,11 @@
+// PR c++/97670
+
+struct S { int s; };
+
+void
+foo ()
+{
+  S s[1] = { S () };
+#pragma omp parallel reduction (+: s) allocate(s)      // { dg-error "user defined reduction not found for 's'" }
+  s[0].s++;
+}
diff --git a/gcc/testsuite/g++.dg/gomp/allocate-3.C b/gcc/testsuite/g++.dg/gomp/allocate-3.C

new file mode 100644 (file)

index 0000000..e778314
--- /dev/null
+++ b/gcc/testsuite/g++.dg/gomp/allocate-3.C
@@ -0,0 +1,206 @@
+template <typename T>
+void
+foo (T &x, T (&y)[4], T *&z, int &u, int (&v)[4], int *&w)
+{
+  T s[4] = { 0, 0, 0, 0 };
+  T *p = s;
+#pragma omp parallel reduction (+: s) allocate(s)
+  s[0]++;
+#pragma omp parallel reduction (+: s[0:3]) allocate(s)
+  s[0]++;
+#pragma omp parallel reduction (+: s[2:2]) allocate(s)
+  s[2]++;
+#pragma omp parallel reduction (+: p[:2]) allocate(p)
+  p[0]++;
+#pragma omp parallel reduction (+: p[2:2]) allocate(p)
+  p[2]++;
+  int s2[4] = { 0, 0, 0, 0 };
+  int *p2 = s2;
+#pragma omp parallel reduction (+: s2) allocate(s2)
+  s2[0]++;
+#pragma omp parallel reduction (+: s2[0:3]) allocate(s2)
+  s2[0]++;
+#pragma omp parallel reduction (+: s2[2:2]) allocate(s2)
+  s2[2]++;
+#pragma omp parallel reduction (+: p2[:2]) allocate(p2)
+  p2[0]++;
+#pragma omp parallel reduction (+: p2[2:2]) allocate(p2)
+  p2[2]++;
+#pragma omp parallel reduction (+: x) allocate(x)
+  x++;
+#pragma omp parallel reduction (+: y) allocate(y)
+  y[0]++;
+#pragma omp parallel reduction (+: y[0:3]) allocate(y)
+  y[0]++;
+#pragma omp parallel reduction (+: y[2:2]) allocate(y)
+  y[2]++;
+#pragma omp parallel reduction (+: z[:2]) allocate(z)
+  z[0]++;
+#pragma omp parallel reduction (+: z[2:2]) allocate(z)
+  z[2]++;
+#pragma omp parallel reduction (+: u) allocate(u)
+  u++;
+#pragma omp parallel reduction (+: v) allocate(v)
+  v[0]++;
+#pragma omp parallel reduction (+: v[0:3]) allocate(v)
+  v[0]++;
+#pragma omp parallel reduction (+: v[2:2]) allocate(v)
+  v[2]++;
+#pragma omp parallel reduction (+: w[:2]) allocate(w)
+  w[0]++;
+#pragma omp parallel reduction (+: w[2:2]) allocate(w)
+  w[2]++;
+}
+
+template <typename T>
+void
+bar (T &x, T (&y)[4], T *&z, int &u, int (&v)[4], int *&w)
+{
+  T s[4] = { 0, 0, 0, 0 };
+  T *p = s;
+  int i;
+#pragma omp teams distribute parallel for reduction (+: s) allocate(s)
+  for (i = 0; i < 64; i++)
+    s[0]++;
+#pragma omp teams distribute parallel for reduction (+: s[0:3]) allocate(s)
+  for (i = 0; i < 64; i++)
+    s[0]++;
+#pragma omp teams distribute parallel for reduction (+: s[2:2]) allocate(s)
+  for (i = 0; i < 64; i++)
+    s[2]++;
+#pragma omp teams distribute parallel for reduction (+: p[:2]) allocate(p)
+  for (i = 0; i < 64; i++)
+    p[0]++;
+#pragma omp teams distribute parallel for reduction (+: p[2:2]) allocate(p)
+  for (i = 0; i < 64; i++)
+    p[2]++;
+  int s2[4] = { 0, 0, 0, 0 };
+  int *p2 = s2;
+#pragma omp teams distribute parallel for reduction (+: s2) allocate(s2)
+  for (i = 0; i < 64; i++)
+    s2[0]++;
+#pragma omp teams distribute parallel for reduction (+: s2[0:3]) allocate(s2)
+  for (i = 0; i < 64; i++)
+    s2[0]++;
+#pragma omp teams distribute parallel for reduction (+: s2[2:2]) allocate(s2)
+  for (i = 0; i < 64; i++)
+    s2[2]++;
+#pragma omp teams distribute parallel for reduction (+: p2[:2]) allocate(p2)
+  for (i = 0; i < 64; i++)
+    p2[0]++;
+#pragma omp teams distribute parallel for reduction (+: p2[2:2]) allocate(p2)
+  for (i = 0; i < 64; i++)
+    p2[2]++;
+#pragma omp teams distribute parallel for reduction (+: x) allocate(x)
+  for (i = 0; i < 64; i++)
+    x++;
+#pragma omp teams distribute parallel for reduction (+: y) allocate(y)
+  for (i = 0; i < 64; i++)
+    y[0]++;
+#pragma omp teams distribute parallel for reduction (+: y[0:3]) allocate(y)
+  for (i = 0; i < 64; i++)
+    y[0]++;
+#pragma omp teams distribute parallel for reduction (+: y[2:2]) allocate(y)
+  for (i = 0; i < 64; i++)
+    y[2]++;
+#pragma omp teams distribute parallel for reduction (+: z[:2]) allocate(z)
+  for (i = 0; i < 64; i++)
+    z[0]++;
+#pragma omp teams distribute parallel for reduction (+: z[2:2]) allocate(z)
+  for (i = 0; i < 64; i++)
+    z[2]++;
+#pragma omp teams distribute parallel for reduction (+: u) allocate(u)
+  for (i = 0; i < 64; i++)
+    u++;
+#pragma omp teams distribute parallel for reduction (+: v) allocate(v)
+  for (i = 0; i < 64; i++)
+    v[0]++;
+#pragma omp teams distribute parallel for reduction (+: v[0:3]) allocate(v)
+  for (i = 0; i < 64; i++)
+    v[0]++;
+#pragma omp teams distribute parallel for reduction (+: v[2:2]) allocate(v)
+  for (i = 0; i < 64; i++)
+    v[2]++;
+#pragma omp teams distribute parallel for reduction (+: w[:2]) allocate(w)
+  for (i = 0; i < 64; i++)
+    w[0]++;
+#pragma omp teams distribute parallel for reduction (+: w[2:2]) allocate(w)
+  for (i = 0; i < 64; i++)
+    w[2]++;
+}
+
+void
+baz (long int &x, long int (&y)[4], long int *&z)
+{
+#pragma omp parallel reduction (+: x) allocate(x)
+  x++;
+#pragma omp parallel reduction (+: y) allocate(y)
+  y[0]++;
+#pragma omp parallel reduction (+: y[0:3]) allocate(y)
+  y[0]++;
+#pragma omp parallel reduction (+: y[2:2]) allocate(y)
+  y[2]++;
+#pragma omp parallel reduction (+: z[:2]) allocate(z)
+  z[0]++;
+#pragma omp parallel reduction (+: z[2:2]) allocate(z)
+  z[2]++;
+}
+
+void
+qux (long long int &x, long long int (&y)[4], long long int *&z)
+{
+  int i;
+#pragma omp teams distribute parallel for reduction (+: x) allocate(x)
+  for (i = 0; i < 64; i++)
+    x++;
+#pragma omp teams distribute parallel for reduction (+: y) allocate(y)
+  for (i = 0; i < 64; i++)
+    y[0]++;
+#pragma omp teams distribute parallel for reduction (+: y[0:3]) allocate(y)
+  for (i = 0; i < 64; i++)
+    y[0]++;
+#pragma omp teams distribute parallel for reduction (+: y[2:2]) allocate(y)
+  for (i = 0; i < 64; i++)
+    y[2]++;
+#pragma omp teams distribute parallel for reduction (+: z[:2]) allocate(z)
+  for (i = 0; i < 64; i++)
+    z[0]++;
+#pragma omp teams distribute parallel for reduction (+: z[2:2]) allocate(z)
+  for (i = 0; i < 64; i++)
+    z[2]++;
+}
+
+void
+test ()
+{
+  long int x = 0;
+  long int y[4] = { 0, 0, 0, 0 };
+  long int *z = y;
+  int u = 0;
+  int v[4] = { 0, 0, 0, 0 };
+  int *w = v;
+  long long int x2 = 0;
+  long long int y2[4] = { 0, 0, 0, 0 };
+  long long int *z2 = y2;
+  foo (x, y, z, u, v, w);
+  bar (x2, y2, z2, u, v, w);
+}
+
+namespace N
+{
+  int a;
+  void foo ()
+  {
+    int i;
+    #pragma omp parallel firstprivate (N::a) allocate (a)
+    a++;
+    #pragma omp parallel firstprivate (a) allocate (N::a)
+    a++;
+    #pragma omp teams distribute parallel for firstprivate (N::a) allocate (a)
+    for (i = 0; i < 64; i++)
+      a++;
+    #pragma omp teams distribute parallel for firstprivate (a) allocate (N::a)
+    for (i = 0; i < 64; i++)
+      a++;
+  }
+}
author	Jakub Jelinek <jakub@redhat.com>
	Wed, 4 Nov 2020 08:37:22 +0000 (09:37 +0100)
committer	Jakub Jelinek <jakub@redhat.com>
	Wed, 4 Nov 2020 09:02:01 +0000 (10:02 +0100)
gcc/c-family/c-omp.c		patch | blob | blame | history
gcc/c/c-typeck.c		patch | blob | blame | history
gcc/cp/semantics.c		patch | blob | blame | history
gcc/testsuite/c-c++-common/gomp/allocate-4.c	[new file with mode: 0644]	patch | blob
gcc/testsuite/g++.dg/gomp/allocate-2.C	[new file with mode: 0644]	patch | blob
gcc/testsuite/g++.dg/gomp/allocate-3.C	[new file with mode: 0644]	patch | blob