]> git.ipfire.org Git - thirdparty/gcc.git/blobdiff - libgomp/oacc-cuda.c
PR libstdc++/90920 restore previous checks for empty ranges
[thirdparty/gcc.git] / libgomp / oacc-cuda.c
index 20774c1b48763b2fb092c07bfe6d6bffea609400..7a42085c877705383215e2bbf1a5a093b8ef4bd7 100644 (file)
@@ -1,6 +1,6 @@
 /* OpenACC Runtime Library: CUDA support glue.
 
-   Copyright (C) 2014-2018 Free Software Foundation, Inc.
+   Copyright (C) 2014-2019 Free Software Foundation, Inc.
 
    Contributed by Mentor Embedded.
 
    <http://www.gnu.org/licenses/>.  */
 
 #include "openacc.h"
-#include "config.h"
 #include "libgomp.h"
 #include "oacc-int.h"
+#include <assert.h>
 
 void *
 acc_get_current_cuda_device (void)
 {
   struct goacc_thread *thr = goacc_thread ();
 
+  void *ret = NULL;
   if (thr && thr->dev && thr->dev->openacc.cuda.get_current_device_func)
-    return thr->dev->openacc.cuda.get_current_device_func ();
+    {
+      acc_prof_info prof_info;
+      acc_api_info api_info;
+      bool profiling_p = GOACC_PROFILING_SETUP_P (thr, &prof_info, &api_info);
 
-  return NULL;
+      ret = thr->dev->openacc.cuda.get_current_device_func ();
+
+      if (profiling_p)
+       {
+         thr->prof_info = NULL;
+         thr->api_info = NULL;
+       }
+    }
+
+  return ret;
 }
 
 void *
@@ -47,10 +60,23 @@ acc_get_current_cuda_context (void)
 {
   struct goacc_thread *thr = goacc_thread ();
 
+  void *ret = NULL;
   if (thr && thr->dev && thr->dev->openacc.cuda.get_current_context_func)
-    return thr->dev->openacc.cuda.get_current_context_func ();
-  return NULL;
+    {
+      acc_prof_info prof_info;
+      acc_api_info api_info;
+      bool profiling_p = GOACC_PROFILING_SETUP_P (thr, &prof_info, &api_info);
+
+      ret = thr->dev->openacc.cuda.get_current_context_func ();
+
+      if (profiling_p)
+       {
+         thr->prof_info = NULL;
+         thr->api_info = NULL;
+       }
+    }
+
+  return ret;
 }
 
 void *
@@ -58,13 +84,35 @@ acc_get_cuda_stream (int async)
 {
   struct goacc_thread *thr = goacc_thread ();
 
-  if (!async_valid_stream_id_p (async))
+  if (!async_valid_p (async))
     return NULL;
 
+  void *ret = NULL;
   if (thr && thr->dev && thr->dev->openacc.cuda.get_stream_func)
-    return thr->dev->openacc.cuda.get_stream_func (async);
-  return NULL;
+    {
+      goacc_aq aq = lookup_goacc_asyncqueue (thr, false, async);
+      if (!aq)
+       return ret;
+
+      acc_prof_info prof_info;
+      acc_api_info api_info;
+      bool profiling_p = GOACC_PROFILING_SETUP_P (thr, &prof_info, &api_info);
+      if (profiling_p)
+       {
+         prof_info.async = async;
+         prof_info.async_queue = prof_info.async;
+       }
+
+      ret = thr->dev->openacc.cuda.get_stream_func (aq);
+
+      if (profiling_p)
+       {
+         thr->prof_info = NULL;
+         thr->api_info = NULL;
+       }
+    }
+
+  return ret;
 }
 
 int
@@ -72,15 +120,47 @@ acc_set_cuda_stream (int async, void *stream)
 {
   struct goacc_thread *thr;
 
-  if (!async_valid_stream_id_p (async) || stream == NULL)
+  if (!async_valid_p (async) || stream == NULL)
     return 0;
 
   goacc_lazy_initialize ();
 
   thr = goacc_thread ();
 
+  int ret = -1;
   if (thr && thr->dev && thr->dev->openacc.cuda.set_stream_func)
-    return thr->dev->openacc.cuda.set_stream_func (async, stream);
-
-  return -1;
+    {
+      acc_prof_info prof_info;
+      acc_api_info api_info;
+      bool profiling_p = GOACC_PROFILING_SETUP_P (thr, &prof_info, &api_info);
+      if (profiling_p)
+       {
+         prof_info.async = async;
+         prof_info.async_queue = prof_info.async;
+       }
+
+      goacc_aq aq = get_goacc_asyncqueue (async);
+      /* Due to not using an asyncqueue for "acc_async_sync", this cannot be
+        used to change the CUDA stream associated with "acc_async_sync".  */
+      if (!aq)
+       {
+         assert (async == acc_async_sync);
+         gomp_debug (0, "Refusing request to set CUDA stream associated"
+                     " with \"acc_async_sync\"\n");
+         ret = 0;
+         goto out_prof;
+       }
+      gomp_mutex_lock (&thr->dev->openacc.async.lock);
+      ret = thr->dev->openacc.cuda.set_stream_func (aq, stream);
+      gomp_mutex_unlock (&thr->dev->openacc.async.lock);
+
+    out_prof:
+      if (profiling_p)
+       {
+         thr->prof_info = NULL;
+         thr->api_info = NULL;
+       }
+    }
+
+  return ret;
 }