123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166 |
- /* OpenACC Runtime Library: CUDA support glue.
- Copyright (C) 2014-2022 Free Software Foundation, Inc.
- Contributed by Mentor Embedded.
- This file is part of the GNU Offloading and Multi Processing Library
- (libgomp).
- Libgomp is free software; you can redistribute it and/or modify it
- under the terms of the GNU General Public License as published by
- the Free Software Foundation; either version 3, or (at your option)
- any later version.
- Libgomp is distributed in the hope that it will be useful, but WITHOUT ANY
- WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
- FOR A PARTICULAR PURPOSE. See the GNU General Public License for
- more details.
- Under Section 7 of GPL version 3, you are granted additional
- permissions described in the GCC Runtime Library Exception, version
- 3.1, as published by the Free Software Foundation.
- You should have received a copy of the GNU General Public License and
- a copy of the GCC Runtime Library Exception along with this program;
- see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
- <http://www.gnu.org/licenses/>. */
- #include "openacc.h"
- #include "libgomp.h"
- #include "oacc-int.h"
- #include <assert.h>
- void *
- acc_get_current_cuda_device (void)
- {
- struct goacc_thread *thr = goacc_thread ();
- void *ret = NULL;
- if (thr && thr->dev && thr->dev->openacc.cuda.get_current_device_func)
- {
- acc_prof_info prof_info;
- acc_api_info api_info;
- bool profiling_p = GOACC_PROFILING_SETUP_P (thr, &prof_info, &api_info);
- ret = thr->dev->openacc.cuda.get_current_device_func ();
- if (profiling_p)
- {
- thr->prof_info = NULL;
- thr->api_info = NULL;
- }
- }
- return ret;
- }
- void *
- acc_get_current_cuda_context (void)
- {
- struct goacc_thread *thr = goacc_thread ();
- void *ret = NULL;
- if (thr && thr->dev && thr->dev->openacc.cuda.get_current_context_func)
- {
- acc_prof_info prof_info;
- acc_api_info api_info;
- bool profiling_p = GOACC_PROFILING_SETUP_P (thr, &prof_info, &api_info);
- ret = thr->dev->openacc.cuda.get_current_context_func ();
- if (profiling_p)
- {
- thr->prof_info = NULL;
- thr->api_info = NULL;
- }
- }
- return ret;
- }
- void *
- acc_get_cuda_stream (int async)
- {
- struct goacc_thread *thr = goacc_thread ();
- if (!async_valid_p (async))
- return NULL;
- void *ret = NULL;
- if (thr && thr->dev && thr->dev->openacc.cuda.get_stream_func)
- {
- goacc_aq aq = lookup_goacc_asyncqueue (thr, false, async);
- if (!aq)
- return ret;
- acc_prof_info prof_info;
- acc_api_info api_info;
- bool profiling_p = GOACC_PROFILING_SETUP_P (thr, &prof_info, &api_info);
- if (profiling_p)
- {
- prof_info.async = async;
- prof_info.async_queue = prof_info.async;
- }
- ret = thr->dev->openacc.cuda.get_stream_func (aq);
- if (profiling_p)
- {
- thr->prof_info = NULL;
- thr->api_info = NULL;
- }
- }
- return ret;
- }
- int
- acc_set_cuda_stream (int async, void *stream)
- {
- struct goacc_thread *thr;
- if (!async_valid_p (async) || stream == NULL)
- return 0;
- goacc_lazy_initialize ();
- thr = goacc_thread ();
- int ret = -1;
- if (thr && thr->dev && thr->dev->openacc.cuda.set_stream_func)
- {
- acc_prof_info prof_info;
- acc_api_info api_info;
- bool profiling_p = GOACC_PROFILING_SETUP_P (thr, &prof_info, &api_info);
- if (profiling_p)
- {
- prof_info.async = async;
- prof_info.async_queue = prof_info.async;
- }
- goacc_aq aq = get_goacc_asyncqueue (async);
- /* Due to not using an asyncqueue for "acc_async_sync", this cannot be
- used to change the CUDA stream associated with "acc_async_sync". */
- if (!aq)
- {
- assert (async == acc_async_sync);
- gomp_debug (0, "Refusing request to set CUDA stream associated"
- " with \"acc_async_sync\"\n");
- ret = 0;
- goto out_prof;
- }
- gomp_mutex_lock (&thr->dev->openacc.async.lock);
- ret = thr->dev->openacc.cuda.set_stream_func (aq, stream);
- gomp_mutex_unlock (&thr->dev->openacc.async.lock);
- out_prof:
- if (profiling_p)
- {
- thr->prof_info = NULL;
- thr->api_info = NULL;
- }
- }
- return ret;
- }
|