b5c26449f3
PR libgomp/90585 * plugin/plugin-hsa.c: Include gstdint.h. Include inttypes.h only if HAVE_INTTYPES_H is defined. (print_uint64_t): New typedef. (PRIu64): Define if HAVE_INTTYPES_H is not defined. (print_kernel_dispatch, run_kernel): Use PRIu64 macro instead of "lu", cast uint64_t HSA_DEBUG and fprintf arguments to print_uint64_t. (release_kernel_dispatch): Likewise. Cast shadow->debug to uintptr_t before casting to void *. * plugin/plugin-nvptx.c: Include gstdint.h instead of stdint.h. * oacc-mem.c: Don't include config.h nor stdint.h. * target.c: Don't include config.h. * oacc-cuda.c: Likewise. * oacc-host.c: Don't include stdint.h. From-SVN: r271597
167 lines
4.1 KiB
C
167 lines
4.1 KiB
C
/* OpenACC Runtime Library: CUDA support glue.

   Copyright (C) 2014-2019 Free Software Foundation, Inc.

   Contributed by Mentor Embedded.

   This file is part of the GNU Offloading and Multi Processing Library
   (libgomp).

   Libgomp is free software; you can redistribute it and/or modify it
   under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 3, or (at your option)
   any later version.

   Libgomp is distributed in the hope that it will be useful, but WITHOUT ANY
   WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
   FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
   more details.

   Under Section 7 of GPL version 3, you are granted additional
   permissions described in the GCC Runtime Library Exception, version
   3.1, as published by the Free Software Foundation.

   You should have received a copy of the GNU General Public License and
   a copy of the GCC Runtime Library Exception along with this program;
   see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
   <http://www.gnu.org/licenses/>.  */
|
|
|
|
#include "openacc.h"
|
|
#include "libgomp.h"
|
|
#include "oacc-int.h"
|
|
#include <assert.h>
|
|
|
|
void *
|
|
acc_get_current_cuda_device (void)
|
|
{
|
|
struct goacc_thread *thr = goacc_thread ();
|
|
|
|
void *ret = NULL;
|
|
if (thr && thr->dev && thr->dev->openacc.cuda.get_current_device_func)
|
|
{
|
|
acc_prof_info prof_info;
|
|
acc_api_info api_info;
|
|
bool profiling_p = GOACC_PROFILING_SETUP_P (thr, &prof_info, &api_info);
|
|
|
|
ret = thr->dev->openacc.cuda.get_current_device_func ();
|
|
|
|
if (profiling_p)
|
|
{
|
|
thr->prof_info = NULL;
|
|
thr->api_info = NULL;
|
|
}
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
void *
|
|
acc_get_current_cuda_context (void)
|
|
{
|
|
struct goacc_thread *thr = goacc_thread ();
|
|
|
|
void *ret = NULL;
|
|
if (thr && thr->dev && thr->dev->openacc.cuda.get_current_context_func)
|
|
{
|
|
acc_prof_info prof_info;
|
|
acc_api_info api_info;
|
|
bool profiling_p = GOACC_PROFILING_SETUP_P (thr, &prof_info, &api_info);
|
|
|
|
ret = thr->dev->openacc.cuda.get_current_context_func ();
|
|
|
|
if (profiling_p)
|
|
{
|
|
thr->prof_info = NULL;
|
|
thr->api_info = NULL;
|
|
}
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
void *
|
|
acc_get_cuda_stream (int async)
|
|
{
|
|
struct goacc_thread *thr = goacc_thread ();
|
|
|
|
if (!async_valid_p (async))
|
|
return NULL;
|
|
|
|
void *ret = NULL;
|
|
if (thr && thr->dev && thr->dev->openacc.cuda.get_stream_func)
|
|
{
|
|
goacc_aq aq = lookup_goacc_asyncqueue (thr, false, async);
|
|
if (!aq)
|
|
return ret;
|
|
|
|
acc_prof_info prof_info;
|
|
acc_api_info api_info;
|
|
bool profiling_p = GOACC_PROFILING_SETUP_P (thr, &prof_info, &api_info);
|
|
if (profiling_p)
|
|
{
|
|
prof_info.async = async;
|
|
prof_info.async_queue = prof_info.async;
|
|
}
|
|
|
|
ret = thr->dev->openacc.cuda.get_stream_func (aq);
|
|
|
|
if (profiling_p)
|
|
{
|
|
thr->prof_info = NULL;
|
|
thr->api_info = NULL;
|
|
}
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
int
|
|
acc_set_cuda_stream (int async, void *stream)
|
|
{
|
|
struct goacc_thread *thr;
|
|
|
|
if (!async_valid_p (async) || stream == NULL)
|
|
return 0;
|
|
|
|
goacc_lazy_initialize ();
|
|
|
|
thr = goacc_thread ();
|
|
|
|
int ret = -1;
|
|
if (thr && thr->dev && thr->dev->openacc.cuda.set_stream_func)
|
|
{
|
|
acc_prof_info prof_info;
|
|
acc_api_info api_info;
|
|
bool profiling_p = GOACC_PROFILING_SETUP_P (thr, &prof_info, &api_info);
|
|
if (profiling_p)
|
|
{
|
|
prof_info.async = async;
|
|
prof_info.async_queue = prof_info.async;
|
|
}
|
|
|
|
goacc_aq aq = get_goacc_asyncqueue (async);
|
|
/* Due to not using an asyncqueue for "acc_async_sync", this cannot be
|
|
used to change the CUDA stream associated with "acc_async_sync". */
|
|
if (!aq)
|
|
{
|
|
assert (async == acc_async_sync);
|
|
gomp_debug (0, "Refusing request to set CUDA stream associated"
|
|
" with \"acc_async_sync\"\n");
|
|
ret = 0;
|
|
goto out_prof;
|
|
}
|
|
gomp_mutex_lock (&thr->dev->openacc.async.lock);
|
|
ret = thr->dev->openacc.cuda.set_stream_func (aq, stream);
|
|
gomp_mutex_unlock (&thr->dev->openacc.async.lock);
|
|
|
|
out_prof:
|
|
if (profiling_p)
|
|
{
|
|
thr->prof_info = NULL;
|
|
thr->api_info = NULL;
|
|
}
|
|
}
|
|
|
|
return ret;
|
|
}
|