18c247cc0b
Per my reading of the OpenACC specification (and as supported by secondary documentation, such as code examples or presentations), it is also valid to call "acc_get_cuda_stream"/"acc_set_cuda_stream" with the "acc_async_sync" and "acc_async_noval" arguments, not just with the nonnegative values that are currently implemented. libgomp/ PR libgomp/88370 * libgomp.texi (acc_get_current_cuda_context, acc_get_cuda_stream) (acc_set_cuda_stream): Clarify. * oacc-cuda.c (acc_get_cuda_stream, acc_set_cuda_stream): Use "async_valid_p". * plugin/plugin-nvptx.c (nvptx_set_cuda_stream): Refuse "async == acc_async_sync". * testsuite/libgomp.oacc-c-c++-common/acc_set_cuda_stream-1.c: New file. * testsuite/libgomp.oacc-c-c++-common/async_queue-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/lib-84.c: Update. * testsuite/libgomp.oacc-c-c++-common/lib-85.c: Likewise. From-SVN: r267147
72 lines
1.3 KiB
C
72 lines
1.3 KiB
C
/* { dg-do run { target openacc_nvidia_accel_selected } } */
|
|
/* { dg-additional-options "-lcuda" } */
|
|
|
|
#include <stdlib.h>
|
|
#include <unistd.h>
|
|
#include <openacc.h>
|
|
#include <stdio.h>
|
|
#include <cuda.h>
|
|
|
|
#if !defined __cplusplus
|
|
# undef static_assert
|
|
# define static_assert _Static_assert
|
|
#endif
|
|
|
|
static_assert (acc_async_sync == -2, "acc_async_sync?");
|
|
static_assert (acc_async_noval == -1, "acc_async_noval?");
|
|
|
|
int
|
|
main (int argc, char **argv)
|
|
{
|
|
const int N = 100;
|
|
int i;
|
|
CUstream *streams;
|
|
CUstream s;
|
|
CUresult r;
|
|
|
|
acc_init (acc_device_nvidia);
|
|
|
|
(void) acc_get_device_num (acc_device_nvidia);
|
|
|
|
streams = (CUstream *) malloc ((2 + N) * sizeof (void *));
|
|
streams += 2;
|
|
/* "streams[i]" is valid for i in [acc_async_sync..N). */
|
|
|
|
for (i = acc_async_sync; i < N; i++)
|
|
{
|
|
streams[i] = (CUstream) acc_get_cuda_stream (i);
|
|
if (streams[i] != NULL)
|
|
abort ();
|
|
|
|
r = cuStreamCreate (&streams[i], CU_STREAM_DEFAULT);
|
|
if (r != CUDA_SUCCESS)
|
|
{
|
|
fprintf (stderr, "cuStreamCreate failed: %d\n", r);
|
|
abort ();
|
|
}
|
|
|
|
int ret = acc_set_cuda_stream (i, streams[i]);
|
|
if (i == acc_async_sync)
|
|
{
|
|
if (ret == 1)
|
|
abort ();
|
|
}
|
|
else
|
|
{
|
|
if (ret != 1)
|
|
abort ();
|
|
}
|
|
}
|
|
|
|
s = NULL;
|
|
|
|
if (acc_set_cuda_stream (N + 1, s) != 0)
|
|
abort ();
|
|
|
|
acc_shutdown (acc_device_nvidia);
|
|
|
|
exit (0);
|
|
}
|
|
|
|
/* { dg-output "" } */
|