Thomas Schwinge 937fa5fb78 'libgomp.c-c++-common/reduction-{5,6}.c': Restrict '-latomic' to nvptx offloading compilation
Fix-up for recent commit 33b647956caa977d1ae489f9baed9cef70b4f382
"OpenMP: Fix SIMT for complex/float reduction with && and ||"; see
commit d42088e453042f4f8ba9190a7e29efd937ea2181 "Avoid -latomic for amdgcn
offloading".

	libgomp/
	* testsuite/libgomp.c-c++-common/reduction-5.c: Restrict
	'-latomic' to nvptx offloading compilation.
	* testsuite/libgomp.c-c++-common/reduction-6.c: Likewise.
2021-05-18 12:57:45 +02:00

197 lines
4.8 KiB
C

/* { dg-additional-options "-foffload=nvptx-none=-latomic" { target { offload_target_nvptx } } } */
/* C / C++'s logical AND and OR operators take any scalar argument
which compares (un)equal to 0 - the result 1 or 0 and of type int.
In this testcase, the int result is again converted to an integer complex
type.
While having a floating-point/complex array element with || and && can make
sense, having a complex reduction variable is odd but valid.
Test: int complex reduction variable + int complex array.
as reduction-4.c but with target. */
#define N 1024
_Complex char rcc[N];
_Complex short rcs[N];
_Complex int rci[N];
_Complex long long rcl[N];
int
reduction_or ()
{
_Complex char orc = 0;
_Complex short ors = 0;
_Complex int ori = 0;
_Complex long orl = 0;
#pragma omp target parallel reduction(||: orc) map(orc)
for (int i=0; i < N; ++i)
orc = orc || rcl[i];
#pragma omp target parallel for reduction(||: ors) map(ors)
for (int i=0; i < N; ++i)
ors = ors || rci[i];
#pragma omp target parallel for simd reduction(||: ori) map(ori)
for (int i=0; i < N; ++i)
ori = ori || rcs[i];
#pragma omp target parallel loop reduction(||: orl) map(orl)
for (int i=0; i < N; ++i)
orl = orl || rcc[i];
return __real__ (orc + ors + ori + orl) + __imag__ (orc + ors + ori + orl);
}
int
reduction_or_teams ()
{
_Complex char orc = 0;
_Complex short ors = 0;
_Complex int ori = 0;
_Complex long orl = 0;
#pragma omp target teams distribute parallel for reduction(||: orc) map(orc)
for (int i=0; i < N; ++i)
orc = orc || rcc[i];
#pragma omp target teams distribute parallel for simd reduction(||: ors) map(ors)
for (int i=0; i < N; ++i)
ors = ors || rcs[i];
#pragma omp target teams distribute parallel for reduction(||: ori) map(ori)
for (int i=0; i < N; ++i)
ori = ori || rci[i];
#pragma omp target teams distribute parallel for simd reduction(||: orl) map(orl)
for (int i=0; i < N; ++i)
orl = orl || rcl[i];
return __real__ (orc + ors + ori + orl) + __imag__ (orc + ors + ori + orl);
}
int
reduction_and ()
{
_Complex char andc = 1;
_Complex short ands = 1;
_Complex int andi = 1;
_Complex long andl = 1;
#pragma omp target parallel reduction(&&: andc) map(andc)
for (int i=0; i < N; ++i)
andc = andc && rcc[i];
#pragma omp target parallel for reduction(&&: ands) map(ands)
for (int i=0; i < N; ++i)
ands = ands && rcs[i];
#pragma omp target parallel for simd reduction(&&: andi) map(andi)
for (int i=0; i < N; ++i)
andi = andi && rci[i];
#pragma omp target parallel loop reduction(&&: andl) map(andl)
for (int i=0; i < N; ++i)
andl = andl && rcl[i];
return __real__ (andc + ands + andi + andl)
+ __imag__ (andc + ands + andi + andl);
}
int
reduction_and_teams ()
{
_Complex char andc = 1;
_Complex short ands = 1;
_Complex int andi = 1;
_Complex long andl = 1;
#pragma omp target teams distribute parallel for reduction(&&: andc) map(andc)
for (int i=0; i < N; ++i)
andc = andc && rcl[i];
#pragma omp target teams distribute parallel for simd reduction(&&: ands) map(ands)
for (int i=0; i < N; ++i)
ands = ands && rci[i];
#pragma omp target teams distribute parallel for reduction(&&: andi) map(andi)
for (int i=0; i < N; ++i)
andi = andi && rcs[i];
#pragma omp target teams distribute parallel for simd reduction(&&: andl) map(andl)
for (int i=0; i < N; ++i)
andl = andl && rcc[i];
return __real__ (andc + ands + andi + andl)
+ __imag__ (andc + ands + andi + andl);
}
int
main ()
{
for (int i = 0; i < N; ++i)
{
rcc[i] = 0;
rcs[i] = 0;
rci[i] = 0;
rcl[i] = 0;
}
if (reduction_or () != 0)
__builtin_abort ();
if (reduction_or_teams () != 0)
__builtin_abort ();
if (reduction_and () != 0)
__builtin_abort ();
if (reduction_and_teams () != 0)
__builtin_abort ();
rcc[10] = 1.0;
rcs[15] = 1.0i;
rci[10] = 1.0;
rcl[15] = 1.0i;
if (reduction_or () != 4)
__builtin_abort ();
if (reduction_or_teams () != 4)
__builtin_abort ();
if (reduction_and () != 0)
__builtin_abort ();
if (reduction_and_teams () != 0)
__builtin_abort ();
for (int i = 0; i < N; ++i)
{
rcc[i] = 1;
rcs[i] = 1i;
rci[i] = 1;
rcl[i] = 1 + 1i;
}
if (reduction_or () != 4)
__builtin_abort ();
if (reduction_or_teams () != 4)
__builtin_abort ();
if (reduction_and () != 4)
__builtin_abort ();
if (reduction_and_teams () != 4)
__builtin_abort ();
rcc[10] = 0.0;
rcs[15] = 0.0;
rci[10] = 0.0;
rcl[15] = 0.0;
if (reduction_or () != 4)
__builtin_abort ();
if (reduction_or_teams () != 4)
__builtin_abort ();
if (reduction_and () != 0)
__builtin_abort ();
if (reduction_and_teams () != 0)
__builtin_abort ();
return 0;
}