937fa5fb78
Fix-up for recent commit 33b647956caa977d1ae489f9baed9cef70b4f382 "OpenMP: Fix SIMT for complex/float reduction with && and ||"; see commit d42088e453042f4f8ba9190a7e29efd937ea2181 "Avoid -latomic for amdgcn offloading". libgomp/ * testsuite/libgomp.c-c++-common/reduction-5.c: Restrict '-latomic' to nvptx offloading compilation. * testsuite/libgomp.c-c++-common/reduction-6.c: Likewise.
197 lines
4.8 KiB
C
197 lines
4.8 KiB
C
/* { dg-additional-options "-foffload=nvptx-none=-latomic" { target { offload_target_nvptx } } } */
|
|
/* C / C++'s logical AND and OR operators take any scalar argument
|
|
which compares (un)equal to 0 - the result 1 or 0 and of type int.
|
|
|
|
In this testcase, the int result is again converted to an integer complex
|
|
type.
|
|
|
|
While having a floating-point/complex array element with || and && can make
|
|
sense, having a complex reduction variable is odd but valid.
|
|
|
|
Test: int complex reduction variable + int complex array.
|
|
as reduction-4.c but with target. */
|
|
|
|
#define N 1024
|
|
_Complex char rcc[N];
|
|
_Complex short rcs[N];
|
|
_Complex int rci[N];
|
|
_Complex long long rcl[N];
|
|
|
|
int
|
|
reduction_or ()
|
|
{
|
|
_Complex char orc = 0;
|
|
_Complex short ors = 0;
|
|
_Complex int ori = 0;
|
|
_Complex long orl = 0;
|
|
|
|
#pragma omp target parallel reduction(||: orc) map(orc)
|
|
for (int i=0; i < N; ++i)
|
|
orc = orc || rcl[i];
|
|
|
|
#pragma omp target parallel for reduction(||: ors) map(ors)
|
|
for (int i=0; i < N; ++i)
|
|
ors = ors || rci[i];
|
|
|
|
#pragma omp target parallel for simd reduction(||: ori) map(ori)
|
|
for (int i=0; i < N; ++i)
|
|
ori = ori || rcs[i];
|
|
|
|
#pragma omp target parallel loop reduction(||: orl) map(orl)
|
|
for (int i=0; i < N; ++i)
|
|
orl = orl || rcc[i];
|
|
|
|
return __real__ (orc + ors + ori + orl) + __imag__ (orc + ors + ori + orl);
|
|
}
|
|
|
|
int
|
|
reduction_or_teams ()
|
|
{
|
|
_Complex char orc = 0;
|
|
_Complex short ors = 0;
|
|
_Complex int ori = 0;
|
|
_Complex long orl = 0;
|
|
|
|
#pragma omp target teams distribute parallel for reduction(||: orc) map(orc)
|
|
for (int i=0; i < N; ++i)
|
|
orc = orc || rcc[i];
|
|
|
|
#pragma omp target teams distribute parallel for simd reduction(||: ors) map(ors)
|
|
for (int i=0; i < N; ++i)
|
|
ors = ors || rcs[i];
|
|
|
|
#pragma omp target teams distribute parallel for reduction(||: ori) map(ori)
|
|
for (int i=0; i < N; ++i)
|
|
ori = ori || rci[i];
|
|
|
|
#pragma omp target teams distribute parallel for simd reduction(||: orl) map(orl)
|
|
for (int i=0; i < N; ++i)
|
|
orl = orl || rcl[i];
|
|
|
|
return __real__ (orc + ors + ori + orl) + __imag__ (orc + ors + ori + orl);
|
|
}
|
|
|
|
int
|
|
reduction_and ()
|
|
{
|
|
_Complex char andc = 1;
|
|
_Complex short ands = 1;
|
|
_Complex int andi = 1;
|
|
_Complex long andl = 1;
|
|
|
|
#pragma omp target parallel reduction(&&: andc) map(andc)
|
|
for (int i=0; i < N; ++i)
|
|
andc = andc && rcc[i];
|
|
|
|
#pragma omp target parallel for reduction(&&: ands) map(ands)
|
|
for (int i=0; i < N; ++i)
|
|
ands = ands && rcs[i];
|
|
|
|
#pragma omp target parallel for simd reduction(&&: andi) map(andi)
|
|
for (int i=0; i < N; ++i)
|
|
andi = andi && rci[i];
|
|
|
|
#pragma omp target parallel loop reduction(&&: andl) map(andl)
|
|
for (int i=0; i < N; ++i)
|
|
andl = andl && rcl[i];
|
|
|
|
return __real__ (andc + ands + andi + andl)
|
|
+ __imag__ (andc + ands + andi + andl);
|
|
}
|
|
|
|
int
|
|
reduction_and_teams ()
|
|
{
|
|
_Complex char andc = 1;
|
|
_Complex short ands = 1;
|
|
_Complex int andi = 1;
|
|
_Complex long andl = 1;
|
|
|
|
#pragma omp target teams distribute parallel for reduction(&&: andc) map(andc)
|
|
for (int i=0; i < N; ++i)
|
|
andc = andc && rcl[i];
|
|
|
|
#pragma omp target teams distribute parallel for simd reduction(&&: ands) map(ands)
|
|
for (int i=0; i < N; ++i)
|
|
ands = ands && rci[i];
|
|
|
|
#pragma omp target teams distribute parallel for reduction(&&: andi) map(andi)
|
|
for (int i=0; i < N; ++i)
|
|
andi = andi && rcs[i];
|
|
|
|
#pragma omp target teams distribute parallel for simd reduction(&&: andl) map(andl)
|
|
for (int i=0; i < N; ++i)
|
|
andl = andl && rcc[i];
|
|
|
|
return __real__ (andc + ands + andi + andl)
|
|
+ __imag__ (andc + ands + andi + andl);
|
|
}
|
|
|
|
int
|
|
main ()
|
|
{
|
|
for (int i = 0; i < N; ++i)
|
|
{
|
|
rcc[i] = 0;
|
|
rcs[i] = 0;
|
|
rci[i] = 0;
|
|
rcl[i] = 0;
|
|
}
|
|
|
|
if (reduction_or () != 0)
|
|
__builtin_abort ();
|
|
if (reduction_or_teams () != 0)
|
|
__builtin_abort ();
|
|
if (reduction_and () != 0)
|
|
__builtin_abort ();
|
|
if (reduction_and_teams () != 0)
|
|
__builtin_abort ();
|
|
|
|
rcc[10] = 1.0;
|
|
rcs[15] = 1.0i;
|
|
rci[10] = 1.0;
|
|
rcl[15] = 1.0i;
|
|
|
|
if (reduction_or () != 4)
|
|
__builtin_abort ();
|
|
if (reduction_or_teams () != 4)
|
|
__builtin_abort ();
|
|
if (reduction_and () != 0)
|
|
__builtin_abort ();
|
|
if (reduction_and_teams () != 0)
|
|
__builtin_abort ();
|
|
|
|
for (int i = 0; i < N; ++i)
|
|
{
|
|
rcc[i] = 1;
|
|
rcs[i] = 1i;
|
|
rci[i] = 1;
|
|
rcl[i] = 1 + 1i;
|
|
}
|
|
|
|
if (reduction_or () != 4)
|
|
__builtin_abort ();
|
|
if (reduction_or_teams () != 4)
|
|
__builtin_abort ();
|
|
if (reduction_and () != 4)
|
|
__builtin_abort ();
|
|
if (reduction_and_teams () != 4)
|
|
__builtin_abort ();
|
|
|
|
rcc[10] = 0.0;
|
|
rcs[15] = 0.0;
|
|
rci[10] = 0.0;
|
|
rcl[15] = 0.0;
|
|
|
|
if (reduction_or () != 4)
|
|
__builtin_abort ();
|
|
if (reduction_or_teams () != 4)
|
|
__builtin_abort ();
|
|
if (reduction_and () != 0)
|
|
__builtin_abort ();
|
|
if (reduction_and_teams () != 0)
|
|
__builtin_abort ();
|
|
|
|
return 0;
|
|
}
|