c42cfb5ca3
gcc/ PR lto/70289 PR ipa/70348 PR tree-optimization/70373 PR middle-end/70533 PR middle-end/70534 PR middle-end/70535 * gimplify.c (gimplify_adjust_omp_clauses): Add or adjust data clauses for acc parallel reductions as necessary. Error on those that are private. * omp-low.c (scan_sharing_clauses): Don't install variables which are used in acc parallel reductions. (lower_rec_input_clauses): Remove dead code. (lower_oacc_reductions): Add support for reference reductions. (lower_reduction_clauses): Remove dead code. (lower_omp_target): Don't remap variables appearing in acc parallel reductions. * tree.h (OMP_CLAUSE_MAP_IN_REDUCTION): New macro. gcc/testsuite/ * c-c++-common/goacc/reduction-5.c: New test. * c-c++-common/goacc/reduction-promotions.c: New test. * gfortran.dg/goacc/reduction-3.f95: New test. * gfortran.dg/goacc/reduction-promotions.f90: New test. libgomp/ * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gang-np-1.c: New test. * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gw-np-1.c: New test. * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-1.c: New test. * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-2.c: New test. * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-3.c: New test. * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-4.c: New test. * testsuite/libgomp.oacc-c-c++-common/loop-reduction-vector-p-1.c: New test. * testsuite/libgomp.oacc-c-c++-common/loop-reduction-vector-p-2.c: New test. * testsuite/libgomp.oacc-c-c++-common/loop-reduction-worker-p-1.c: New test. * testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-1.c: New test. * testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-2.c: New test. * testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-3.c: New test. * testsuite/libgomp.oacc-c-c++-common/par-loop-comb-reduction-1.c: New test. * testsuite/libgomp.oacc-c-c++-common/par-loop-comb-reduction-2.c: New test. 
* testsuite/libgomp.oacc-c-c++-common/par-loop-comb-reduction-3.c: New test. * testsuite/libgomp.oacc-c-c++-common/par-loop-comb-reduction-4.c: New test. * testsuite/libgomp.oacc-c-c++-common/par-reduction-1.c: Add test coverage. * testsuite/libgomp.oacc-c-c++-common/par-reduction-2.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/parallel-dims.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/parallel-reduction.c: New test. * testsuite/libgomp.oacc-c-c++-common/pr70289.c: New test. * testsuite/libgomp.oacc-c-c++-common/pr70373.c: New test. * testsuite/libgomp.oacc-c-c++-common/reduction-1.c: Add test coverage. * testsuite/libgomp.oacc-c-c++-common/reduction-2.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/reduction-3.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/reduction-4.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/reduction-5.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/reduction-6.c: New test. * testsuite/libgomp.oacc-c-c++-common/reduction.h: New test. * testsuite/libgomp.oacc-fortran/parallel-reduction.f90: New test. * testsuite/libgomp.oacc-fortran/pr70289.f90: New test. * testsuite/libgomp.oacc-fortran/reduction-1.f90: Add test coverage. * testsuite/libgomp.oacc-fortran/reduction-2.f90: Likewise. * testsuite/libgomp.oacc-fortran/reduction-3.f90: Likewise. * testsuite/libgomp.oacc-fortran/reduction-4.f90: Likewise. * testsuite/libgomp.oacc-fortran/reduction-5.f90: Likewise. * testsuite/libgomp.oacc-fortran/reduction-6.f90: Likewise. * testsuite/libgomp.oacc-fortran/reduction-7.f90: New test. From-SVN: r234840
73 lines
978 B
C
73 lines
978 B
C
/* { dg-do run } */
|
|
/* { dg-additional-options "-w" } */
|
|
|
|
#include <stdlib.h>
|
|
#include <openacc.h>
|
|
|
|
/* Gang count requested by the first parallel region in main, and the value
   the reduction results are compared against (N, or N*N for s2).  */
#define N 10
|
|
|
|
int
|
|
main ()
|
|
{
|
|
int s1 = 0, s2 = 0;
|
|
int i;
|
|
int dummy = 0;
|
|
|
|
#pragma acc data copy (dummy)
|
|
{
|
|
#pragma acc parallel num_gangs (N) reduction (+:s1) copy(s1)
|
|
{
|
|
s1++;
|
|
}
|
|
}
|
|
|
|
if (acc_get_device_type () != acc_device_nvidia)
|
|
{
|
|
if (s1 != 1)
|
|
abort ();
|
|
}
|
|
else
|
|
{
|
|
if (s1 != N)
|
|
abort ();
|
|
}
|
|
|
|
s1 = 0;
|
|
s2 = 0;
|
|
|
|
#pragma acc parallel num_gangs (10) reduction (+:s1, s2) copy(s1, s2)
|
|
{
|
|
s1++;
|
|
s2 += N;
|
|
}
|
|
|
|
if (acc_get_device_type () != acc_device_nvidia)
|
|
{
|
|
if (s1 != 1)
|
|
abort ();
|
|
if (s2 != N)
|
|
abort ();
|
|
}
|
|
else
|
|
{
|
|
if (s1 != N)
|
|
abort ();
|
|
if (s2 != N*N)
|
|
abort ();
|
|
}
|
|
|
|
s1 = 0;
|
|
|
|
#pragma acc parallel num_gangs (10) reduction (+:s1) copy(s1)
|
|
{
|
|
#pragma acc loop gang reduction (+:s1)
|
|
for (i = 0; i < 10; i++)
|
|
s1++;
|
|
}
|
|
|
|
if (s1 != N)
|
|
abort ();
|
|
|
|
return 0;
|
|
}
|