11b8286a83
gcc/ PR middle-end/90115 * flag-types.h (enum openacc_privatization): New. * params.opt (-param=openacc-privatization): New. * doc/invoke.texi (openacc-privatization): Document it. * omp-general.h (get_openacc_privatization_dump_flags): New function. * omp-low.c (oacc_privatization_candidate_p): Add diagnostics. * omp-offload.c (execute_oacc_device_lower) <IFN_UNIQUE_OACC_PRIVATE>: Re-work diagnostics. * target.def (goacc.adjust_private_decl): Add 'location_t' parameter. * doc/tm.texi: Regenerate. * config/gcn/gcn-protos.h (gcn_goacc_adjust_private_decl): Adjust. * config/gcn/gcn-tree.c (gcn_goacc_adjust_private_decl): Likewise. * config/nvptx/nvptx.c (nvptx_goacc_adjust_private_decl): Likewise. Preserve it for... (nvptx_goacc_expand_var_decl): ... use here. gcc/testsuite/ PR middle-end/90115 * c-c++-common/goacc/privatization-1-compute-loop.c: New file. * c-c++-common/goacc/privatization-1-compute.c: Likewise. * c-c++-common/goacc/privatization-1-routine_gang-loop.c: Likewise. * c-c++-common/goacc/privatization-1-routine_gang.c: Likewise. * gfortran.dg/goacc/privatization-1-compute-loop.f90: Likewise. * gfortran.dg/goacc/privatization-1-compute.f90: Likewise. * gfortran.dg/goacc/privatization-1-routine_gang-loop.f90: Likewise. * gfortran.dg/goacc/privatization-1-routine_gang.f90: Likewise. * c-c++-common/goacc-gomp/nesting-1.c: Update. * c-c++-common/goacc/private-reduction-1.c: Likewise. * gfortran.dg/goacc/private-3.f95: Likewise. libgomp/ PR middle-end/90115 * testsuite/libgomp.oacc-fortran/private-atomic-1-vector.f90: New file. * testsuite/libgomp.oacc-c-c++-common/firstprivate-1.c: Update. * testsuite/libgomp.oacc-c-c++-common/host_data-7.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-decompose-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-local-worker-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-local-worker-2.c: Likewise. 
* testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-local-worker-3.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-local-worker-4.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-local-worker-5.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-loop-gang-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-loop-gang-2.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-loop-gang-3.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-loop-gang-4.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-loop-gang-5.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-loop-gang-6.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-loop-vector-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-loop-vector-2.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-loop-worker-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-loop-worker-2.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-loop-worker-3.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-loop-worker-4.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-loop-worker-5.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-loop-worker-6.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-private-vars-loop-worker-7.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/loop-g-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/loop-g-2.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/loop-gwv-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/loop-gwv-2.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/loop-red-g-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/loop-red-gwv-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/loop-red-v-1.c: Likewise. 
* testsuite/libgomp.oacc-c-c++-common/loop-red-v-2.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/loop-red-w-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/loop-red-w-2.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/loop-red-wv-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/loop-v-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/loop-w-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/loop-wv-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/parallel-reduction.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/private-atomic-1-gang.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/private-atomic-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/private-variables.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/routine-4.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/static-variable-1.c: Likewise. * testsuite/libgomp.oacc-fortran/acc_on_device-1-1.f90: Likewise. * testsuite/libgomp.oacc-fortran/acc_on_device-1-2.f: Likewise. * testsuite/libgomp.oacc-fortran/acc_on_device-1-3.f: Likewise. * testsuite/libgomp.oacc-fortran/declare-1.f90: Likewise. * testsuite/libgomp.oacc-fortran/host_data-5.F90: Likewise. * testsuite/libgomp.oacc-fortran/if-1.f90: Likewise. * testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-gang-1.f90: Likewise. * testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-gang-2.f90: Likewise. * testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-gang-3.f90: Likewise. * testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-gang-6.f90: Likewise. * testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-vector-1.f90: Likewise. * testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-vector-2.f90: Likewise. * testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-worker-1.f90: Likewise. * testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-worker-2.f90: Likewise. * testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-worker-3.f90: Likewise. 
* testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-worker-4.f90: Likewise. * testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-worker-5.f90: Likewise. * testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-worker-6.f90: Likewise. * testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-worker-7.f90: Likewise. * testsuite/libgomp.oacc-fortran/optional-private.f90: Likewise. * testsuite/libgomp.oacc-fortran/parallel-dims.f90: Likewise. * testsuite/libgomp.oacc-fortran/private-atomic-1-gang.f90: Likewise. * testsuite/libgomp.oacc-fortran/private-atomic-1-worker.f90: Likewise. * testsuite/libgomp.oacc-fortran/private-variables.f90: Likewise. * testsuite/libgomp.oacc-fortran/privatized-ref-2.f90: Likewise. * testsuite/libgomp.oacc-fortran/routine-7.f90: Likewise.
1134 lines
48 KiB
C
1134 lines
48 KiB
C
/* { dg-additional-options "-fopt-info-note-omp" }
   { dg-additional-options "--param=openacc-privatization=noisy" }
   { dg-additional-options "-foffload=-fopt-info-note-omp" }
   { dg-additional-options "-foffload=--param=openacc-privatization=noisy" }
   for testing/documenting aspects of that functionality.  */
|
|
|
|
/* { dg-additional-options "-Wopenacc-parallelism" } for testing/documenting
   aspects of that functionality.  */
|
|
|
|
/* It's only with Tcl 8.5 (released in 2007) that "the variable 'varName'
   passed to 'incr' may be unset, and in that case, it will be set to [...]",
   so to maintain compatibility with earlier Tcl releases, we manually
   initialize counter variables:
   { dg-line l_dummy[variable c_compute 0 c_loop 0] }
   { dg-message "dummy" "" { target iN-VAl-Id } l_dummy } to avoid
   "WARNING: dg-line var l_dummy defined, but not used".  */
|
|
|
|
#include <assert.h>
|
|
#include <openacc.h>
|
|
|
|
/* Two-component integer aggregate; used below as a small privatized
   struct variable.  */
typedef struct {
  int x, y;
} vec2;
|
|
|
|
/* Larger aggregate: three integer components plus a 13-element
   attribute array.  */
typedef struct {
  int x, y, z;
  int attr[13];
} vec3_attr;
|
|
|
|
|
|
/* Test of gang-private variables declared in local scope with parallel
|
|
directive. */
|
|
|
|
void local_g_1()
|
|
{
|
|
int i, arr[32];
|
|
|
|
for (i = 0; i < 32; i++)
|
|
arr[i] = 3;
|
|
|
|
#pragma acc parallel copy(arr) num_gangs(32) num_workers(8) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
|
|
/* { dg-note {variable 'x' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_compute$c_compute } */
|
|
/* { dg-warning "region is worker partitioned but does not contain worker partitioned code" "" { target *-*-* } l_compute$c_compute } */
|
|
/* { dg-warning "region is vector partitioned but does not contain vector partitioned code" "" { target *-*-* } l_compute$c_compute } */
|
|
{
|
|
int x;
|
|
|
|
#pragma acc loop gang(static:1) /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (i = 0; i < 32; i++)
|
|
x = i * 2;
|
|
|
|
#pragma acc loop gang(static:1) /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (i = 0; i < 32; i++)
|
|
{
|
|
if (acc_on_device (acc_device_host))
|
|
x = i * 2;
|
|
arr[i] += x;
|
|
}
|
|
}
|
|
|
|
for (i = 0; i < 32; i++)
|
|
assert (arr[i] == 3 + i * 2);
|
|
}
|
|
|
|
|
|
/* Test of worker-private variables declared in a local scope, broadcasting
   to vector-partitioned mode.  Back-to-back worker loops.

   Each of the two worker loops declares its own 'k' and 'x'.  The first
   adds (i ^ j * 3) * k and the second adds (i | j * 5) * k to
   arr[i * 1024 + j * 32 + k]; arr[n] starts as n, and the host-side loop
   checks the sum of all three terms.  */

void local_w_1()
{
  int i, arr[32 * 32 * 32];

  for (i = 0; i < 32 * 32 * 32; i++)
    arr[i] = i;

  #pragma acc parallel copy(arr) num_gangs(32) num_workers(32) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_compute$c_compute } */
  {
    int j;

    #pragma acc loop gang /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        #pragma acc loop worker /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'k' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'x' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (j = 0; j < 32; j++)
          {
            int k;
            int x = i ^ j * 3;

            #pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              arr[i * 1024 + j * 32 + k] += x * k;
          }

        #pragma acc loop worker /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'k' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'x' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (j = 0; j < 32; j++)
          {
            int k;
            int x = i | j * 5;

            #pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              arr[i * 1024 + j * 32 + k] += x * k;
          }
      }
  }

  for (i = 0; i < 32; i++)
    for (int j = 0; j < 32; j++)
      for (int k = 0; k < 32; k++)
        {
          int idx = i * 1024 + j * 32 + k;
          assert (arr[idx] == idx + (i ^ j * 3) * k + (i | j * 5) * k);
        }
}
|
|
|
|
|
|
/* Test of worker-private variables declared in a local scope, broadcasting
   to vector-partitioned mode.  Successive vector loops.

   A single worker loop declares 'k' and 'x'.  'x' is first i ^ j * 3 for
   the first vector loop, then re-assigned to i | j * 5 before the second
   one; both loops add x * k to arr[i * 1024 + j * 32 + k].  arr[n] starts
   as n, and the host-side loop checks the sum of all three terms.  */

void local_w_2()
{
  int i, arr[32 * 32 * 32];

  for (i = 0; i < 32 * 32 * 32; i++)
    arr[i] = i;

  #pragma acc parallel copy(arr) num_gangs(32) num_workers(32) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_compute$c_compute } */
  {
    int j;

    #pragma acc loop gang /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        #pragma acc loop worker /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'k' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'x' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (j = 0; j < 32; j++)
          {
            int k;
            int x = i ^ j * 3;

            #pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              arr[i * 1024 + j * 32 + k] += x * k;

            x = i | j * 5;

            #pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              arr[i * 1024 + j * 32 + k] += x * k;
          }
      }
  }

  for (i = 0; i < 32; i++)
    for (int j = 0; j < 32; j++)
      for (int k = 0; k < 32; k++)
        {
          int idx = i * 1024 + j * 32 + k;
          assert (arr[idx] == idx + (i ^ j * 3) * k + (i | j * 5) * k);
        }
}
|
|
|
|
|
|
/* Test of worker-private variables declared in a local scope, broadcasting
|
|
to vector-partitioned mode. Aggregate worker variable. */
|
|
|
|
void local_w_3()
|
|
{
|
|
int i, arr[32 * 32 * 32];
|
|
|
|
for (i = 0; i < 32 * 32 * 32; i++)
|
|
arr[i] = i;
|
|
|
|
#pragma acc parallel copy(arr) num_gangs(32) num_workers(32) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
|
|
/* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_compute$c_compute } */
|
|
{
|
|
int j;
|
|
|
|
#pragma acc loop gang /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (i = 0; i < 32; i++)
|
|
{
|
|
#pragma acc loop worker /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
/* { dg-note {variable 'k' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
/* { dg-note {variable 'pt' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (j = 0; j < 32; j++)
|
|
{
|
|
int k;
|
|
vec2 pt;
|
|
|
|
pt.x = i ^ j * 3;
|
|
pt.y = i | j * 5;
|
|
|
|
#pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (k = 0; k < 32; k++)
|
|
arr[i * 1024 + j * 32 + k] += pt.x * k;
|
|
|
|
#pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (k = 0; k < 32; k++)
|
|
arr[i * 1024 + j * 32 + k] += pt.y * k;
|
|
}
|
|
}
|
|
}
|
|
|
|
for (i = 0; i < 32; i++)
|
|
for (int j = 0; j < 32; j++)
|
|
for (int k = 0; k < 32; k++)
|
|
{
|
|
int idx = i * 1024 + j * 32 + k;
|
|
assert (arr[idx] == idx + (i ^ j * 3) * k + (i | j * 5) * k);
|
|
}
|
|
}
|
|
|
|
|
|
/* Test of worker-private variables declared in a local scope, broadcasting
|
|
to vector-partitioned mode. Addressable worker variable. */
|
|
|
|
void local_w_4()
|
|
{
|
|
int i, arr[32 * 32 * 32];
|
|
|
|
for (i = 0; i < 32 * 32 * 32; i++)
|
|
arr[i] = i;
|
|
|
|
#pragma acc parallel copy(arr) num_gangs(32) num_workers(32) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
|
|
/* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_compute$c_compute } */
|
|
{
|
|
int j;
|
|
|
|
#pragma acc loop gang /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (i = 0; i < 32; i++)
|
|
{
|
|
#pragma acc loop worker /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
/* { dg-note {variable 'k' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
/* { dg-note {variable 'pt' declared in block is candidate for adjusting OpenACC privatization level} "" { target *-*-* } l_loop$c_loop }
|
|
{ dg-note {variable 'pt' ought to be adjusted for OpenACC privatization level: 'worker'} "" { target *-*-* } l_loop$c_loop }
|
|
{ dg-note {variable 'pt' adjusted for OpenACC privatization level: 'worker'} "TODO" { target { ! openacc_host_selected } xfail *-*-* } l_loop$c_loop } */
|
|
/* { dg-note {variable 'ptp' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (j = 0; j < 32; j++)
|
|
{
|
|
int k;
|
|
vec2 pt, *ptp;
|
|
|
|
ptp = &pt;
|
|
|
|
pt.x = i ^ j * 3;
|
|
|
|
#pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (k = 0; k < 32; k++)
|
|
arr[i * 1024 + j * 32 + k] += ptp->x * k;
|
|
|
|
ptp->y = i | j * 5;
|
|
|
|
#pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (k = 0; k < 32; k++)
|
|
arr[i * 1024 + j * 32 + k] += pt.y * k;
|
|
}
|
|
}
|
|
}
|
|
|
|
for (i = 0; i < 32; i++)
|
|
for (int j = 0; j < 32; j++)
|
|
for (int k = 0; k < 32; k++)
|
|
{
|
|
int idx = i * 1024 + j * 32 + k;
|
|
assert (arr[idx] == idx + (i ^ j * 3) * k + (i | j * 5) * k);
|
|
}
|
|
}
|
|
|
|
|
|
/* Test of worker-private variables declared in a local scope, broadcasting
   to vector-partitioned mode.  Array worker variable.

   The worker loop declares 'int pt[2]'.  pt[0] is set to i ^ j * 3 before
   the first vector loop and pt[1] to i | j * 5 before the second; the
   loops add pt[0] * k and pt[1] * k to arr[i * 1024 + j * 32 + k].
   arr[n] starts as n, and the host-side loop checks the sum of all three
   terms.  */

void local_w_5()
{
  int i, arr[32 * 32 * 32];

  for (i = 0; i < 32 * 32 * 32; i++)
    arr[i] = i;

  #pragma acc parallel copy(arr) num_gangs(32) num_workers(32) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_compute$c_compute } */
  {
    int j;

    #pragma acc loop gang /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        #pragma acc loop worker /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'k' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'pt' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (j = 0; j < 32; j++)
          {
            int k;
            int pt[2];

            pt[0] = i ^ j * 3;

            #pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              arr[i * 1024 + j * 32 + k] += pt[0] * k;

            pt[1] = i | j * 5;

            #pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              arr[i * 1024 + j * 32 + k] += pt[1] * k;
          }
      }
  }

  for (i = 0; i < 32; i++)
    for (int j = 0; j < 32; j++)
      for (int k = 0; k < 32; k++)
        {
          int idx = i * 1024 + j * 32 + k;
          assert (arr[idx] == idx + (i ^ j * 3) * k + (i | j * 5) * k);
        }
}
|
|
|
|
|
|
/* Test of gang-private variables declared on loop directive.

   'x' is declared outside the parallel region (initialized to 5) and named
   in a 'private' clause on the gang loop.  Each iteration assigns
   x = i * 2 and adds it to arr[i]; arr[i] starts as i, so the host-side
   check expects i * 3.  */

void loop_g_1()
{
  int x = 5, i, arr[32];

  for (i = 0; i < 32; i++)
    arr[i] = i;

  #pragma acc parallel copy(arr) num_gangs(32) num_workers(8) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-warning "region is worker partitioned but does not contain worker partitioned code" "" { target *-*-* } l_compute$c_compute } */
  /* { dg-warning "region is vector partitioned but does not contain vector partitioned code" "" { target *-*-* } l_compute$c_compute } */
  {
    #pragma acc loop gang private(x) /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    /* { dg-note {variable 'x' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        x = i * 2;
        arr[i] += x;
      }
  }

  for (i = 0; i < 32; i++)
    assert (arr[i] == i * 3);
}
|
|
|
|
|
|
/* Test of gang-private variables declared on loop directive, with broadcasting
   to partitioned workers.

   'x' is named in a 'private' clause on the gang loop and assigned i * 2
   at the top of each gang iteration; the nested worker loop then adds it
   to arr[i * 32 + j].  arr[n] starts as n, so the host-side check expects
   n + (n / 32) * 2.  */

void loop_g_2()
{
  int x = 5, i, arr[32 * 32];

  for (i = 0; i < 32 * 32; i++)
    arr[i] = i;

  #pragma acc parallel copy(arr) num_gangs(32) num_workers(8) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-warning "region is vector partitioned but does not contain vector partitioned code" "" { target *-*-* } l_compute$c_compute } */
  {
    #pragma acc loop gang private(x) /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    /* { dg-note {variable 'x' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    /* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        x = i * 2;

        #pragma acc loop worker /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (int j = 0; j < 32; j++)
          arr[i * 32 + j] += x;
      }
  }

  for (i = 0; i < 32 * 32; i++)
    assert (arr[i] == i + (i / 32) * 2);
}
|
|
|
|
|
|
/* Test of gang-private variables declared on loop directive, with broadcasting
   to partitioned vectors.

   Same computation as the worker variant, but the inner loop carries a
   'vector' clause: 'x' is assigned i * 2 per gang iteration and added to
   arr[i * 32 + j].  arr[n] starts as n, so the host-side check expects
   n + (n / 32) * 2.  */

void loop_g_3()
{
  int x = 5, i, arr[32 * 32];

  for (i = 0; i < 32 * 32; i++)
    arr[i] = i;

  #pragma acc parallel copy(arr) num_gangs(32) num_workers(8) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-warning "region is worker partitioned but does not contain worker partitioned code" "" { target *-*-* } l_compute$c_compute } */
  {
    #pragma acc loop gang private(x) /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    /* { dg-note {variable 'x' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    /* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        x = i * 2;

        #pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (int j = 0; j < 32; j++)
          arr[i * 32 + j] += x;
      }
  }

  for (i = 0; i < 32 * 32; i++)
    assert (arr[i] == i + (i / 32) * 2);
}
|
|
|
|
|
|
/* Test of gang-private addressable variable declared on loop directive, with
   broadcasting to partitioned workers.

   'x' is named in a 'private' clause on the gang loop and has its address
   taken through 'p'.  The decrement through 'p' runs after the worker loop
   and 'x' is assigned anew at the start of every 'i' iteration, so the
   decrement does not show up in the checked values: arr[n] starts as n and
   the host-side check expects n + (n / 32) * 2.  */

void loop_g_4()
{
  int x = 5, i, arr[32 * 32];

  for (i = 0; i < 32 * 32; i++)
    arr[i] = i;

  #pragma acc parallel copy(arr) num_gangs(32) num_workers(8) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-warning "region is vector partitioned but does not contain vector partitioned code" "" { target *-*-* } l_compute$c_compute } */
  {
    #pragma acc loop gang private(x) /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'x' in 'private' clause is candidate for adjusting OpenACC privatization level} "" { target *-*-* } l_loop$c_loop }
       But, with optimizations enabled, per the '*.ssa' dump ('gcc/tree-ssa.c:execute_update_addresses_taken'):
           No longer having address taken: x
           Now a gimple register: x
       However, 'x' remains in the candidate set:
       { dg-note {variable 'x' ought to be adjusted for OpenACC privatization level: 'gang'} "" { target *-*-* } l_loop$c_loop }
       Now, for GCN offloading, 'adjust_private_decl' does the privatization change right away:
       { dg-note {variable 'x' adjusted for OpenACC privatization level: 'gang'} "" { target openacc_radeon_accel_selected } l_loop$c_loop }
       For nvptx offloading however, we first mark up 'x', and then later apply the privatization change -- or, with optimizations enabled, don't, because we then don't actually call 'expand_var_decl'.
       { dg-note {variable 'x' adjusted for OpenACC privatization level: 'gang'} "" { target { openacc_nvidia_accel_selected && { ! __OPTIMIZE__ } } } l_loop$c_loop }
       { dg-bogus {note: variable 'x' adjusted for OpenACC privatization level: 'gang'} "" { target { openacc_nvidia_accel_selected && __OPTIMIZE__ } } l_loop$c_loop }
    */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    /* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    /* { dg-note {variable 'p' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        int *p = &x;

        x = i * 2;

        #pragma acc loop worker /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (int j = 0; j < 32; j++)
          arr[i * 32 + j] += x;

        (*p)--;
      }
  }

  for (i = 0; i < 32 * 32; i++)
    assert (arr[i] == i + (i / 32) * 2);
}
|
|
|
|
|
|
/* Test of gang-private array variable declared on loop directive, with
   broadcasting to partitioned workers.

   The 8-element array 'x' is named in a 'private' clause on the gang loop.
   Each gang iteration fills x[j] with j * 2, then the worker loop adds
   x[j % 8] to arr[i * 32 + j].  arr[n] starts as n, so the host-side check
   expects n + (n % 8) * 2.  */

void loop_g_5()
{
  int x[8], i, arr[32 * 32];

  for (i = 0; i < 32 * 32; i++)
    arr[i] = i;

  #pragma acc parallel copy(arr) num_gangs(32) num_workers(8) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-warning "region is vector partitioned but does not contain vector partitioned code" "" { target *-*-* } l_compute$c_compute } */
  {
    #pragma acc loop gang private(x) /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'x' in 'private' clause is candidate for adjusting OpenACC privatization level} "" { target *-*-* } l_loop$c_loop }
       { dg-note {variable 'x' ought to be adjusted for OpenACC privatization level: 'gang'} "" { target *-*-* } l_loop$c_loop }
       { dg-note {variable 'x' adjusted for OpenACC privatization level: 'gang'} "" { target { ! openacc_host_selected } } l_loop$c_loop } */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    /* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        for (int j = 0; j < 8; j++)
          x[j] = j * 2;

        #pragma acc loop worker /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (int j = 0; j < 32; j++)
          arr[i * 32 + j] += x[j % 8];
      }
  }

  for (i = 0; i < 32 * 32; i++)
    assert (arr[i] == i + (i % 8) * 2);
}
|
|
|
|
|
|
/* Test of gang-private aggregate variable declared on loop directive, with
|
|
broadcasting to partitioned workers. */
|
|
|
|
void loop_g_6()
|
|
{
|
|
int i, arr[32 * 32];
|
|
vec3_attr pt;
|
|
|
|
for (i = 0; i < 32 * 32; i++)
|
|
arr[i] = i;
|
|
|
|
#pragma acc parallel copy(arr) num_gangs(32) num_workers(8) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
|
|
/* { dg-warning "region is vector partitioned but does not contain vector partitioned code" "" { target *-*-* } l_compute$c_compute } */
|
|
{
|
|
#pragma acc loop gang private(pt) /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
/* { dg-note {variable 'pt' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
/* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (i = 0; i < 32; i++)
|
|
{
|
|
pt.x = i;
|
|
pt.y = i * 2;
|
|
pt.z = i * 4;
|
|
pt.attr[5] = i * 6;
|
|
|
|
#pragma acc loop worker /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (int j = 0; j < 32; j++)
|
|
arr[i * 32 + j] += pt.x + pt.y + pt.z + pt.attr[5];
|
|
}
|
|
}
|
|
|
|
for (i = 0; i < 32 * 32; i++)
|
|
assert (arr[i] == i + (i / 32) * 13);
|
|
}
|
|
|
|
|
|
/* Test of vector-private variables declared on loop directive.

   Inside a gang loop over 'i' and a worker loop over 'j', two consecutive
   vector loops over 'k' each declare 'x' private.  The first sets
   x = i ^ j * 3, the second x = i | j * 5, and each adds x * k to
   arr[i * 1024 + j * 32 + k].  The host then checks every element against
   idx + (i ^ j * 3) * k + (i | j * 5) * k.

   The dg-* comments are testsuite directives: each dg-line names its
   pragma line, and the dg-note comments that follow refer back to that
   name, so they have to stay with their pragma.  */

void loop_v_1()
{
  int x, i, arr[32 * 32 * 32];

  /* Start from arr[n] == n so the final check can isolate the increments.  */
  for (i = 0; i < 32 * 32 * 32; i++)
    arr[i] = i;

  #pragma acc parallel copy(arr) num_gangs(32) num_workers(32) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_compute$c_compute } */
  {
    int j;

    #pragma acc loop gang /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        #pragma acc loop worker /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'k' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (j = 0; j < 32; j++)
          {
            int k;

            #pragma acc loop vector private(x) /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            /* { dg-note {variable 'x' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              {
                x = i ^ j * 3;
                arr[i * 1024 + j * 32 + k] += x * k;
              }

            #pragma acc loop vector private(x) /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            /* { dg-note {variable 'x' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              {
                x = i | j * 5;
                arr[i * 1024 + j * 32 + k] += x * k;
              }
          }
      }
  }

  for (i = 0; i < 32; i++)
    for (int j = 0; j < 32; j++)
      for (int k = 0; k < 32; k++)
        {
          int idx = i * 1024 + j * 32 + k;
          assert (arr[idx] == idx + (i ^ j * 3) * k + (i | j * 5) * k);
        }
}
|
|
|
|
|
|
/* Test of vector-private variables declared on loop directive.  Array type.

   Inside a gang loop over 'i' and a worker loop over 'j', a vector loop
   over 'k' declares the two-element array 'pt' private, stores
   i ^ j * 3 in pt[0] and i | j * 5 in pt[1], and adds pt[0] * k and
   pt[1] * k to arr[i * 1024 + j * 32 + k].  The host then checks every
   element against idx + (i ^ j * 3) * k + (i | j * 5) * k.

   The dg-* comments are testsuite directives: each dg-line names its
   pragma line, and the dg-note comments that follow refer back to that
   name, so they have to stay with their pragma.  */

void loop_v_2()
{
  int pt[2], i, arr[32 * 32 * 32];

  /* Start from arr[n] == n so the final check can isolate the increments.  */
  for (i = 0; i < 32 * 32 * 32; i++)
    arr[i] = i;

  #pragma acc parallel copy(arr) num_gangs(32) num_workers(32) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_compute$c_compute } */
  {
    int j;

    #pragma acc loop gang /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        #pragma acc loop worker /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'k' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (j = 0; j < 32; j++)
          {
            int k;

            #pragma acc loop vector private(pt) /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            /* { dg-note {variable 'pt' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              {
                pt[0] = i ^ j * 3;
                pt[1] = i | j * 5;
                arr[i * 1024 + j * 32 + k] += pt[0] * k;
                arr[i * 1024 + j * 32 + k] += pt[1] * k;
              }
          }
      }
  }

  for (i = 0; i < 32; i++)
    for (int j = 0; j < 32; j++)
      for (int k = 0; k < 32; k++)
        {
          int idx = i * 1024 + j * 32 + k;
          assert (arr[idx] == idx + (i ^ j * 3) * k + (i | j * 5) * k);
        }
}
|
|
|
|
|
|
/* Test of worker-private variables declared on a loop directive.

   Inside a gang loop over 'i', a worker loop over 'j' declares 'x'
   private, sets x = i ^ j * 3 and adds it to arr[i * 32 + j].  The host
   then checks arr[n] == n + ((n / 32) ^ (n % 32) * 3) for all 32 * 32
   elements.

   The dg-* comments are testsuite directives: each dg-line names its
   pragma line, and the dg-note/dg-warning comments that follow refer back
   to that name, so they have to stay with their pragma.  */

void loop_w_1()
{
  int x = 5, i, arr[32 * 32];

  /* Start from arr[n] == n so the final check can isolate the increment.  */
  for (i = 0; i < 32 * 32; i++)
    arr[i] = i;

  #pragma acc parallel copy(arr) num_gangs(32) num_workers(8) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_compute$c_compute } */
  /* { dg-warning "region is vector partitioned but does not contain vector partitioned code" "" { target *-*-* } l_compute$c_compute } */
  {
    int j;

    #pragma acc loop gang /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        #pragma acc loop worker private(x) /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'x' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (j = 0; j < 32; j++)
          {
            x = i ^ j * 3;
            /* Try to ensure 'x' accesses don't get optimized into a
               temporary.  */
            __asm__ __volatile__ ("");
            arr[i * 32 + j] += x;
          }
      }
  }

  for (i = 0; i < 32 * 32; i++)
    assert (arr[i] == i + ((i / 32) ^ (i % 32) * 3));
}
|
|
|
|
|
|
/* Test of worker-private variables declared on a loop directive, broadcasting
   to vector-partitioned mode.

   Inside a gang loop over 'i', a worker loop over 'j' declares 'x'
   private and sets x = i ^ j * 3 before a nested vector loop over 'k'
   reads it, adding x * k to arr[i * 1024 + j * 32 + k].  The host then
   checks every element against idx + (i ^ j * 3) * k.

   The dg-* comments are testsuite directives: each dg-line names its
   pragma line, and the dg-note comments that follow refer back to that
   name, so they have to stay with their pragma.  */

void loop_w_2()
{
  int x = 5, i, arr[32 * 32 * 32];

  /* Start from arr[n] == n so the final check can isolate the increment.  */
  for (i = 0; i < 32 * 32 * 32; i++)
    arr[i] = i;

  #pragma acc parallel copy(arr) num_gangs(32) num_workers(32) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_compute$c_compute } */
  {
    int j;

    #pragma acc loop gang /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        #pragma acc loop worker private(x) /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'x' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'k' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (j = 0; j < 32; j++)
          {
            int k;
            x = i ^ j * 3;

            #pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              arr[i * 1024 + j * 32 + k] += x * k;
          }
      }
  }

  for (i = 0; i < 32; i++)
    for (int j = 0; j < 32; j++)
      for (int k = 0; k < 32; k++)
        {
          int idx = i * 1024 + j * 32 + k;
          assert (arr[idx] == idx + (i ^ j * 3) * k);
        }
}
|
|
|
|
|
|
/* Test of worker-private variables declared on a loop directive, broadcasting
   to vector-partitioned mode.  Back-to-back worker loops.

   Inside a gang loop over 'i' there are two consecutive worker loops over
   'j', each declaring 'x' private.  The first sets x = i ^ j * 3, the
   second x = i | j * 5; each then runs a nested vector loop over 'k' that
   adds x * k to arr[i * 1024 + j * 32 + k].  The host then checks every
   element against idx + (i ^ j * 3) * k + (i | j * 5) * k.

   The dg-* comments are testsuite directives: each dg-line names its
   pragma line, and the dg-note comments that follow refer back to that
   name, so they have to stay with their pragma.  */

void loop_w_3()
{
  int x = 5, i, arr[32 * 32 * 32];

  /* Start from arr[n] == n so the final check can isolate the increments.  */
  for (i = 0; i < 32 * 32 * 32; i++)
    arr[i] = i;

  #pragma acc parallel copy(arr) num_gangs(32) num_workers(32) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_compute$c_compute } */
  {
    int j;

    #pragma acc loop gang /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        #pragma acc loop worker private(x) /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'x' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'k' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (j = 0; j < 32; j++)
          {
            int k;
            x = i ^ j * 3;

            #pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              arr[i * 1024 + j * 32 + k] += x * k;
          }

        #pragma acc loop worker private(x) /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'x' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'k' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (j = 0; j < 32; j++)
          {
            int k;
            x = i | j * 5;

            #pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              arr[i * 1024 + j * 32 + k] += x * k;
          }
      }
  }

  for (i = 0; i < 32; i++)
    for (int j = 0; j < 32; j++)
      for (int k = 0; k < 32; k++)
        {
          int idx = i * 1024 + j * 32 + k;
          assert (arr[idx] == idx + (i ^ j * 3) * k + (i | j * 5) * k);
        }
}
|
|
|
|
|
|
/* Test of worker-private variables declared on a loop directive, broadcasting
   to vector-partitioned mode.  Successive vector loops.

   Inside a gang loop over 'i', a single worker loop over 'j' declares 'x'
   private.  Its body sets x = i ^ j * 3 and runs a vector loop over 'k',
   then sets x = i | j * 5 and runs a second vector loop; both vector
   loops add x * k to arr[i * 1024 + j * 32 + k].  The host then checks
   every element against idx + (i ^ j * 3) * k + (i | j * 5) * k.

   The dg-* comments are testsuite directives: each dg-line names its
   pragma line, and the dg-note comments that follow refer back to that
   name, so they have to stay with their pragma.  */

void loop_w_4()
{
  int x = 5, i, arr[32 * 32 * 32];

  /* Start from arr[n] == n so the final check can isolate the increments.  */
  for (i = 0; i < 32 * 32 * 32; i++)
    arr[i] = i;

  #pragma acc parallel copy(arr) num_gangs(32) num_workers(32) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_compute$c_compute } */
  {
    int j;

    #pragma acc loop gang /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        #pragma acc loop worker private(x) /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'x' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'k' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (j = 0; j < 32; j++)
          {
            int k;
            x = i ^ j * 3;

            #pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              arr[i * 1024 + j * 32 + k] += x * k;

            x = i | j * 5;

            #pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              arr[i * 1024 + j * 32 + k] += x * k;
          }
      }
  }

  for (i = 0; i < 32; i++)
    for (int j = 0; j < 32; j++)
      for (int k = 0; k < 32; k++)
        {
          int idx = i * 1024 + j * 32 + k;
          assert (arr[idx] == idx + (i ^ j * 3) * k + (i | j * 5) * k);
        }
}
|
|
|
|
|
|
/* Test of worker-private variables declared on a loop directive, broadcasting
   to vector-partitioned mode.  Addressable worker variable.

   Same shape as two successive vector loops inside one worker loop, but
   the address of the private 'x' is taken ('p = &x') and the second value,
   i | j * 5, is stored through 'p' rather than assigned to 'x' directly.
   Both vector loops add x * k to arr[i * 1024 + j * 32 + k].  The host
   then checks every element against
   idx + (i ^ j * 3) * k + (i | j * 5) * k.

   The dg-* comments are testsuite directives: each dg-line names its
   pragma line, and the dg-note comments that follow refer back to that
   name, so they have to stay with their pragma.  Unlike the other worker
   tests, the notes here expect 'x' to be a candidate for adjusting the
   privatization level.  */

void loop_w_5()
{
  int x = 5, i, arr[32 * 32 * 32];

  /* Start from arr[n] == n so the final check can isolate the increments.  */
  for (i = 0; i < 32 * 32 * 32; i++)
    arr[i] = i;

  #pragma acc parallel copy(arr) num_gangs(32) num_workers(32) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_compute$c_compute } */
  {
    int j;

    #pragma acc loop gang /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        #pragma acc loop worker private(x) /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'x' in 'private' clause is candidate for adjusting OpenACC privatization level} "" { target *-*-* } l_loop$c_loop }
           { dg-note {variable 'x' ought to be adjusted for OpenACC privatization level: 'worker'} "" { target *-*-* } l_loop$c_loop }
           { dg-note {variable 'x' adjusted for OpenACC privatization level: 'worker'} "TODO" { target { ! openacc_host_selected } xfail *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'k' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'p' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (j = 0; j < 32; j++)
          {
            int k;
            int *p = &x;

            x = i ^ j * 3;

            #pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              arr[i * 1024 + j * 32 + k] += x * k;

            /* Update 'x' through its address.  */
            *p = i | j * 5;

            #pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              arr[i * 1024 + j * 32 + k] += x * k;
          }
      }
  }

  for (i = 0; i < 32; i++)
    for (int j = 0; j < 32; j++)
      for (int k = 0; k < 32; k++)
        {
          int idx = i * 1024 + j * 32 + k;
          assert (arr[idx] == idx + (i ^ j * 3) * k + (i | j * 5) * k);
        }
}
|
|
|
|
|
|
/* Test of worker-private variables declared on a loop directive, broadcasting
|
|
to vector-partitioned mode. Aggregate worker variable. */
|
|
|
|
void loop_w_6()
|
|
{
|
|
int i, arr[32 * 32 * 32];
|
|
vec2 pt;
|
|
|
|
for (i = 0; i < 32 * 32 * 32; i++)
|
|
arr[i] = i;
|
|
|
|
#pragma acc parallel copy(arr) num_gangs(32) num_workers(32) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
|
|
/* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_compute$c_compute } */
|
|
{
|
|
int j;
|
|
|
|
#pragma acc loop gang /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (i = 0; i < 32; i++)
|
|
{
|
|
#pragma acc loop worker private(pt) /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
/* { dg-note {variable 'pt' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
/* { dg-note {variable 'k' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (j = 0; j < 32; j++)
|
|
{
|
|
int k;
|
|
|
|
pt.x = i ^ j * 3;
|
|
pt.y = i | j * 5;
|
|
|
|
#pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (k = 0; k < 32; k++)
|
|
arr[i * 1024 + j * 32 + k] += pt.x * k;
|
|
|
|
#pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (k = 0; k < 32; k++)
|
|
arr[i * 1024 + j * 32 + k] += pt.y * k;
|
|
}
|
|
}
|
|
}
|
|
|
|
for (i = 0; i < 32; i++)
|
|
for (int j = 0; j < 32; j++)
|
|
for (int k = 0; k < 32; k++)
|
|
{
|
|
int idx = i * 1024 + j * 32 + k;
|
|
assert (arr[idx] == idx + (i ^ j * 3) * k + (i | j * 5) * k);
|
|
}
|
|
}
|
|
|
|
|
|
/* Test of worker-private variables declared on loop directive, broadcasting
   to vector-partitioned mode.  Array worker variable.

   Inside a gang loop over 'i', a worker loop over 'j' declares the
   two-element array 'pt' private.  Its body sets pt[0] = i ^ j * 3 and
   runs a vector loop over 'k' adding pt[0] * k, then sets
   pt[1] = i | j * 5 and runs a second vector loop adding pt[1] * k, both
   to arr[i * 1024 + j * 32 + k].  The host then checks every element
   against idx + (i ^ j * 3) * k + (i | j * 5) * k.

   The dg-* comments are testsuite directives: each dg-line names its
   pragma line, and the dg-note comments that follow refer back to that
   name, so they have to stay with their pragma.  */

void loop_w_7()
{
  int i, arr[32 * 32 * 32];
  int pt[2];

  /* Start from arr[n] == n so the final check can isolate the increments.  */
  for (i = 0; i < 32 * 32 * 32; i++)
    arr[i] = i;

  /* "pt" is treated as "present_or_copy" on the parallel directive because it
     is an array variable.  */
  #pragma acc parallel copy(arr) num_gangs(32) num_workers(32) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_compute$c_compute } */
  {
    int j;

    #pragma acc loop gang /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        /* But here, it is made private per-worker.  */
        #pragma acc loop worker private(pt) /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'pt' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        /* { dg-note {variable 'k' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (j = 0; j < 32; j++)
          {
            int k;

            pt[0] = i ^ j * 3;

            #pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              arr[i * 1024 + j * 32 + k] += pt[0] * k;

            pt[1] = i | j * 5;

            #pragma acc loop vector /* { dg-line l_loop[incr c_loop] } */
            /* { dg-note {variable 'k' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
            for (k = 0; k < 32; k++)
              arr[i * 1024 + j * 32 + k] += pt[1] * k;
          }
      }
  }

  for (i = 0; i < 32; i++)
    for (int j = 0; j < 32; j++)
      for (int k = 0; k < 32; k++)
        {
          int idx = i * 1024 + j * 32 + k;
          assert (arr[idx] == idx + (i ^ j * 3) * k + (i | j * 5) * k);
        }
}
|
|
|
|
|
|
/* Test of gang-private variables declared on the parallel directive. */
|
|
|
|
void parallel_g_1()
|
|
{
|
|
int x = 5, i, arr[32];
|
|
|
|
for (i = 0; i < 32; i++)
|
|
arr[i] = 3;
|
|
|
|
#pragma acc parallel private(x) copy(arr) num_gangs(32) num_workers(8) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
|
|
/* { dg-warning "region is worker partitioned but does not contain worker partitioned code" "" { target *-*-* } l_compute$c_compute } */
|
|
/* { dg-warning "region is vector partitioned but does not contain vector partitioned code" "" { target *-*-* } l_compute$c_compute } */
|
|
{
|
|
#pragma acc loop gang(static:1) /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (i = 0; i < 32; i++)
|
|
x = i * 2;
|
|
|
|
#pragma acc loop gang(static:1) /* { dg-line l_loop[incr c_loop] } */
|
|
/* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
|
|
for (i = 0; i < 32; i++)
|
|
{
|
|
if (acc_on_device (acc_device_host))
|
|
x = i * 2;
|
|
arr[i] += x;
|
|
}
|
|
}
|
|
|
|
for (i = 0; i < 32; i++)
|
|
assert (arr[i] == 3 + i * 2);
|
|
}
|
|
|
|
|
|
/* Test of gang-private array variable declared on the parallel directive.

   The 32-element array 'x' is private on the parallel construct.  Each
   iteration of the gang loop over 'i' fills it with x[j] = j * 2, then a
   worker loop adds x[31 - j] to arr[i * 32 + j].  The host then checks
   arr[n] == n + (31 - (n % 32)) * 2 for all 32 * 32 elements.

   The dg-* comments are testsuite directives: each dg-line names its
   pragma line, and the dg-note/dg-warning comments that follow refer back
   to that name, so they have to stay with their pragma.  */

void parallel_g_2()
{
  int x[32], i, arr[32 * 32];

  /* Start from arr[n] == n so the final check can isolate the increment.  */
  for (i = 0; i < 32 * 32; i++)
    arr[i] = i;

  #pragma acc parallel private(x) copy(arr) num_gangs(32) num_workers(2) vector_length(32) /* { dg-line l_compute[incr c_compute] } */
  /* { dg-warning "region is vector partitioned but does not contain vector partitioned code" "" { target *-*-* } l_compute$c_compute } */
  {
    #pragma acc loop gang /* { dg-line l_loop[incr c_loop] } */
    /* { dg-note {variable 'i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    /* { dg-note {variable 'j' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
    for (i = 0; i < 32; i++)
      {
        int j;
        for (j = 0; j < 32; j++)
          x[j] = j * 2;

        #pragma acc loop worker /* { dg-line l_loop[incr c_loop] } */
        /* { dg-note {variable 'j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } l_loop$c_loop } */
        for (j = 0; j < 32; j++)
          arr[i * 32 + j] += x[31 - j];
      }
  }

  for (i = 0; i < 32 * 32; i++)
    assert (arr[i] == i + (31 - (i % 32)) * 2);
}
|
|
|
|
|
|
/* Run every test function of this file in turn and return 0.  The test
   functions visible in this part of the file verify their own results
   with assert, so reaching the return means none of those checks
   failed.  */

int main ()
{
  local_g_1();
  local_w_1();
  local_w_2();
  local_w_3();
  local_w_4();
  local_w_5();
  loop_g_1();
  loop_g_2();
  loop_g_3();
  loop_g_4();
  loop_g_5();
  loop_g_6();
  loop_v_1();
  loop_v_2();
  loop_w_1();
  loop_w_2();
  loop_w_3();
  loop_w_4();
  loop_w_5();
  loop_w_6();
  loop_w_7();
  parallel_g_1();
  parallel_g_2();

  return 0;
}
|