2620c80db0
gcc/testsuite/ * c-c++-common/goacc/combined-directives.c: Clean up dg-* directives. * c-c++-common/goacc/loop-clauses.c: Likewise. * g++.dg/goacc/template.C: Likewise. * gfortran.dg/goacc/combined-directives.f90: Likewise. * gfortran.dg/goacc/loop-1.f95: Likewise. * gfortran.dg/goacc/loop-5.f95: Likewise. * gfortran.dg/goacc/loop-6.f95: Likewise. * gfortran.dg/goacc/loop-tree-1.f90: Likewise. * c-c++-common/goacc-gomp/nesting-1.c: Update. * c-c++-common/goacc-gomp/nesting-fail-1.c: Likewise. * c-c++-common/goacc/clauses-fail.c: Likewise. * c-c++-common/goacc/parallel-1.c: Likewise. * c-c++-common/goacc/reduction-1.c: Likewise. * c-c++-common/goacc/reduction-2.c: Likewise. * c-c++-common/goacc/reduction-3.c: Likewise. * c-c++-common/goacc/reduction-4.c: Likewise. * c-c++-common/goacc/routine-3.c: Likewise. * c-c++-common/goacc/routine-4.c: Likewise. * c-c++-common/goacc/routine-5.c: Likewise. * c-c++-common/goacc/tile.c: Likewise. * g++.dg/goacc/template.C: Likewise. * gfortran.dg/goacc/combined-directives.f90: Likewise. * c-c++-common/goacc/nesting-1.c: Move dg-error test cases into... * c-c++-common/goacc/nesting-fail-1.c: ... this file. Update. * c-c++-common/goacc/kernels-1.c: Update. Incorporate... * c-c++-common/goacc/kernels-empty.c: ... this file, and... * c-c++-common/goacc/kernels-eternal.c: ... this file, and... * c-c++-common/goacc/kernels-noreturn.c: ... this file. * c-c++-common/goacc/host_data-1.c: New file. Incorporate... * c-c++-common/goacc/use_device-1.c: ... this file. * c-c++-common/goacc/host_data-2.c: New file. Incorporate... * c-c++-common/goacc/host_data-5.c: ... this file, and... * c-c++-common/goacc/host_data-6.c: ... this file. * c-c++-common/goacc/loop-2-kernels.c: New file. * c-c++-common/goacc/loop-2-parallel.c: Likewise. * c-c++-common/goacc/loop-3.c: Likewise. * g++.dg/goacc/reference.C: Likewise. * g++.dg/goacc/routine-1.C: Likewise. * g++.dg/goacc/routine-2.C: Likewise. 
libgomp/ * testsuite/libgomp.oacc-c-c++-common/clauses-1.c: Update. * testsuite/libgomp.oacc-c-c++-common/deviceptr-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/if-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/vector-loop.c: Likewise. * testsuite/libgomp.oacc-fortran/asyncwait-1.f90: Likewise. * testsuite/libgomp.oacc-fortran/asyncwait-2.f90: Likewise. * testsuite/libgomp.oacc-fortran/asyncwait-3.f90: Likewise. * testsuite/libgomp.oacc-fortran/declare-1.f90: Likewise. * testsuite/libgomp.oacc-c-c++-common/asyncwait-1.c: Likewise. XFAIL. * testsuite/libgomp.oacc-c-c++-common/firstprivate-1.c: Update. Incorporate... * testsuite/libgomp.oacc-c-c++-common/firstprivate-2.c: ... this file. * testsuite/libgomp.oacc-c++/template-reduction.C: New file. * testsuite/libgomp.oacc-c-c++-common/gang-static-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/gang-static-2.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-loop-clauses.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/private-variables.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/reduction-7.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/routine-1.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/routine-4.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/routine-wv-2.c: Likewise. * testsuite/libgomp.oacc-fortran/clauses-1.f90: Likewise. * testsuite/libgomp.oacc-fortran/default-1.f90: Likewise. * testsuite/libgomp.oacc-fortran/firstprivate-1.f90: Likewise. * testsuite/libgomp.oacc-fortran/gang-static-1.f90: Likewise. * testsuite/libgomp.oacc-fortran/if-1.f90: Likewise. * testsuite/libgomp.oacc-fortran/implicit-firstprivate-ref.f90: Likewise. * testsuite/libgomp.oacc-fortran/pr68813.f90: Likewise. * testsuite/libgomp.oacc-fortran/private-variables.f90: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-1.c: Merge this file... * testsuite/libgomp.oacc-c-c++-common/parallel-1.c: ..., and this file into... * testsuite/libgomp.oacc-c-c++-common/data-clauses.h: ... 
this new file. Update. * testsuite/libgomp.oacc-c-c++-common/data-clauses-kernels.c: New file. * testsuite/libgomp.oacc-c-c++-common/data-clauses-parallel.c: Likewise. * testsuite/libgomp.oacc-c-c++-common/kernels-2.c: Rename to... * testsuite/libgomp.oacc-c-c++-common/data-clauses-kernels-ipa-pta.c: ... this new file. Update. * testsuite/libgomp.oacc-c-c++-common/parallel-2.c: Rename to... * testsuite/libgomp.oacc-c-c++-common/data-clauses-parallel-ipa-pta.c: ... this new file. Update. * testsuite/libgomp.oacc-c-c++-common/mode-transitions.c: New file. Incorporate... * testsuite/libgomp.oacc-c-c++-common/worker-single-1a.c: ... this file, and... * testsuite/libgomp.oacc-c-c++-common/worker-single-4.c: ... this file, and... * testsuite/libgomp.oacc-c-c++-common/worker-single-6.c: ... this file. * testsuite/libgomp.oacc-c-c++-common/update-1-2.c: Remove file. Co-Authored-By: Cesar Philippidis <cesar@codesourcery.com> Co-Authored-By: Chung-Lin Tang <cltang@codesourcery.com> Co-Authored-By: James Norris <jnorris@codesourcery.com> Co-Authored-By: Julian Brown <julian@codesourcery.com> Co-Authored-By: Nathan Sidwell <nathan@codesourcery.com> Co-Authored-By: Tom de Vries <tom@codesourcery.com> From-SVN: r234575
77 lines
1.8 KiB
C
77 lines
1.8 KiB
C
/* This code uses nvptx inline assembly guarded with acc_on_device, which is
   not optimized away at -O0, and then confuses the target assembler.
   { dg-skip-if "" { *-*-* } { "-O0" } { "" } } */
|
|
|
|
#include <stdio.h>
|
|
#include <openacc.h>
|
|
|
|
/* Upper bound on the worker count: main tries 1, 2, 4, ... up to this.  */
#define NUM_WORKERS 16

/* vector_length requested for the parallel region; also the modulus used
   when computing the expected vector id on the host.  */
#define NUM_VECTORS 32

/* Shape of the result array: HEIGHT rows of WIDTH elements each.  */
#define WIDTH 64
#define HEIGHT 32
|
|
|
|
/* Identifier the test uses for the worker dimension.  When acc_on_device
   reports an NVIDIA device the value is read from the PTX %tid.y register
   via inline assembly; otherwise it is emulated as I modulo N.  I and N are
   evaluated only on the fallback path.  The arguments are parenthesized so
   that expression arguments keep their intended precedence.  */
#define WORK_ID(I,N) \
  (acc_on_device (acc_device_nvidia) \
   ? ({unsigned work_id_; \
       __asm__ volatile ("mov.u32 %0,%%tid.y;" : "=r" (work_id_)); \
       work_id_; }) \
   : ((I) % (N)))
|
|
/* Identifier the test uses for the vector dimension.  When acc_on_device
   reports an NVIDIA device the value is read from the PTX %tid.x register
   via inline assembly; otherwise it is emulated as I modulo N.  I and N are
   evaluated only on the fallback path.  The arguments are parenthesized so
   that expression arguments keep their intended precedence.  */
#define VEC_ID(I,N) \
  (acc_on_device (acc_device_nvidia) \
   ? ({unsigned vec_id_; \
       __asm__ volatile ("mov.u32 %0,%%tid.x;" : "=r" (vec_id_)); \
       vec_id_; }) \
   : ((I) % (N)))
|
|
|
|
/* Fill the row-major array at PTR, which holds H rows of W elements.  The
   rows are iterated by a worker loop and the elements of each row by a
   vector loop.  Each element is set to the WORK_ID of its row index shifted
   left by 8 bits, OR-ed with the VEC_ID of its column index.  NW and NV are
   the moduli handed to WORK_ID and VEC_ID respectively.  */
#pragma acc routine worker
void __attribute__ ((noinline))
WorkVec (int *ptr, int w, int h, int nw, int nv)
{
#pragma acc loop worker
  for (int row = 0; row < h; row++)
    {
#pragma acc loop vector
      for (int col = 0; col < w; col++)
        {
          /* Both macros yield an unsigned value, so the temporaries keep
             the arithmetic in unsigned before the store to an int.  */
          unsigned worker_bits = WORK_ID (row, nw) << 8;
          unsigned vector_bits = VEC_ID (col, nv);

          ptr[row * w + col] = worker_bits | vector_bits;
        }
    }
}
|
|
|
|
int DoWorkVec (int nw)
|
|
{
|
|
int ary[HEIGHT][WIDTH];
|
|
int err = 0;
|
|
|
|
for (int ix = 0; ix != HEIGHT; ix++)
|
|
for (int jx = 0; jx != WIDTH; jx++)
|
|
ary[ix][jx] = 0xdeadbeef;
|
|
|
|
printf ("spawning %d ...", nw); fflush (stdout);
|
|
|
|
#pragma acc parallel num_workers(nw) vector_length (NUM_VECTORS) copy (ary)
|
|
{
|
|
WorkVec ((int *)ary, WIDTH, HEIGHT, nw, NUM_VECTORS);
|
|
}
|
|
|
|
for (int ix = 0; ix != HEIGHT; ix++)
|
|
for (int jx = 0; jx != WIDTH; jx++)
|
|
{
|
|
int exp = ((ix % nw) << 8) | (jx % NUM_VECTORS);
|
|
|
|
if (ary[ix][jx] != exp)
|
|
{
|
|
printf ("\nary[%d][%d] = %#x expected %#x", ix, jx,
|
|
ary[ix][jx], exp);
|
|
err = 1;
|
|
}
|
|
}
|
|
printf (err ? " failed\n" : " ok\n");
|
|
|
|
return err;
|
|
}
|
|
|
|
int main ()
|
|
{
|
|
int err = 0;
|
|
|
|
for (int W = 1; W <= NUM_WORKERS; W <<= 1)
|
|
err |= DoWorkVec (W);
|
|
|
|
return err;
|
|
}
|