/* Commit f8e89d9f4d

   2015-06-30  Tom de Vries  <tom@codesourcery.com>

     * testsuite/libgomp.c++/c++.exp: Set DEFAULT_CFLAGS to -O2 if not
     already set.  Use DEFAULT_CFLAGS in dg-runtest.
     * testsuite/libgomp.c++/atomic-16.C: Remove dg-options "-O2 -fopenmp".
     * testsuite/libgomp.c++/pr64824.C: Same.
     * testsuite/libgomp.c++/pr64868.C: Same.
     * testsuite/libgomp.c++/pr66199-1.C: Same.
     * testsuite/libgomp.c++/pr66199-2.C: Same.
     * testsuite/libgomp.c++/target-2.C: Same.
     * testsuite/libgomp.c++/for-7.C: Use dg-additional-options for
     -std=<standard> option.
     * testsuite/libgomp.c++/udr-11.C: Same.
     * testsuite/libgomp.c++/udr-12.C: Same.
     * testsuite/libgomp.c++/udr-13.C: Same.
     * testsuite/libgomp.c++/udr-14.C: Same.
     * testsuite/libgomp.c++/udr-15.C: Same.
     * testsuite/libgomp.c++/udr-16.C: Same.
     * testsuite/libgomp.c++/udr-17.C: Same.
     * testsuite/libgomp.c++/udr-18.C: Same.
     * testsuite/libgomp.c++/udr-19.C: Same.
     * testsuite/libgomp.c++/atomic-1.C: Remove dg-options "-O2".
     * testsuite/libgomp.c++/simd-1.C: Same.
     * testsuite/libgomp.c++/simd-2.C: Same.
     * testsuite/libgomp.c++/simd-3.C: Same.
     * testsuite/libgomp.c++/simd-4.C: Same.
     * testsuite/libgomp.c++/simd-5.C: Same.
     * testsuite/libgomp.c++/simd-6.C: Same.
     * testsuite/libgomp.c++/simd-7.C: Same.
     * testsuite/libgomp.c++/simd-8.C: Same.
     * testsuite/libgomp.c++/simd-9.C: Same.
     * testsuite/libgomp.c++/simd10.C: Same.
     * testsuite/libgomp.c++/simd11.C: Same.
     * testsuite/libgomp.c++/simd12.C: Same.
     * testsuite/libgomp.c++/simd13.C: Same.

   From-SVN: r225181

   131 lines, 3.0 KiB, C.  */
// { dg-do run }
// { dg-additional-options "-msse2" { target sse2_runtime } }
// { dg-additional-options "-mavx" { target avx_runtime } }

/* Declared by hand instead of through a header; main calls it whenever
   one of its checks fails.  */
extern "C" void abort ();

/* Work arrays shared by foo, bar and main.  Each is 32-byte aligned,
   matching the 32 given in the aligned clauses of the simd pragmas in
   foo and bar.  The { 1 } initializer only sets element 0 (the rest are
   zero); main overwrites every element before the arrays are used.  */
int a[1024] __attribute__((aligned (32))) = { 1 };
int b[1024] __attribute__((aligned (32))) = { 1 };
unsigned char c[1024] __attribute__((aligned (32))) = { 1 };

/* k is the variable named in the linear clauses of foo and bar; m feeds
   the step expression (m + 1) used there.  */
int k, m;

/* Written inside the second simd loop of foo and bar with the addresses
   of k, s2 and t converted to integers.  */
__UINTPTR_TYPE__ u, u2, u3;

__attribute__((noinline, noclone)) int
|
|
foo (int *p)
|
|
{
|
|
int i, s = 0, s2 = 0, t, t2;
|
|
#pragma omp simd aligned(a, b, p : 32) linear(k: m + 1) reduction(+:s) \
|
|
lastprivate (t2)
|
|
for (i = 0; i < 512; i++)
|
|
{
|
|
a[i] *= p[i];
|
|
t2 = k + p[i];
|
|
k += m + 1;
|
|
s += p[i] + k;
|
|
c[i]++;
|
|
}
|
|
#pragma omp simd aligned(a, b, p : 32) linear(k: m + 1) reduction(+:s2) \
|
|
lastprivate (t, u, u2, u3)
|
|
for (i = 512; i < 1024; i++)
|
|
{
|
|
a[i] *= p[i];
|
|
k += m + 1;
|
|
t = k + p[i];
|
|
u = (__UINTPTR_TYPE__) &k;
|
|
u2 = (__UINTPTR_TYPE__) &s2;
|
|
u3 = (__UINTPTR_TYPE__) &t;
|
|
s2 += t;
|
|
c[i]++;
|
|
}
|
|
return s + s2 + t + t2;
|
|
}
|
|
|
|
__attribute__((noinline, noclone)) long int
|
|
bar (int *p, long int n, long int o)
|
|
{
|
|
long int i, s = 0, s2 = 0, t, t2;
|
|
#pragma omp simd aligned(a, b, p : 32) linear(k: m + 1) reduction(+:s) \
|
|
lastprivate (t2)
|
|
for (i = 0; i < n; i++)
|
|
{
|
|
a[i] *= p[i];
|
|
t2 = k + p[i];
|
|
k += m + 1;
|
|
s += p[i] + k;
|
|
c[i]++;
|
|
}
|
|
#pragma omp simd aligned(a, b, p : 32) linear(k: m + 1) reduction(+:s2) \
|
|
lastprivate (t, u, u2, u3)
|
|
for (i = n; i < o; i++)
|
|
{
|
|
a[i] *= p[i];
|
|
k += m + 1;
|
|
t = k + p[i];
|
|
u = (__UINTPTR_TYPE__) &k;
|
|
u2 = (__UINTPTR_TYPE__) &s2;
|
|
u3 = (__UINTPTR_TYPE__) &t;
|
|
s2 += t;
|
|
c[i]++;
|
|
}
|
|
return s + s2 + t + t2;
|
|
}
|
|
|
|
int
|
|
main ()
|
|
{
|
|
#if __SIZEOF_INT__ >= 4
|
|
int i;
|
|
k = 4;
|
|
m = 2;
|
|
for (i = 0; i < 1024; i++)
|
|
{
|
|
a[i] = i - 512;
|
|
b[i] = (i - 51) % 39;
|
|
c[i] = (unsigned char) i;
|
|
}
|
|
int s = foo (b);
|
|
for (i = 0; i < 1024; i++)
|
|
{
|
|
if (b[i] != (i - 51) % 39
|
|
|| a[i] != (i - 512) * b[i]
|
|
|| c[i] != (unsigned char) (i + 1))
|
|
abort ();
|
|
a[i] = i - 512;
|
|
}
|
|
if (k != 4 + 3 * 1024
|
|
|| s != 1596127 + (4 + 3 * 511 + b[511]) + (4 + 3 * 1024 + b[1023]))
|
|
abort ();
|
|
k = 4;
|
|
s = bar (b, 512, 1024);
|
|
for (i = 0; i < 1024; i++)
|
|
{
|
|
if (b[i] != (i - 51) % 39
|
|
|| a[i] != (i - 512) * b[i]
|
|
|| c[i] != (unsigned char) (i + 2))
|
|
abort ();
|
|
a[i] = i - 512;
|
|
}
|
|
if (k != 4 + 3 * 1024
|
|
|| s != 1596127 + (4 + 3 * 511 + b[511]) + (4 + 3 * 1024 + b[1023]))
|
|
abort ();
|
|
k = 4;
|
|
s = bar (b, 511, 1021);
|
|
for (i = 0; i < 1021; i++)
|
|
{
|
|
if (b[i] != (i - 51) % 39
|
|
|| a[i] != (i - 512) * b[i]
|
|
|| c[i] != (unsigned char) (i + 3))
|
|
abort ();
|
|
a[i] = i - 512;
|
|
}
|
|
for (i = 1021; i < 1024; i++)
|
|
if (b[i] != (i - 51) % 39
|
|
|| a[i] != i - 512
|
|
|| c[i] != (unsigned char) (i + 2))
|
|
abort ();
|
|
if (k != 4 + 3 * 1021
|
|
|| s != 1586803 + (4 + 3 * 510 + b[510]) + (4 + 3 * 1021 + b[1020]))
|
|
abort ();
|
|
#endif
|
|
return 0;
|
|
}
|