ffbdd78a4a
* testsuite/libgomp.oacc-fortran/abort-1.f90: Add 'dg-do run'. * testsuite/libgomp.oacc-fortran/abort-2.f90: Ditto. * testsuite/libgomp.oacc-fortran/acc_on_device-1-1.f90: Ditto. * testsuite/libgomp.oacc-fortran/acc_on_device-1-2.f90: Ditto. * testsuite/libgomp.oacc-fortran/acc_on_device-1-3.f90: Ditto. * testsuite/libgomp.oacc-fortran/lib-1.f90: Ditto. * testsuite/libgomp.oacc-fortran/common-block-1.f90: Use 'stop' not abort(). * testsuite/libgomp.oacc-fortran/common-block-2.f90: Ditto. * testsuite/libgomp.oacc-fortran/common-block-3.f90: Ditto. * testsuite/libgomp.oacc-fortran/data-1.f90: Ditto. * testsuite/libgomp.oacc-fortran/data-2.f90: Ditto. * testsuite/libgomp.oacc-fortran/data-5.f90: Ditto. * testsuite/libgomp.oacc-fortran/dummy-array.f90: Ditto. * testsuite/libgomp.oacc-fortran/gemm-2.f90: Ditto. * testsuite/libgomp.oacc-fortran/gemm.f90: Ditto. * testsuite/libgomp.oacc-fortran/host_data-2.f90: Ditto. * testsuite/libgomp.oacc-fortran/host_data-3.f90: Ditto. * testsuite/libgomp.oacc-fortran/host_data-4.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-collapse-3.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-collapse-4.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-independent.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-loop-1.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-map-1.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-parallel-loop-data-enter-exit.f95: Ditto. * testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-gang-1.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-gang-2.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-gang-3.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-private-vars-loop-gang-6.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-private-vars-vector-1.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-private-vars-vector-2.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-private-vars-worker-1.f90: Ditto. 
* testsuite/libgomp.oacc-fortran/kernels-private-vars-worker-2.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-private-vars-worker-3.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-private-vars-worker-4.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-private-vars-worker-5.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-private-vars-worker-6.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-private-vars-worker-7.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-reduction-1.f90: Ditto. * testsuite/libgomp.oacc-fortran/lib-12.f90: Ditto. * testsuite/libgomp.oacc-fortran/lib-13.f90: Ditto. * testsuite/libgomp.oacc-fortran/lib-14.f90: Ditto. * testsuite/libgomp.oacc-fortran/kernels-acc-loop-reduction-2.f90: Likewise and also add 'dg-do run'. * testsuite/libgomp.oacc-fortran/kernels-acc-loop-reduction.f90: Ditto. From-SVN: r277503
81 lines
1.7 KiB
Fortran
81 lines
1.7 KiB
Fortran
! Exercise three levels of parallelism using SGEMM from BLAS.

! { dg-do run }
! { dg-additional-options "-fopenacc-dim=::128" }

! Implicitly set vector_length to 128 using -fopenacc-dim.
!> SGEMM-style update of c, with the loop nest annotated for OpenACC.
!!
!! For every i in 1..m and j in 1..n the routine accumulates
!!   temp = sum over l = 1..k of a(l,i) * b(l,j)
!! and then stores
!!   c(i,j) = alpha*temp                  when beta compares equal to 0.0
!!   c(i,j) = alpha*temp + beta*c(i,j)    otherwise.
!! Note that a is indexed as a(l,i): the summation index comes first.
!!
!! Arguments:
!!   m, n   (in)    row and column extents of the part of c that is updated
!!   k      (in)    summation length; also the leading extent of a and b
!!   alpha  (in)    factor applied to the accumulated product
!!   a      (in)    assumed-size array; elements a(1:k,1:m) are read
!!   b      (in)    assumed-size array; elements b(1:k,1:n) are read
!!   beta   (in)    factor applied to the previous contents of c
!!   c      (inout) assumed-size array; elements c(1:m,1:n) are updated
subroutine openacc_sgemm (m, n, k, alpha, a, b, beta, c)
  implicit none
  integer, intent(in) :: m, n, k
  real, intent(in) :: alpha, beta
  real, intent(in) :: a(k,*), b(k,*)
  real, intent(inout) :: c(m,*)

  integer :: i, j, l
  real :: temp

  ! The arrays are assumed-size, so the data clauses spell out the exact
  ! sections the loop nest touches.  The directives are kept exactly as in
  ! the original test; only the declarations above were tightened.
  !$acc parallel loop copy(c(1:m,1:n)) copyin(a(1:k,1:m),b(1:k,1:n)) firstprivate (temp)
  do j = 1, n
    !$acc loop
    do i = 1, m
      ! temp is reset for every (i,j) before the reduction loop uses it.
      temp = 0.0
      !$acc loop reduction(+:temp)
      do l = 1, k
        temp = temp + a(l,i)*b(l,j)
      end do
      ! When beta is zero the old value of c(i,j) is not read at all.
      if (beta == 0.0) then
        c(i,j) = alpha*temp
      else
        c(i,j) = alpha*temp + beta*c(i,j)
      end if
    end do
  end do
end subroutine openacc_sgemm
|
|
|
|
!> Sequential reference version of the SGEMM-style update of c.
!!
!! Contains no OpenACC directives.  For every i in 1..m and j in 1..n it
!! accumulates
!!   temp = sum over l = 1..k of a(l,i) * b(l,j)
!! and then stores
!!   c(i,j) = alpha*temp                  when beta compares equal to 0.0
!!   c(i,j) = alpha*temp + beta*c(i,j)    otherwise.
!!
!! Arguments:
!!   m, n   (in)    row and column extents of the part of c that is updated
!!   k      (in)    summation length; also the leading extent of a and b
!!   alpha  (in)    factor applied to the accumulated product
!!   a      (in)    assumed-size array; elements a(1:k,1:m) are read
!!   b      (in)    assumed-size array; elements b(1:k,1:n) are read
!!   beta   (in)    factor applied to the previous contents of c
!!   c      (inout) assumed-size array; elements c(1:m,1:n) are updated
subroutine host_sgemm (m, n, k, alpha, a, b, beta, c)
  implicit none
  integer, intent(in) :: m, n, k
  real, intent(in) :: alpha, beta
  real, intent(in) :: a(k,*), b(k,*)
  real, intent(inout) :: c(m,*)

  integer :: i, j, l
  real :: temp

  ! Kept as a plain triple loop (rather than an intrinsic reduction) so the
  ! summation runs strictly in order l = 1, 2, ..., k.
  do j = 1, n
    do i = 1, m
      temp = 0.0
      do l = 1, k
        temp = temp + a(l,i)*b(l,j)
      end do
      ! When beta is zero the old value of c(i,j) is not read at all.
      if (beta == 0.0) then
        c(i,j) = alpha*temp
      else
        c(i,j) = alpha*temp + beta*c(i,j)
      end if
    end do
  end do
end subroutine host_sgemm
|
|
|
|
!> Test driver: runs the OpenACC-annotated and the sequential SGEMM
!! routines on identical inputs and terminates with `stop 1` if any
!! element of the two results differs.
program main
  implicit none
  integer, parameter :: M = 100, N = 50, K = 2000
  real :: a(K, M), b(K, N), c(M, N), e(M, N)
  real :: alpha, beta

  ! Every product a(l,i)*b(l,j) is 1.0*0.25, so each length-K sum is a
  ! multiple of 0.25 no larger than 500 and is exactly representable in
  ! default real; the order in which the terms are added therefore cannot
  ! change the sum.
  a(:,:) = 1.0
  b(:,:) = 0.25

  ! c receives the OpenACC result, e the sequential one; both start at zero.
  c(:,:) = 0.0
  e(:,:) = 0.0

  ! beta is non-zero, so the previous contents of the result array take
  ! part in the update.
  alpha = 1.05
  beta = 1.25

  call openacc_sgemm (M, N, K, alpha, a, b, beta, c)
  call host_sgemm (M, N, K, alpha, a, b, beta, e)

  ! Exact comparison is intentional here (see the note on the inputs above).
  if (any(c /= e)) stop 1
end program main
|