| ! { dg-additional-options "-O2" } |
| ! { dg-additional-options "-fdump-tree-parloops1-all" } |
| ! { dg-additional-options "-fdump-tree-optimized" } |
| |
| program main |
| implicit none |
| integer, parameter :: n = 1024 |
| integer, dimension (0:n-1) :: a, b, c |
| integer :: i, ii |
| |
| !$acc enter data create (a(0:n-1), b(0:n-1), c(0:n-1)) |
| |
| !$acc kernels present (a(0:n-1)) |
| do i = 0, n - 1 |
| a(i) = i * 2 |
| end do |
| !$acc end kernels |
| |
| do i = 0, n -1 |
| b(i) = i * 4 |
| end do |
| |
| !$acc update device (b(0:n-1)) |
| |
| !$acc kernels present (a(0:n-1), b(0:n-1), c(0:n-1)) |
| do ii = 0, n - 1 |
| c(ii) = a(ii) + b(ii) |
| end do |
| !$acc end kernels |
| |
| !$acc exit data copyout (a(0:n-1), c(0:n-1)) |
| |
| do i = 0, n - 1 |
| if (c(i) .ne. a(i) + b(i)) STOP 1 |
| end do |
| |
| end program main |
| |
| ! Check that only three loops are analyzed, and that all can be parallelized. |
| ! { dg-final { scan-tree-dump-times "SUCCESS: may be parallelized" 2 "parloops1" } } |
| ! { dg-final { scan-tree-dump-times "(?n)__attribute__\\(\\(oacc kernels parallelized, oacc function \\(, , \\), oacc kernels, omp target entrypoint\\)\\)" 2 "parloops1" } } |
| ! { dg-final { scan-tree-dump-not "FAILED:" "parloops1" } } |
| |
| ! Check that the loop has been split off into a function. |
| ! { dg-final { scan-tree-dump-times "(?n);; Function MAIN__._omp_fn.0 " 1 "optimized" } } |
| ! { dg-final { scan-tree-dump-times "(?n);; Function MAIN__._omp_fn.1 " 1 "optimized" } } |