-
Notifications
You must be signed in to change notification settings - Fork 0
/
saxpy.f90
79 lines (70 loc) · 1.98 KB
/
saxpy.f90
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
!
! SPDX-FileCopyrightText: Copyright (c) 2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
! SPDX-License-Identifier: LicenseRef-NvidiaProprietary
!
! NVIDIA CORPORATION, its affiliates and licensors retain all intellectual
! property and proprietary rights in and to this material, related
! documentation and any modifications thereto. Any use, reproduction,
! disclosure or distribution of this material and related documentation
! without an express license agreement from NVIDIA CORPORATION or
! its affiliates is strictly prohibited.
!
!
! SAXPY (y = a*x + y) example using the DO CONCURRENT construct in Fortran
! Build with
! nvfortran -stdpar -Minfo -fast saxpy.f90
! To target multicore CPUs instead, build with
! nvfortran -stdpar=multicore -Minfo=accel -fast saxpy.f90
!
!> SAXPY kernels: update y in place with y = a*x + y.
!> Two variants with identical arguments and results are provided so that
!> a plain sequential DO loop can be compared against DO CONCURRENT.
module sm
  implicit none
  private
  public :: saxpy_concurrent, saxpy_do
contains

  !> SAXPY written with DO CONCURRENT.
  !> x : input vector (read only)
  !> y : vector updated in place; elements 1..n become a*x(i) + y(i)
  !> n : number of leading elements to process; the caller must ensure
  !>     n does not exceed size(x) or size(y) (not checked here)
  !> a : scalar multiplier applied to x
  subroutine saxpy_concurrent(x, y, n, a)
    real, dimension(:), intent(in)    :: x
    real, dimension(:), intent(inout) :: y
    integer,            intent(in)    :: n
    real,               intent(in)    :: a
    integer :: i

    ! Each iteration touches only element i, so iterations are independent.
    do concurrent (i = 1:n)
      y(i) = a*x(i) + y(i)
    end do
  end subroutine saxpy_concurrent

  !> SAXPY written with an ordinary sequential DO loop.
  !> Arguments have the same meaning as in saxpy_concurrent.
  subroutine saxpy_do(x, y, n, a)
    real, dimension(:), intent(in)    :: x
    real, dimension(:), intent(inout) :: y
    integer,            intent(in)    :: n
    real,               intent(in)    :: a
    integer :: i

    do i = 1, n
      y(i) = a*x(i) + y(i)
    end do
  end subroutine saxpy_do

end module sm
!> Driver: times the sequential and DO CONCURRENT SAXPY kernels on identical
!> inputs and verifies that both produce the same output vector.
program main
  use, intrinsic :: iso_fortran_env, only: int64, real64
  use sm, only: saxpy_concurrent, saxpy_do
  implicit none

  ! Problem size: three default-real arrays of this length are allocated.
  integer, parameter :: n = 1000000000
  real,    parameter :: a = 2.0
  ! Relative tolerance for comparing the two result vectors; allows for
  ! small rounding differences (e.g. fused multiply-add on one path only).
  real,    parameter :: rel_tol = 4.0 * epsilon(1.0)

  real, dimension(:), allocatable :: x, y_seq, y_par
  integer        :: i, err, alloc_stat
  integer(int64) :: c0, c1, c2, clock_rate, cseq, cpar

  allocate(x(n), y_seq(n), y_par(n), stat=alloc_stat)
  if (alloc_stat /= 0) error stop "saxpy: could not allocate work arrays"

  ! Both kernels get the same x and an identical starting y, each in its own
  ! array, so their outputs can be compared afterwards.
  x = 1.0
  do i = 1, n
    y_seq(i) = real(i)
    y_par(i) = real(i)
  end do

  ! The tick unit of system_clock is processor dependent; query the rate so
  ! the elapsed counts can be converted to real microseconds.
  call system_clock(count_rate=clock_rate)

  call system_clock(count=c0)
  call saxpy_do(x, y_seq, n, a)
  call system_clock(count=c1)
  call saxpy_concurrent(x, y_par, n, a)
  call system_clock(count=c2)

  cseq = ticks_to_microseconds(c1 - c0, clock_rate)
  cpar = ticks_to_microseconds(c2 - c1, clock_rate)

  ! Count elements where the parallel result disagrees with the sequential
  ! one. Written as .not. (<=) so that a NaN result is counted as an error.
  err = 0
  do i = 1, n
    if (.not. (abs(y_par(i) - y_seq(i)) <= rel_tol * abs(y_seq(i)))) then
      err = err + 1
    end if
  end do

  print *, cseq, ' microseconds sequential'
  print *, cpar, ' microseconds parallel with stdpar'

  deallocate(x, y_seq, y_par)

  if (err == 0) then
    print *, "Test PASSED"
  else
    print *, "Test FAILED"
    ! Report the failure through the exit status as well.
    error stop 1
  end if

contains

  !> Convert a system_clock tick interval to whole microseconds.
  !> Returns -1 when rate is not positive (no usable clock).
  function ticks_to_microseconds(ticks, rate) result(us)
    integer(int64), intent(in) :: ticks, rate
    integer(int64) :: us

    if (rate > 0_int64) then
      ! Go through real64 to avoid integer overflow in ticks * 1e6.
      us = nint(real(ticks, real64) * 1.0e6_real64 / real(rate, real64), kind=int64)
    else
      us = -1_int64
    end if
  end function ticks_to_microseconds

end program main