-
Notifications
You must be signed in to change notification settings - Fork 10
/
Copy pathaccess_efficiency.f90
130 lines (113 loc) · 2.85 KB
/
access_efficiency.f90
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
!> Time an element-wise increment of a 2-D array on the OpenACC device for
!! both possible loop nestings.
!!
!! The array lives on the device only (`enter data create`, no transfers).
!! It is zeroed by an untimed kernel so that the timed kernels never read
!! undefined values; that kernel also runs before any timed region, so any
!! one-off first-launch cost is not attributed to the first measurement.
!!
!! Each result line names the loop indices from innermost to outermost, so
!! "I, J" is the nesting whose innermost loop runs over the first array
!! index (the contiguous one in Fortran's column-major layout).
!!
!! Elapsed wall-clock time is measured with `system_clock`. `cpu_time`
!! reports processor time, which is not guaranteed to match the time the
!! host spends waiting for an offloaded kernel. The parallel constructs have
!! no `async` clause, so each one has completed when the closing
!! `system_clock` call is reached.
subroutine acc_loop_2d()
  implicit none
  integer, parameter :: i8 = selected_int_kind(18)  ! 64-bit tick counter
  integer, parameter :: dp = kind(1.0d0)
  integer, parameter :: n = 10000                   ! array extent per dimension
  integer :: i, j
  integer(i8) :: tick_start, tick_end, tick_rate
  real, allocatable :: buf(:, :)

  allocate(buf(n, n))
  !$acc enter data create(buf)

  ! Untimed: give every element a defined value on the device.
  !$acc parallel loop present(buf) collapse(2)
  do j = 1, n
    do i = 1, n
      buf(i, j) = 0.0
    end do
  end do

  call system_clock(count_rate=tick_rate)

  print*, "2D access:"

  ! Innermost loop over the first index.
  call system_clock(count=tick_start)
  !$acc parallel loop present(buf) collapse(2)
  do j = 1, n
    do i = 1, n
      buf(i, j) = buf(i, j) + 1
    end do
  end do
  call system_clock(count=tick_end)
  print '("I, J order time = ",f6.3," seconds.")', &
    ticks_to_seconds(tick_start, tick_end, tick_rate)

  ! Innermost loop over the second index.
  call system_clock(count=tick_start)
  !$acc parallel loop present(buf) collapse(2)
  do i = 1, n
    do j = 1, n
      buf(i, j) = buf(i, j) + 1
    end do
  end do
  call system_clock(count=tick_end)
  print '("J, I order time = ",f6.3," seconds.")', &
    ticks_to_seconds(tick_start, tick_end, tick_rate)

  !$acc exit data delete(buf)
  deallocate(buf)

contains

  !> Convert a pair of system_clock readings into elapsed seconds.
  pure function ticks_to_seconds(t0, t1, rate) result(secs)
    integer(i8), intent(in) :: t0, t1, rate
    real(dp) :: secs
    secs = real(t1 - t0, dp) / real(rate, dp)
  end function ticks_to_seconds

end subroutine acc_loop_2d
!> Time an element-wise increment of a 3-D array on the OpenACC device for
!! all six possible loop nestings.
!!
!! The array lives on the device only (`enter data create`, no transfers).
!! It is zeroed by an untimed kernel so that the timed kernels never read
!! undefined values; that kernel also runs before any timed region, so any
!! one-off first-launch cost is not attributed to the first measurement.
!!
!! Each result line names the loop indices from innermost to outermost, so
!! "I, J, K" is the nesting whose innermost loop runs over the first array
!! index (the contiguous one in Fortran's column-major layout).
!!
!! Elapsed wall-clock time is measured with `system_clock`. `cpu_time`
!! reports processor time, which is not guaranteed to match the time the
!! host spends waiting for an offloaded kernel. The parallel constructs have
!! no `async` clause, so each one has completed when the closing
!! `system_clock` call is reached.
!!
!! With n = 1000 and default real the array holds 10**9 elements.
subroutine acc_loop_3d()
  implicit none
  integer, parameter :: i8 = selected_int_kind(18)  ! 64-bit tick counter
  integer, parameter :: dp = kind(1.0d0)
  integer, parameter :: n = 1000                    ! array extent per dimension
  integer :: i, j, k
  integer(i8) :: tick_start, tick_end, tick_rate
  real, allocatable :: buf(:, :, :)

  allocate(buf(n, n, n))
  !$acc enter data create(buf)

  ! Untimed: give every element a defined value on the device.
  !$acc parallel loop present(buf) collapse(3)
  do k = 1, n
    do j = 1, n
      do i = 1, n
        buf(i, j, k) = 0.0
      end do
    end do
  end do

  call system_clock(count_rate=tick_rate)

  print*, "3D access:"

  ! Nesting (outer -> inner): k, j, i
  call system_clock(count=tick_start)
  !$acc parallel loop present(buf) collapse(3)
  do k = 1, n
    do j = 1, n
      do i = 1, n
        buf(i, j, k) = buf(i, j, k) + 1
      end do
    end do
  end do
  call system_clock(count=tick_end)
  print '("I, J, K order time = ",f6.3," seconds.")', &
    ticks_to_seconds(tick_start, tick_end, tick_rate)

  ! Nesting (outer -> inner): j, k, i
  call system_clock(count=tick_start)
  !$acc parallel loop present(buf) collapse(3)
  do j = 1, n
    do k = 1, n
      do i = 1, n
        buf(i, j, k) = buf(i, j, k) + 1
      end do
    end do
  end do
  call system_clock(count=tick_end)
  print '("I, K, J order time = ",f6.3," seconds.")', &
    ticks_to_seconds(tick_start, tick_end, tick_rate)

  ! Nesting (outer -> inner): i, k, j
  call system_clock(count=tick_start)
  !$acc parallel loop present(buf) collapse(3)
  do i = 1, n
    do k = 1, n
      do j = 1, n
        buf(i, j, k) = buf(i, j, k) + 1
      end do
    end do
  end do
  call system_clock(count=tick_end)
  print '("J, K, I order time = ",f6.3," seconds.")', &
    ticks_to_seconds(tick_start, tick_end, tick_rate)

  ! Nesting (outer -> inner): k, i, j
  call system_clock(count=tick_start)
  !$acc parallel loop present(buf) collapse(3)
  do k = 1, n
    do i = 1, n
      do j = 1, n
        buf(i, j, k) = buf(i, j, k) + 1
      end do
    end do
  end do
  call system_clock(count=tick_end)
  print '("J, I, K order time = ",f6.3," seconds.")', &
    ticks_to_seconds(tick_start, tick_end, tick_rate)

  ! Nesting (outer -> inner): i, j, k
  call system_clock(count=tick_start)
  !$acc parallel loop present(buf) collapse(3)
  do i = 1, n
    do j = 1, n
      do k = 1, n
        buf(i, j, k) = buf(i, j, k) + 1
      end do
    end do
  end do
  call system_clock(count=tick_end)
  print '("K, J, I order time = ",f6.3," seconds.")', &
    ticks_to_seconds(tick_start, tick_end, tick_rate)

  ! Nesting (outer -> inner): j, i, k
  call system_clock(count=tick_start)
  !$acc parallel loop present(buf) collapse(3)
  do j = 1, n
    do i = 1, n
      do k = 1, n
        buf(i, j, k) = buf(i, j, k) + 1
      end do
    end do
  end do
  call system_clock(count=tick_end)
  print '("K, I, J order time = ",f6.3," seconds.")', &
    ticks_to_seconds(tick_start, tick_end, tick_rate)

  !$acc exit data delete(buf)
  deallocate(buf)

contains

  !> Convert a pair of system_clock readings into elapsed seconds.
  pure function ticks_to_seconds(t0, t1, rate) result(secs)
    integer(i8), intent(in) :: t0, t1, rate
    real(dp) :: secs
    secs = real(t1 - t0, dp) / real(rate, dp)
  end function ticks_to_seconds

end subroutine acc_loop_3d
!> Driver: runs the 2-D access-order benchmark, then the 3-D one.
program main
  implicit none

  call acc_loop_2d()
  call acc_loop_3d()
end program main