Skip to content

Commit 71f19b1

Browse files
author
Daniel Vickers
committed
The last test passed, so I have narrowed the seg fault down to 4 loops. I removed two more loops from that list for this test.
1 parent abf2f5a commit 71f19b1

File tree

1 file changed

+23
-23
lines changed

1 file changed

+23
-23
lines changed

src/common/m_mpi_common.fpp

Lines changed: 23 additions & 23 deletions
Original file line numberDiff line numberDiff line change
@@ -837,38 +837,38 @@ contains
837837
end do
838838
$:END_GPU_PARALLEL_LOOP()
839839
840-
#:call GPU_PARALLEL_LOOP_OLD(collapse=5,private='[r]')
841-
do i = nVar + 1, nVar + 4
842-
do l = 0, p
843-
do k = 0, buff_size - 1
844-
do j = -buff_size, m + buff_size
845-
do q = 1, nb
846-
r = (i - 1) + (q - 1)*4 + nb*4 + v_size* &
847-
((j + buff_size) + (m + 2*buff_size + 1)* &
848-
(k + buff_size*l))
849-
buff_send(r) = real(mv_in(j, k + pack_offset, l, i - nVar, q), kind=wp)
850-
end do
840+
$:GPU_PARALLEL_LOOP(collapse=5,private='[r]')
841+
do i = nVar + 1, nVar + 4
842+
do l = 0, p
843+
do k = 0, buff_size - 1
844+
do j = -buff_size, m + buff_size
845+
do q = 1, nb
846+
r = (i - 1) + (q - 1)*4 + nb*4 + v_size* &
847+
((j + buff_size) + (m + 2*buff_size + 1)* &
848+
(k + buff_size*l))
849+
buff_send(r) = real(mv_in(j, k + pack_offset, l, i - nVar, q), kind=wp)
851850
end do
852851
end do
853852
end do
854853
end do
855-
#:endcall GPU_PARALLEL_LOOP_OLD
854+
end do
855+
$:END_GPU_PARALLEL_LOOP()
856856
end if
857857
#:else
858-
#:call GPU_PARALLEL_LOOP_OLD(collapse=4,private='[r]')
859-
do i = 1, nVar
860-
do l = 0, buff_size - 1
861-
do k = -buff_size, n + buff_size
862-
do j = -buff_size, m + buff_size
863-
r = (i - 1) + v_size* &
864-
((j + buff_size) + (m + 2*buff_size + 1)* &
865-
((k + buff_size) + (n + 2*buff_size + 1)*l))
866-
buff_send(r) = real(q_comm(i)%sf(j, k, l + pack_offset), kind=wp)
867-
end do
858+
$:GPU_PARALLEL_LOOP(collapse=4,private='[r]')
859+
do i = 1, nVar
860+
do l = 0, buff_size - 1
861+
do k = -buff_size, n + buff_size
862+
do j = -buff_size, m + buff_size
863+
r = (i - 1) + v_size* &
864+
((j + buff_size) + (m + 2*buff_size + 1)* &
865+
((k + buff_size) + (n + 2*buff_size + 1)*l))
866+
buff_send(r) = real(q_comm(i)%sf(j, k, l + pack_offset), kind=wp)
868867
end do
869868
end do
870869
end do
871-
#:endcall GPU_PARALLEL_LOOP_OLD
870+
end do
871+
$:END_GPU_PARALLEL_LOOP()
872872
873873
if (qbmm_comm) then
874874
#:call GPU_PARALLEL_LOOP_OLD(collapse=5,private='[r]')

0 commit comments

Comments
 (0)