@@ -757,7 +757,7 @@ contains
757757 #:for mpi_dir in [1, 2, 3]
758758 if (mpi_dir == ${mpi_dir}$) then
759759 #:if mpi_dir == 1
760- #:call GPU_PARALLEL (collapse=4,private=' [r]' )
760+ #:call GPU_PARALLEL_LOOP_OLD (collapse=4,private=' [r]' )
761761 do l = 0, p
762762 do k = 0, n
763763 do j = 0, buff_size - 1
@@ -768,10 +768,10 @@ contains
768768 end do
769769 end do
770770 end do
771- #:endcall GPU_PARALLEL
771+ #:endcall GPU_PARALLEL_LOOP_OLD
772772
773773 if (qbmm_comm) then
774- #:call GPU_PARALLEL (collapse=4,private=' [r]' )
774+ #:call GPU_PARALLEL_LOOP_OLD (collapse=4,private=' [r]' )
775775 do l = 0, p
776776 do k = 0, n
777777 do j = 0, buff_size - 1
@@ -785,9 +785,9 @@ contains
785785 end do
786786 end do
787787 end do
788- #:endcall GPU_PARALLEL
788+ #:endcall GPU_PARALLEL_LOOP_OLD
789789
790- #:call GPU_PARALLEL (collapse=5,private=' [r]' )
790+ #:call GPU_PARALLEL_LOOP_OLD (collapse=5,private=' [r]' )
791791 do l = 0, p
792792 do k = 0, n
793793 do j = 0, buff_size - 1
@@ -801,10 +801,10 @@ contains
801801 end do
802802 end do
803803 end do
804- #:endcall GPU_PARALLEL
804+ #:endcall GPU_PARALLEL_LOOP_OLD
805805 end if
806806 #:elif mpi_dir == 2
807- #:call GPU_PARALLEL (collapse=4,private=' [r]' )
807+ #:call GPU_PARALLEL_LOOP_OLD (collapse=4,private=' [r]' )
808808 do i = 1, nVar
809809 do l = 0, p
810810 do k = 0, buff_size - 1
@@ -817,10 +817,10 @@ contains
817817 end do
818818 end do
819819 end do
820- #:endcall GPU_PARALLEL
820+ #:endcall GPU_PARALLEL_LOOP_OLD
821821
822822 if (qbmm_comm) then
823- #:call GPU_PARALLEL (collapse=5,private=' [r]' )
823+ #:call GPU_PARALLEL_LOOP_OLD (collapse=5,private=' [r]' )
824824 do i = nVar + 1, nVar + 4
825825 do l = 0, p
826826 do k = 0, buff_size - 1
@@ -835,9 +835,9 @@ contains
835835 end do
836836 end do
837837 end do
838- #:endcall GPU_PARALLEL
838+ #:endcall GPU_PARALLEL_LOOP_OLD
839839
840- #:call GPU_PARALLEL (collapse=5,private=' [r]' )
840+ #:call GPU_PARALLEL_LOOP_OLD (collapse=5,private=' [r]' )
841841 do i = nVar + 1, nVar + 4
842842 do l = 0, p
843843 do k = 0, buff_size - 1
@@ -852,10 +852,10 @@ contains
852852 end do
853853 end do
854854 end do
855- #:endcall GPU_PARALLEL
855+ #:endcall GPU_PARALLEL_LOOP_OLD
856856 end if
857857 #:else
858- #:call GPU_PARALLEL (collapse=4,private=' [r]' )
858+ #:call GPU_PARALLEL_LOOP_OLD (collapse=4,private=' [r]' )
859859 do i = 1, nVar
860860 do l = 0, buff_size - 1
861861 do k = -buff_size, n + buff_size
@@ -868,10 +868,10 @@ contains
868868 end do
869869 end do
870870 end do
871- #:endcall GPU_PARALLEL
871+ #:endcall GPU_PARALLEL_LOOP_OLD
872872
873873 if (qbmm_comm) then
874- #:call GPU_PARALLEL (collapse=5,private=' [r]' )
874+ #:call GPU_PARALLEL_LOOP_OLD (collapse=5,private=' [r]' )
875875 do i = nVar + 1, nVar + 4
876876 do l = 0, buff_size - 1
877877 do k = -buff_size, n + buff_size
@@ -886,9 +886,9 @@ contains
886886 end do
887887 end do
888888 end do
889- #:endcall GPU_PARALLEL
889+ #:endcall GPU_PARALLEL_LOOP_OLD
890890
891- #:call GPU_PARALLEL (collapse=5,private=' [r]' )
891+ #:call GPU_PARALLEL_LOOP_OLD (collapse=5,private=' [r]' )
892892 do i = nVar + 1, nVar + 4
893893 do l = 0, buff_size - 1
894894 do k = -buff_size, n + buff_size
@@ -903,7 +903,7 @@ contains
903903 end do
904904 end do
905905 end do
906- #:endcall GPU_PARALLEL
906+ #:endcall GPU_PARALLEL_LOOP_OLD
907907 end if
908908 #:endif
909909 end if
@@ -958,7 +958,7 @@ contains
958958 #:for mpi_dir in [1, 2, 3]
959959 if (mpi_dir == ${mpi_dir}$) then
960960 #:if mpi_dir == 1
961- #:call GPU_PARALLEL (collapse=4,private=' [r]' )
961+ #:call GPU_PARALLEL_LOOP_OLD (collapse=4,private=' [r]' )
962962 do l = 0, p
963963 do k = 0, n
964964 do j = -buff_size, -1
@@ -976,10 +976,10 @@ contains
976976 end do
977977 end do
978978 end do
979- #:endcall GPU_PARALLEL
979+ #:endcall GPU_PARALLEL_LOOP_OLD
980980
981981 if (qbmm_comm) then
982- #:call GPU_PARALLEL (collapse=5,private=' [r]' )
982+ #:call GPU_PARALLEL_LOOP_OLD (collapse=5,private=' [r]' )
983983 do l = 0, p
984984 do k = 0, n
985985 do j = -buff_size, -1
@@ -993,9 +993,9 @@ contains
993993 end do
994994 end do
995995 end do
996- #:endcall GPU_PARALLEL
996+ #:endcall GPU_PARALLEL_LOOP_OLD
997997
998- #:call GPU_PARALLEL (collapse=5,private=' [r]' )
998+ #:call GPU_PARALLEL_LOOP_OLD (collapse=5,private=' [r]' )
999999 do l = 0, p
10001000 do k = 0, n
10011001 do j = -buff_size, -1
@@ -1009,10 +1009,10 @@ contains
10091009 end do
10101010 end do
10111011 end do
1012- #:endcall GPU_PARALLEL
1012+ #:endcall GPU_PARALLEL_LOOP_OLD
10131013 end if
10141014 #:elif mpi_dir == 2
1015- #:call GPU_PARALLEL (collapse=4,private=' [r]' )
1015+ #:call GPU_PARALLEL_LOOP_OLD (collapse=4,private=' [r]' )
10161016 do i = 1, nVar
10171017 do l = 0, p
10181018 do k = -buff_size, -1
@@ -1031,10 +1031,10 @@ contains
10311031 end do
10321032 end do
10331033 end do
1034- #:endcall GPU_PARALLEL
1034+ #:endcall GPU_PARALLEL_LOOP_OLD
10351035
10361036 if (qbmm_comm) then
1037- #:call GPU_PARALLEL (collapse=5,private=' [r]' )
1037+ #:call GPU_PARALLEL_LOOP_OLD (collapse=5,private=' [r]' )
10381038 do i = nVar + 1, nVar + 4
10391039 do l = 0, p
10401040 do k = -buff_size, -1
@@ -1049,9 +1049,9 @@ contains
10491049 end do
10501050 end do
10511051 end do
1052- #:endcall GPU_PARALLEL
1052+ #:endcall GPU_PARALLEL_LOOP_OLD
10531053
1054- #:call GPU_PARALLEL (collapse=5,private=' [r]' )
1054+ #:call GPU_PARALLEL_LOOP_OLD (collapse=5,private=' [r]' )
10551055 do i = nVar + 1, nVar + 4
10561056 do l = 0, p
10571057 do k = -buff_size, -1
@@ -1066,11 +1066,11 @@ contains
10661066 end do
10671067 end do
10681068 end do
1069- #:endcall GPU_PARALLEL
1069+ #:endcall GPU_PARALLEL_LOOP_OLD
10701070 end if
10711071 #:else
10721072 ! Unpacking buffer from bc_z%beg
1073- #:call GPU_PARALLEL (collapse=4,private=' [r]' )
1073+ #:call GPU_PARALLEL_LOOP_OLD (collapse=4,private=' [r]' )
10741074 do i = 1, nVar
10751075 do l = -buff_size, -1
10761076 do k = -buff_size, n + buff_size
@@ -1090,10 +1090,10 @@ contains
10901090 end do
10911091 end do
10921092 end do
1093- #:endcall GPU_PARALLEL
1093+ #:endcall GPU_PARALLEL_LOOP_OLD
10941094
10951095 if (qbmm_comm) then
1096- #:call GPU_PARALLEL (collapse=5,private=' [r]' )
1096+ #:call GPU_PARALLEL_LOOP_OLD (collapse=5,private=' [r]' )
10971097 do i = nVar + 1, nVar + 4
10981098 do l = -buff_size, -1
10991099 do k = -buff_size, n + buff_size
@@ -1109,9 +1109,9 @@ contains
11091109 end do
11101110 end do
11111111 end do
1112- #:endcall GPU_PARALLEL
1112+ #:endcall GPU_PARALLEL_LOOP_OLD
11131113
1114- #:call GPU_PARALLEL (collapse=5,private=' [r]' )
1114+ #:call GPU_PARALLEL_LOOP_OLD (collapse=5,private=' [r]' )
11151115 do i = nVar + 1, nVar + 4
11161116 do l = -buff_size, -1
11171117 do k = -buff_size, n + buff_size
@@ -1127,7 +1127,7 @@ contains
11271127 end do
11281128 end do
11291129 end do
1130- #:endcall GPU_PARALLEL
1130+ #:endcall GPU_PARALLEL_LOOP_OLD
11311131 end if
11321132 #:endif
11331133 end if
0 commit comments