@@ -138,23 +138,23 @@ contains
138138#if defined(MFC_GPU)
139139
140140 $:GPU_PARALLEL_LOOP(collapse= 3 )
141- do k = 1 , sys_size
142- do j = 0 , m
143- do l = 1 , cmplx_size
144- data_fltr_cmplx_gpu(l + j* cmplx_size + (k - 1 )* cmplx_size* x_size) = (0_dp , 0_dp )
145- end do
141+ do k = 1 , sys_size
142+ do j = 0 , m
143+ do l = 1 , cmplx_size
144+ data_fltr_cmplx_gpu(l + j* cmplx_size + (k - 1 )* cmplx_size* x_size) = (0_dp , 0_dp )
146145 end do
147146 end do
147+ end do
148148 $:END_GPU_PARALLEL_LOOP()
149149
150150 $:GPU_PARALLEL_LOOP(collapse= 3 )
151- do k = 1 , sys_size
152- do j = 0 , m
153- do l = 0 , p
154- data_real_gpu(l + j* real_size + 1 + (k - 1 )* real_size* x_size) = q_cons_vf(k)%sf(j, 0 , l)
155- end do
151+ do k = 1 , sys_size
152+ do j = 0 , m
153+ do l = 0 , p
154+ data_real_gpu(l + j* real_size + 1 + (k - 1 )* real_size* x_size) = q_cons_vf(k)%sf(j, 0 , l)
156155 end do
157156 end do
157+ end do
158158 $:END_GPU_PARALLEL_LOOP()
159159
160160 #:call GPU_HOST_DATA(use_device_addr= ' [data_real_gpu, data_cmplx_gpu, data_fltr_cmplx_gpu]' )
@@ -169,13 +169,13 @@ contains
169169 $:GPU_UPDATE(device= ' [Nfq]' )
170170
171171 $:GPU_PARALLEL_LOOP(collapse= 3 )
172- do k = 1 , sys_size
173- do j = 0 , m
174- do l = 1 , Nfq
175- data_fltr_cmplx_gpu(l + j* cmplx_size + (k - 1 )* cmplx_size* x_size) = data_cmplx_gpu(l + j* cmplx_size + (k - 1 )* cmplx_size* x_size)
176- end do
172+ do k = 1 , sys_size
173+ do j = 0 , m
174+ do l = 1 , Nfq
175+ data_fltr_cmplx_gpu(l + j* cmplx_size + (k - 1 )* cmplx_size* x_size) = data_cmplx_gpu(l + j* cmplx_size + (k - 1 )* cmplx_size* x_size)
177176 end do
178177 end do
178+ end do
179179 $:END_GPU_PARALLEL_LOOP()
180180
181181 #:call GPU_HOST_DATA(use_device_addr= ' [data_real_gpu, data_cmplx_gpu, data_fltr_cmplx_gpu]' )
@@ -188,36 +188,36 @@ contains
188188 #:endcall GPU_HOST_DATA
189189
190190 $:GPU_PARALLEL_LOOP(collapse= 3 )
191- do k = 1 , sys_size
192- do j = 0 , m
193- do l = 0 , p
194- data_real_gpu(l + j* real_size + 1 + (k - 1 )* real_size* x_size) = data_real_gpu(l + j* real_size + 1 + (k - 1 )* real_size* x_size)/ real (real_size, dp)
195- q_cons_vf(k)%sf(j, 0 , l) = data_real_gpu(l + j* real_size + 1 + (k - 1 )* real_size* x_size)
196- end do
191+ do k = 1 , sys_size
192+ do j = 0 , m
193+ do l = 0 , p
194+ data_real_gpu(l + j* real_size + 1 + (k - 1 )* real_size* x_size) = data_real_gpu(l + j* real_size + 1 + (k - 1 )* real_size* x_size)/ real (real_size, dp)
195+ q_cons_vf(k)%sf(j, 0 , l) = data_real_gpu(l + j* real_size + 1 + (k - 1 )* real_size* x_size)
197196 end do
198197 end do
198+ end do
199199 $:END_GPU_PARALLEL_LOOP()
200200
201201 do i = 1 , fourier_rings
202202
203203 $:GPU_PARALLEL_LOOP(collapse= 3 )
204- do k = 1 , sys_size
205- do j = 0 , m
206- do l = 1 , cmplx_size
207- data_fltr_cmplx_gpu(l + j* cmplx_size + (k - 1 )* cmplx_size* x_size) = (0_dp , 0_dp )
208- end do
204+ do k = 1 , sys_size
205+ do j = 0 , m
206+ do l = 1 , cmplx_size
207+ data_fltr_cmplx_gpu(l + j* cmplx_size + (k - 1 )* cmplx_size* x_size) = (0_dp , 0_dp )
209208 end do
210209 end do
210+ end do
211211 $:END_GPU_PARALLEL_LOOP()
212212
213213 $:GPU_PARALLEL_LOOP(collapse= 3 , firstprivate= ' [i]' )
214- do k = 1 , sys_size
215- do j = 0 , m
216- do l = 0 , p
217- data_real_gpu(l + j* real_size + 1 + (k - 1 )* real_size* x_size) = q_cons_vf(k)%sf(j, i, l)
218- end do
214+ do k = 1 , sys_size
215+ do j = 0 , m
216+ do l = 0 , p
217+ data_real_gpu(l + j* real_size + 1 + (k - 1 )* real_size* x_size) = q_cons_vf(k)%sf(j, i, l)
219218 end do
220219 end do
220+ end do
221221 $:END_GPU_PARALLEL_LOOP()
222222
223223 #:call GPU_HOST_DATA(use_device_addr= ' [data_real_gpu, data_cmplx_gpu, data_fltr_cmplx_gpu]' )
@@ -233,13 +233,13 @@ contains
233233 $:GPU_UPDATE(device= ' [Nfq]' )
234234
235235 $:GPU_PARALLEL_LOOP(collapse= 3 )
236- do k = 1 , sys_size
237- do j = 0 , m
238- do l = 1 , Nfq
239- data_fltr_cmplx_gpu(l + j* cmplx_size + (k - 1 )* cmplx_size* x_size) = data_cmplx_gpu(l + j* cmplx_size + (k - 1 )* cmplx_size* x_size)
240- end do
236+ do k = 1 , sys_size
237+ do j = 0 , m
238+ do l = 1 , Nfq
239+ data_fltr_cmplx_gpu(l + j* cmplx_size + (k - 1 )* cmplx_size* x_size) = data_cmplx_gpu(l + j* cmplx_size + (k - 1 )* cmplx_size* x_size)
241240 end do
242241 end do
242+ end do
243243 $:END_GPU_PARALLEL_LOOP()
244244
245245 #:call GPU_HOST_DATA(use_device_addr= ' [data_real_gpu, data_cmplx_gpu, data_fltr_cmplx_gpu]' )
@@ -252,14 +252,14 @@ contains
252252 #:endcall GPU_HOST_DATA
253253
254254 $:GPU_PARALLEL_LOOP(collapse= 3 , firstprivate= ' [i]' )
255- do k = 1 , sys_size
256- do j = 0 , m
257- do l = 0 , p
258- data_real_gpu(l + j* real_size + 1 + (k - 1 )* real_size* x_size) = data_real_gpu(l + j* real_size + 1 + (k - 1 )* real_size* x_size)/ real (real_size, dp)
259- q_cons_vf(k)%sf(j, i, l) = data_real_gpu(l + j* real_size + 1 + (k - 1 )* real_size* x_size)
260- end do
255+ do k = 1 , sys_size
256+ do j = 0 , m
257+ do l = 0 , p
258+ data_real_gpu(l + j* real_size + 1 + (k - 1 )* real_size* x_size) = data_real_gpu(l + j* real_size + 1 + (k - 1 )* real_size* x_size)/ real (real_size, dp)
259+ q_cons_vf(k)%sf(j, i, l) = data_real_gpu(l + j* real_size + 1 + (k - 1 )* real_size* x_size)
261260 end do
262261 end do
262+ end do
263263 $:END_GPU_PARALLEL_LOOP()
264264 end do
265265
@@ -322,4 +322,4 @@ contains
322322#endif
323323
324324 end subroutine s_finalize_fftw_module
325- end module m_fftw
325+ end module m_fftw
0 commit comments