@@ -26,14 +26,14 @@ if dim1
2626 @testset "1D -- CPU -- rdft=$rdft -- $N" begin
2727 nlp, solver, results = fft_example_1D(N; gpu=false, rdft, check=true)
2828
29- z2 = M_perpt_M_perp_vec(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 1, (N,), z, Int[]; rdft)
29+ z2 = M_perpt_M_perp_vec(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 1, (N,), z, Int[], nlp.fft_timer, nlp.mapping_timer ; rdft)
3030 @test z2 ≈ z
3131
32- res1 = M_perp_tz(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 1, (N,), z; rdft)
32+ res1 = M_perp_tz(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 1, (N,), z, nlp.fft_timer, nlp.mapping_timer ; rdft)
3333 @test norm(res1) ≈ norm(z)
3434 @test res1_wei ≈ res1
3535
36- res2 = M_perp_beta(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 1, (N,), z, Int[]; rdft)
36+ res2 = M_perp_beta(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 1, (N,), z, Int[], nlp.fft_timer, nlp.mapping_timer ; rdft)
3737 @test norm(res2) ≈ norm(z)
3838 @test res2_wei ≈ res2
3939 end
@@ -44,14 +44,14 @@ if dim1
4444
4545 z_gpu = CuArray(z)
4646
47- z2_gpu = M_perpt_M_perp_vec(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 1, (N,), z_gpu, Int[]; rdft)
47+ z2_gpu = M_perpt_M_perp_vec(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 1, (N,), z_gpu, Int[], nlp.fft_timer, nlp.mapping_timer ; rdft)
4848 @test z2_gpu ≈ z_gpu
4949
50- res1_gpu = M_perp_tz(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 1, (N,), z_gpu; rdft)
50+ res1_gpu = M_perp_tz(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 1, (N,), z_gpu, nlp.fft_timer, nlp.mapping_timer ; rdft)
5151 @test norm(res1_gpu) ≈ norm(z_gpu)
5252 @test res1_wei ≈ collect(res1_gpu)
5353
54- res2_gpu = M_perp_beta(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 1, (N,), z_gpu, Int[]; rdft)
54+ res2_gpu = M_perp_beta(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 1, (N,), z_gpu, Int[], nlp.fft_timer, nlp.mapping_timer ; rdft)
5555 @test norm(res2_gpu) ≈ norm(z_gpu)
5656 @test res2_wei ≈ collect(res2_gpu)
5757 end
@@ -78,14 +78,14 @@ if dim2
7878 @testset "2D -- CPU -- rdft=$rdft -- $N1 × $N2" begin
7979 nlp, solver, results = fft_example_2D(N1, N2; gpu=false, rdft, check=true)
8080
81- z2 = M_perpt_M_perp_vec(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 2, (N1, N2), z, Int[]; rdft)
81+ z2 = M_perpt_M_perp_vec(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 2, (N1, N2), z, Int[], nlp.fft_timer, nlp.mapping_timer ; rdft)
8282 @test z2 ≈ z
8383
84- res1 = M_perp_tz(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 2, (N1, N2), reshape(z, (N1, N2)); rdft)
84+ res1 = M_perp_tz(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 2, (N1, N2), reshape(z, (N1, N2)), nlp.fft_timer, nlp.mapping_timer ; rdft)
8585 @test norm(res1) ≈ norm(z)
8686 @test res1_wei ≈ res1
8787
88- res2 = M_perp_beta(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 2, (N1, N2), z, Int[]; rdft)
88+ res2 = M_perp_beta(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 2, (N1, N2), z, Int[], nlp.fft_timer, nlp.mapping_timer ; rdft)
8989 @test norm(res2) ≈ norm(z)
9090 @test res2_wei ≈ res2
9191 end
@@ -96,14 +96,14 @@ if dim2
9696
9797 z_gpu = CuArray(z)
9898
99- z2_gpu = M_perpt_M_perp_vec(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 2, (N1, N2), z_gpu, Int[]; rdft)
99+ z2_gpu = M_perpt_M_perp_vec(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 2, (N1, N2), z_gpu, Int[], nlp.fft_timer, nlp.mapping_timer ; rdft)
100100 @test z2_gpu ≈ z_gpu
101101
102- res1_gpu = M_perp_tz(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 2, (N1, N2), reshape(z_gpu, (N1, N2)); rdft)
102+ res1_gpu = M_perp_tz(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 2, (N1, N2), reshape(z_gpu, (N1, N2)), nlp.fft_timer, nlp.mapping_timer ; rdft)
103103 @test norm(res1_gpu) ≈ norm(z_gpu)
104104 @test res1_wei ≈ collect(res1_gpu)
105105
106- res2_gpu = M_perp_beta(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 2, (N1, N2), z_gpu, Int[]; rdft)
106+ res2_gpu = M_perp_beta(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 2, (N1, N2), z_gpu, Int[], nlp.fft_timer, nlp.mapping_timer ; rdft)
107107 @test norm(res2_gpu) ≈ norm(z_gpu)
108108 @test res2_wei ≈ collect(res2_gpu)
109109 end
@@ -130,14 +130,14 @@ if dim3
130130 @testset "3D -- CPU -- rdft=$rdft -- $N1 × $N2 × $N3" begin
131131 nlp, solver, results = fft_example_3D(N1, N2, N3; gpu=false, rdft, check=true)
132132
133- z2 = M_perpt_M_perp_vec(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 3, (N1, N2, N3), z, Int[]; rdft)
133+ z2 = M_perpt_M_perp_vec(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 3, (N1, N2, N3), z, Int[], nlp.fft_timer, nlp.mapping_timer ; rdft)
134134 @test z2 ≈ z
135135
136- res1 = M_perp_tz(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 3, (N1, N2, N3), reshape(z, (N1, N2, N3)); rdft)
136+ res1 = M_perp_tz(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 3, (N1, N2, N3), reshape(z, (N1, N2, N3)), nlp.fft_timer, nlp.mapping_timer ; rdft)
137137 @test norm(res1) ≈ norm(z)
138138 @test res1_wei ≈ res1
139139
140- res2 = M_perp_beta(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 3, (N1, N2, N3), z, Int[]; rdft)
140+ res2 = M_perp_beta(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 3, (N1, N2, N3), z, Int[], nlp.fft_timer, nlp.mapping_timer ; rdft)
141141 @test norm(res2) ≈ norm(z)
142142 @test res2_wei ≈ res2
143143 end
@@ -148,14 +148,14 @@ if dim3
148148
149149 z_gpu = CuArray(z)
150150
151- z2_gpu = M_perpt_M_perp_vec(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 3, (N1, N2, N3), z_gpu, Int[]; rdft)
151+ z2_gpu = M_perpt_M_perp_vec(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 3, (N1, N2, N3), z_gpu, Int[], nlp.fft_timer, nlp.mapping_timer ; rdft)
152152 @test z2_gpu ≈ z_gpu
153153
154- res1_gpu = M_perp_tz(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 3, (N1, N2, N3), reshape(z_gpu, (N1, N2, N3)); rdft)
154+ res1_gpu = M_perp_tz(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 3, (N1, N2, N3), reshape(z_gpu, (N1, N2, N3)), nlp.fft_timer, nlp.mapping_timer ; rdft)
155155 @test norm(res1_gpu) ≈ norm(z_gpu)
156156 @test res1_wei ≈ collect(res1_gpu)
157157
158- res2_gpu = M_perp_beta(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 3, (N1, N2, N3), z_gpu, Int[]; rdft)
158+ res2_gpu = M_perp_beta(nlp.buffer_real, nlp.buffer_complex1, nlp.buffer_complex2, nlp.op, 3, (N1, N2, N3), z_gpu, Int[], nlp.fft_timer, nlp.mapping_timer ; rdft)
159159 @test norm(res2_gpu) ≈ norm(z_gpu)
160160 @test res2_wei ≈ collect(res2_gpu)
161161 end
0 commit comments