Skip to content

Commit c121be9

Browse files
committed
gensym endinner
1 parent 15ff047 commit c121be9

File tree

2 files changed

+9
-8
lines changed

2 files changed

+9
-8
lines changed

src/codegen/lower_threads.jl

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -554,12 +554,12 @@ function thread_two_loops_expr(
554554

555555
var"#thread#mask#" >>>= var"#trailzing#zeros#"
556556

557-
endinner = var"#thread#launch#count#0#" == (var"#thread#factor#0#"-0x00000001)
558-
var"#thread#launch#count#0#" = Core.ifelse(endinner, 0x00000000, var"#thread#launch#count#0#" + 0x00000001)
559-
var"#thread#launch#count#1#" = Core.ifelse(endinner, var"#thread#launch#count#1#" + 0x00000001, var"#thread#launch#count#1#")
557+
var"##end#inner##" = var"#thread#launch#count#0#" == (var"#thread#factor#0#"-0x00000001)
558+
var"#thread#launch#count#0#" = Core.ifelse(var"##end#inner##", 0x00000000, var"#thread#launch#count#0#" + 0x00000001)
559+
var"#thread#launch#count#1#" = Core.ifelse(var"##end#inner##", var"#thread#launch#count#1#" + 0x00000001, var"#thread#launch#count#1#")
560560

561-
var"#iter#start#0#" = Core.ifelse(endinner, var"#loop#1#start#init#", var"#iter#stop#0#")
562-
var"#iter#start#1#" = Core.ifelse(endinner, var"#iter#stop#1#", var"#iter#start#1#")
561+
var"#iter#start#0#" = Core.ifelse(var"##end#inner##", var"#loop#1#start#init#", var"#iter#stop#0#")
562+
var"#iter#start#1#" = Core.ifelse(var"##end#inner##", var"#iter#stop#1#", var"#iter#start#1#")
563563

564564
var"#threads#remain#" = (var"#thread#launch#count#" += 0x00000001) ≠ var"#nrequest#"
565565
end

test/threading.jl

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
using OffsetArrays, LinearAlgebra
1+
using OffsetArrays, LinearAlgebra, LoopVectorization, Test
22
function mydotavx(a, b)
33
s = zero(eltype(a))
44
@avxt for i ∈ eachindex(a,b)
@@ -96,9 +96,10 @@ function convlayer_direct!(
9696
end
9797

9898
@testset "Threading" begin
99+
@show @__LINE__
99100
dcd = DenseConvDims{2,(5,5),3,6}()
100101
kern4 = rand(Float32, 5, 5, 3, 6);
101-
for M ∈ 17:50:267
102+
@time for M ∈ 17:50:267
102103
img = rand(Float32, M, M, 3, 100);
103104
outimage1 = Array{Float32}(undef, size(img,1)+1-size(kern4,1), size(img,2)+1-size(kern4,2), size(kern4,4), size(img,4));
104105
outimage2 = similar(outimage1);
@@ -108,7 +109,7 @@ end
108109
@test outimage1 ≈ outimage2
109110
end
110111

111-
for M ∈ 17:399
112+
@time for M ∈ 17:399
112113
# @show M
113114
K = M; N = M;
114115
A = rand(M,K); B = rand(K,N);

0 commit comments

Comments
 (0)