Skip to content

Commit 713e97e

Browse files
committed
Unroll a bit more
1 parent 8502d92 commit 713e97e

File tree

2 files changed

+4
-3
lines changed

2 files changed

+4
-3
lines changed

Project.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
name = "LoopVectorization"
22
uuid = "bdcacae8-1622-11e9-2a5c-532679323890"
33
authors = ["Chris Elrod <[email protected]>"]
4-
version = "0.9.16"
4+
version = "0.9.17"
55

66
[deps]
77
ArrayInterface = "4fba245c-0d91-5ea0-9b3e-6abc04ee57a9"

src/lowering.jl

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -288,7 +288,7 @@ function allinteriorunrolled(ls::LoopSet, us::UnrollSpecification, N)
288288
if us.u₂loopnum > N
289289
unroll_total *= us.u₂
290290
end
291-
unroll_total ≤ 8
291+
unroll_total ≤ 16
292292
end
293293

294294
function lower_no_unroll(ls::LoopSet, us::UnrollSpecification, n::Int, inclmask::Bool, initialize::Bool = true, maxiters::Int=-1)
@@ -385,7 +385,8 @@ function lower_unrolled_dynamic(ls::LoopSet, us::UnrollSpecification, n::Int, in
385385
body = lower_block(ls, us, n, inclmask, UF)
386386
if loopisstatic
387387
iters = length(loop) ÷ UFW
388-
if iters*UF ≤ 16 && allinteriorunrolled(ls, us, n)# Let's set a limit on total unrolling
388+
# @show loop iters*UF, allinteriorunrolled(ls, us, n)# Let's set a limit on total unrolling
389+
if isone(iters) || (iters*UF ≤ 16 && allinteriorunrolled(ls, us, n))# Let's set a limit on total unrolling
389390
q = Expr(:block)
390391
foreach(_ -> push!(q.args, body), 1:iters)
391392
else

0 commit comments

Comments
 (0)