Skip to content

Commit e532a98

Browse files
committed
Fixed outer reduction bug when tiling.
1 parent a76d8c7 commit e532a98

File tree

2 files changed

+3
-3
lines changed

2 files changed

+3
-3
lines changed

Project.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
name = "LoopVectorization"
22
uuid = "bdcacae8-1622-11e9-2a5c-532679323890"
33
authors = ["Chris Elrod <[email protected]>"]
4-
version = "0.2.1"
4+
version = "0.2.2"
55

66
[deps]
77
LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"

src/lowering.jl

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -369,7 +369,7 @@ function lower_compute!(
369369
for u ∈ 0:Uiter
370370
instrcall = callfun(instr) # Expr(:call, instr)
371371
varsym = if tiledouterreduction > 0 # then suffix !== nothing
372-
modsuff = ((u+suffix*U) & 3)
372+
modsuffix = ((u + suffix*U) & 3)
373373
Symbol("##",var,:_, modsuffix)
374374
elseif opunrolled
375375
Symbol("##",var,:_,u)
@@ -896,7 +896,7 @@ function lower_tiled(ls::LoopSet, vectorized::Symbol, U::Int, T::Int)
896896
firstiter = false
897897
end
898898
q = gc_preserve(ls, q)
899-
reduce_expr!(q, ls, U)
899+
reduce_expr!(q, ls, 4)
900900
Expr(:block, ls.preamble, q)
901901
end
902902
function lower_unrolled(ls::LoopSet, vectorized::Symbol, U::Int)

0 commit comments

Comments
 (0)