Skip to content

Commit 7ba1c4c

Browse files
committed
Correct flops count
1 parent 20b7960 commit 7ba1c4c

File tree

1 file changed

+12
-2
lines changed

1 file changed

+12
-2
lines changed

perf/lu.jl

Lines changed: 12 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -3,8 +3,18 @@ import LinearAlgebra, RecursiveFactorization
33

44
BenchmarkTools.DEFAULT_PARAMETERS.seconds = 0.08
55

6-
luflop(m, n) = n^3÷3 - n÷3 + m*n^2
7-
luflop(n) = luflop(n, n)
6+
"""
    luflop(m, n=m; innerflop=2)

Count the floating-point operations of an unblocked, right-looking LU
factorization of an `m`-by-`n` matrix.

For every elimination step `k in 1:min(m, n)` the model charges

- `1` flop for inverting the pivot,
- one flop per sub-pivot entry of column `k` that is scaled (`m - k` entries),
- `innerflop` flops per entry of the trailing `(m - k)`-by-`(n - k)` block
  that is updated (a multiply and a subtract by default).

# Keywords
- `innerflop`: cost charged for a single trailing-block entry update.

Returns `0` when either dimension is zero. For a square matrix and the
default `innerflop` the result grows like `2n^3/3`.
"""
function luflop(m, n=m; innerflop=2)
    total = 0
    for k in 1:min(m, n)
        # Number of rows below / columns to the right of the pivot; `length`
        # of an empty range is 0, so exhausted dimensions need no special case.
        nrows = length(k+1:m)
        ncols = length(k+1:n)

        invflop = 1
        # One multiplication per scaled entry: count the entries, do not add
        # up their row indices.
        scaleflop = nrows
        # Keep an exact integer zero when there is no trailing block, whatever
        # the type of `innerflop`.
        updateflop = (nrows == 0 || ncols == 0) ? 0 : nrows * ncols * innerflop

        total += invflop + scaleflop + updateflop
    end
    return total
end
818

919
bas_mflops = Float64[]
1020
rec8_mflops = Float64[]

0 commit comments

Comments
 (0)