|
1 | 1 | @testset "GEMM" begin
|
2 | 2 | # using LoopVectorization, LinearAlgebra, Test; T = Float64
|
3 | 3 | Unum, Tnum = LoopVectorization.REGISTER_COUNT == 16 ? (2, 6) : (3, 9)
|
4 |
| - Unumt, Tnumt = LoopVectorization.REGISTER_COUNT == 16 ? (3, 4) : (5, 5) |
| 4 | + Unumt, Tnumt = LoopVectorization.REGISTER_COUNT == 16 ? (2, 6) : (5, 5) |
5 | 5 | if LoopVectorization.REGISTER_COUNT != 8
|
6 | 6 | @test LoopVectorization.mᵣ == Unum
|
7 | 7 | @test LoopVectorization.nᵣ == Tnum
|
|
353 | 353 | if LoopVectorization.REGISTER_COUNT == 32
|
354 | 354 | @test LoopVectorization.choose_order(lsr2amb) == ([:n, :m, :k], :m, :n, :m, 3, 7)
|
355 | 355 | elseif LoopVectorization.REGISTER_COUNT == 16
|
356 |
| - @test LoopVectorization.choose_order(lsr2amb) == ([:m, :n, :k], :n, :m, :m, 4, 2) |
| 356 | + @test LoopVectorization.choose_order(lsr2amb) == ([:m, :n, :k], :m, :n, :m, 1, 6) |
357 | 357 | end
|
358 | 358 | function rank2AmulBavx!(C, Aₘ, Aₖ, B)
|
359 | 359 | @avx for m ∈ axes(C,1), n ∈ axes(C,2)
|
|
0 commit comments