|
2 | 2 | # wrapper for batched_gemm!
|
3 | 3 | export batched_mul, batched_transpose, batched_adjoint
|
4 | 4 |
|
5 |
| - |
6 | 5 | include("./batchedadjtrans.jl")
|
7 | 6 |
|
8 |
| -function batched_mul(A::AbstractArray{T, 3}, B::AbstractArray{T, 3}) where T |
9 |
| - size(A, 3) == size(B, 3) || throw(DimensionMismatch("batch size mismatch")) |
10 |
| - batched_mul!(similar(A, (size(A, 1), size(B, 2), size(A, 3))), A, B) |
| 7 | +""" |
| 8 | + batched_mul(A, B) -> C |
| 9 | +
|
| 10 | +Batched matrix multiplication. Result has `C[:,:,k] == A[:,:,k] * B[:,:,k]` for all `k`. |
| 11 | +""" |
| 12 | +function batched_mul(A::AbstractArray{T1, 3}, B::AbstractArray{T2, 3}) where {T1, T2} |
| 13 | + axes(A, 3) == axes(B, 3) || throw(DimensionMismatch("batch size mismatch")) |
| 14 | + T = promote_type(T1, T2) |
| 15 | + C = similar(A, T, (axes(A, 1), axes(B, 2), axes(A, 3))) |
| 16 | + batched_mul!(C, A, B) |
11 | 17 | end
|
12 | 18 |
|
13 | 19 | """
|
14 | 20 | batched_mul!(C, A, B) -> C
|
15 |
| -batched `mul!`. |
| 21 | +
|
| 22 | +In-place batched matrix multiplication, |
| 23 | +equivalent to `mul!(C[:,:,k], A[:,:,k], B[:,:,k])` for all `k`. |
16 | 24 | """
|
17 | 25 | function batched_mul! end
|
18 | 26 |
|
19 | 27 | _unbatch(A) = A
|
20 | 28 | _unbatch(A::BatchedAdjOrTrans) = A.parent
|
21 | 29 |
|
22 |
| -# bmm |
23 |
| -const _BATCHED_MATRIX_LIST = [ |
24 |
| - (:(AbstractArray{T, 3}), 'N'), |
25 |
| - (:(BatchedTranspose{T, <:AbstractArray{T, 3}}), 'T'), |
26 |
| - (:(BatchedAdjoint{T, <:AbstractArray{T, 3}}), 'C') |
| 30 | +# batched_gemm! |
| 31 | + |
| 32 | +const _GemmFloat = Union{Float64, Float32, ComplexF64, ComplexF32} |
| 33 | + |
| 34 | +_BATCHED_GEMM_LIST = [ |
| 35 | + (:(StridedArray{T, 3}), 'N'), |
| 36 | + (:(BatchedTranspose{T, <:StridedArray{T, 3}}), 'T'), |
| 37 | + (:(BatchedAdjoint{T, <:StridedArray{T, 3}}), 'C') |
27 | 38 | ]
|
28 | 39 |
|
29 |
| -for (TA, transA) in _BATCHED_MATRIX_LIST, (TB, transB) in _BATCHED_MATRIX_LIST |
30 |
| - @eval begin |
31 |
| - function batched_mul!(C::AbstractArray{T, 3}, A::$TA, B::$TB) where T |
32 |
| - batched_gemm!($transA, $transB, one(T), _unbatch(A), _unbatch(B), zero(T), C) |
33 |
| - C |
34 |
| - end |
| 40 | +for (TA, transA) in _BATCHED_GEMM_LIST, (TB, transB) in _BATCHED_GEMM_LIST |
| 41 | + @eval function batched_mul!(C::StridedArray{T, 3}, A::$TA, B::$TB) where {T<:_GemmFloat} |
| 42 | + batched_gemm!($transA, $transB, one(T), _unbatch(A), _unbatch(B), zero(T), C) |
| 43 | + C |
| 44 | + end |
| 45 | +end |
35 | 46 |
|
| 47 | +# fallback |
36 | 48 |
|
| 49 | +_BATCHED_LIST = [ |
| 50 | + (:(AbstractArray{<:Any, 3}), :identity), |
| 51 | + (:(BatchedTranspose{<:Any, <:AbstractArray{<:Any, 3}}), :transpose), |
| 52 | + (:(BatchedAdjoint{<:Any, <:AbstractArray{<:Any, 3}}), :adjoint) |
| 53 | +] |
| 54 | +for (TA, fA) in _BATCHED_LIST, (TB, fB) in _BATCHED_LIST |
| 55 | + @eval function batched_mul!(C::AbstractArray{<:Any, 3}, A::$TA, B::$TB) |
| 56 | + axes(A, 3) == axes(B, 3) == axes(C, 3) || throw(DimensionMismatch("batch size mismatch")) |
| 57 | + @debug "calling fallback method for batched_mul!" typeof(A) typeof(B) typeof(C) |
| 58 | + A′, B′ = _unbatch(A), _unbatch(B) |
| 59 | + @inbounds for k in axes(C, 3) |
| 60 | + @views mul!(C[:,:,k], $fA(A′[:,:,k]), $fB(B′[:,:,k])) |
| 61 | + end |
| 62 | + C |
37 | 63 | end
|
38 | 64 | end
|
0 commit comments