Remove defaults for alpha and beta in 5-arg mul! (#96)

dkarrasch · web-flow · commit b06ba209de26 · 2020-07-27T22:01:26.000+02:00
diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
@@ -10,6 +10,7 @@ jobs:
   test:
     name: Julia ${{ matrix.version }} - ${{ matrix.os }}
     runs-on: ${{ matrix.os }}
+    continue-on-error: ${{ matrix.version == 'nightly' }}
     strategy:
       matrix:
         version:
diff --git a/README.md b/README.md
@@ -9,7 +9,12 @@ transformations or linear operators acting on vectors. The only requirement for
 a LinearMap is that it can act on a vector (by multiplication) efficiently.
 
 ## What's new in v2.7
-*   Speed-up of scaled `LinearMap`s by avoiding allocations
+*   Potential reduction of memory allocations in multiplication of
+    `LinearCombination`s, `BlockMap`s, and real- or complex-scaled `LinearMap`s.
+    For the latter, a new internal type `ScaledMap` has been introduced.
+*   Multiplication code for `CompositeMap`s has been refactored so that memory
+    for storing intermediate results can be provided by directly calling helper
+    functions.
 
 ## What's new in v2.6
 *   New feature: "lazy" Kronecker product, Kronecker sums, and powers thereof
@@ -18,25 +23,25 @@ a LinearMap is that it can act on a vector (by multiplication) efficiently.
 *   Compatibility with the generic multiply-and-add interface (a.k.a. 5-arg
     `mul!`) introduced in julia v1.3
 
-## What's new in v2.5.0
+## What's new in v2.5
 *   New feature: concatenation of `LinearMap`s objects with `UniformScaling`s,
     consistent with (h-, v-, and hc-)concatenation of matrices. Note, matrices
     `A` must be wrapped as `LinearMap(A)`, `UniformScaling`s are promoted to
     `LinearMap`s automatically.
 
-## What's new in v2.4.0
+## What's new in v2.4
 *   Support restricted to Julia v1.0+.
 
-## What's new in v2.3.0
+## What's new in v2.3
 *   Fully Julia v0.7/v1.0/v1.1 compatible.
 *   Full support of noncommutative number types such as quaternions.
 
-## What's new in v2.2.0
+## What's new in v2.2
 *   Fully Julia v0.7/v1.0 compatible.
 *   A `convert(SparseMatrixCSC, A::LinearMap)` function, that calls the `sparse`
     matrix generating function.
 
-## What's new in v2.1.0
+## What's new in v2.1
 *   Fully Julia v0.7 compatible; dropped compatibility for previous versions of
     Julia from LinearMaps.jl v2.0.0 on.
 *   A 5-argument version for `mul!(y, A::LinearMap, x, α=1, β=0)`, which
@@ -66,7 +71,7 @@ in Julia versions below 0.7).
 ## Philosophy
 
 Several iterative linear algebra methods such as linear solvers or eigensolvers
-only require an efficient evaluation of the matrix vector product, where the
+only require an efficient evaluation of the matrix-vector product, where the
 concept of a matrix can be formalized / generalized to a linear map (or linear
 operator in the special case of a square matrix).
 
@@ -89,10 +94,11 @@ The LinearMaps package provides the following functionality:
     `isposdef`) of the existing matrix or linear map.
 
 3.  A framework for combining objects of type `LinearMap` and of type
-    `AbstractMatrix` using linear combinations, transposition and composition,
+    `AbstractMatrix` using linear combinations, transposition, composition,
+    concatenation and Kronecker products/sums,
     where the linear map resulting from these operations is never explicitly
-    evaluated but only its matrix vector product is defined (i.e. lazy
-    evaluation). The matrix vector product is written to minimize memory
+    evaluated but only its matrix-vector product is defined (i.e. lazy
+    evaluation). The matrix-vector product is written to minimize memory
     allocation by using a minimal number of temporary vectors. There is full
     support for the in-place version `mul!`, which should be preferred for
     higher efficiency in critical algorithms. In addition, it tries to recognize
@@ -159,7 +165,7 @@ The LinearMaps package provides the following functionality:
         argument corresponding to the input, and `true` if it accepts two vector
         arguments where the first will be mutated so as to contain the result.
         In both cases, the resulting `A::FunctionMap` will support both the
-        mutating and non-mutating matrix vector multiplication. Default value is
+        mutating and non-mutating matrix-vector multiplication. Default value is
         guessed based on the number of arguments for the first method in the
         method list of `f`; it is not possible to use `f` and `fc` where only
         one of the two is mutating and the other is not.
@@ -190,6 +196,12 @@ The LinearMaps package provides the following functionality:
     handle both `A::AbstractMatrix` and `A::LinearMap`, it is recommended to use
     `convert(Matrix, A*X)`.
 
+*   `convert(AbstractMatrix, A::LinearMap)`, `convert(AbstractArray, A::LinearMap)`
+
+    Create an `AbstractMatrix` representation of the `LinearMap`. This falls
+    back to `Matrix(A)`, but avoids explicit construction in case the `LinearMap`
+    object is matrix-based.
+
 *   `SparseArrays.sparse(A::LinearMap)` and `convert(SparseMatrixCSC, A::LinearMap)`
 
     Create a sparse matrix representation of the `LinearMap` object, by
@@ -206,7 +218,7 @@ The LinearMaps package provides the following functionality:
     * `mul!(Y::AbstractMatrix, A::LinearMap, X::AbstractMatrix)`: applies `A` to
       each column of `X` and stores the results in the corresponding columns of
       `Y`;
-    * `mul!(y::AbstractVector, A::LinearMap, x::AbstractVector, α::Number=true, β::Number=false)`:
+    * `mul!(y::AbstractVector, A::LinearMap, x::AbstractVector, α::Number, β::Number)`:
       computes `A * x * α + y * β` and stores the result in `y`. Analogously for `X,Y::AbstractMatrix`.
 
     Applying the adjoint or transpose of `A` (if defined) to `x` works exactly
@@ -240,7 +252,7 @@ constructor described above.
 *   `FunctionMap`
 
     Type for wrapping an arbitrary function that is supposed to implement the
-    matrix vector product as a `LinearMap`.
+    matrix-vector product as a `LinearMap`.
 
 *   `WrappedMap`
 
@@ -252,17 +264,25 @@ constructor described above.
     will never evaluate `mat1*mat2`, since this is more costly than evaluating
     `mat1*(mat2*x)` and the latter is the only operation that needs to be performed
     by `LinearMap` objects anyway. While the cost of matrix addition is comparable
-    to matrix vector multiplication, this too is not performed explicitly since
+    to matrix-vector multiplication, this too is not performed explicitly since
     this would require new storage of the same amount as of the original matrices.
 
+*   `ScaledMap`
+
+    Type for representing a scalar multiple of any `LinearMap` type. A
+    `ScaledMap` will be automatically constructed if real or complex `LinearMap`
+    objects are multiplied by real or complex scalars from the left or from the
+    right.
+
 *   `UniformScalingMap`
 
     Type for representing a scalar multiple of the identity map (a.k.a. uniform
     scaling) of a certain size `M=N`, obtained simply as `UniformScalingMap(λ, M)`.
     The type `T` of the resulting `LinearMap` object is inferred from the type of
-    `λ`. A `UniformScalingMap` of the correct size will be automatically created
-    if `LinearMap` objects are multiplied by scalars from the left or from the right,
-    respecting the order of multiplication.
+    `λ`. A `UniformScalingMap` of the correct size will be automatically
+    constructed if `LinearMap` objects are multiplied by scalars from the left
+    or from the right (respecting the order of multiplication), if either the
+    `eltype` of the `LinearMap` or the scalar is of non-commutative type.
 
 *   `LinearCombination`, `CompositeMap`, `TransposeMap` and `AdjointMap`
 
diff --git a/src/LinearMaps.jl b/src/LinearMaps.jl
@@ -71,9 +71,13 @@ convert_to_lmaps(A) = (convert_to_lmaps_(A),)
 
 function Base.:(*)(A::LinearMap, x::AbstractVector)
     size(A, 2) == length(x) || throw(DimensionMismatch("mul!"))
-    return @inbounds mul!(similar(x, promote_type(eltype(A), eltype(x)), size(A, 1)), A, x)
+    return @inbounds A_mul_B!(similar(x, promote_type(eltype(A), eltype(x)), size(A, 1)), A, x)
 end
-function LinearAlgebra.mul!(y::AbstractVector, A::LinearMap, x::AbstractVector, α::Number=true, β::Number=false)
+function LinearAlgebra.mul!(y::AbstractVector, A::LinearMap, x::AbstractVector)
+    @boundscheck check_dim_mul(y, A, x)
+    return @inbounds A_mul_B!(y, A, x)
+end
+function LinearAlgebra.mul!(y::AbstractVector, A::LinearMap, x::AbstractVector, α::Number, β::Number)
     @boundscheck check_dim_mul(y, A, x)
     if isone(α)
         iszero(β) && (A_mul_B!(y, A, x); return y)
diff --git a/src/blockmap.jl b/src/blockmap.jl
@@ -303,9 +303,21 @@ LinearAlgebra.adjoint(A::BlockMap)  = AdjointMap(A)
 ############
 
 @inline function _blockmul!(y, A::BlockMap, x, α, β)
+    if iszero(α)
+        iszero(β) && return fill!(y, zero(eltype(y)))
+        isone(β) && return y
+        return rmul!(y, β)
+    end
+    return __blockmul!(MulStyle(A), y, A, x, α, β)
+end
+
+@inline __blockmul!(::FiveArg, y, A, x, α, β)  = ___blockmul!(y, A, x, α, β, nothing)
+@inline __blockmul!(::ThreeArg, y, A, x, α, β) = ___blockmul!(y, A, x, α, β, similar(y))
+
+function ___blockmul!(y, A, x, α, β, ::Nothing)
     maps, rows, yinds, xinds = A.maps, A.rows, A.rowranges, A.colranges
     mapind = 0
-    @views @inbounds for (row, yi) in zip(rows, yinds)
+    @views for (row, yi) in zip(rows, yinds)
         yrow = selectdim(y, 1, yi)
         mapind += 1
         mul!(yrow, maps[mapind], selectdim(x, 1, xinds[mapind]), α, β)
@@ -316,24 +328,50 @@ LinearAlgebra.adjoint(A::BlockMap)  = AdjointMap(A)
     end
     return y
 end
+function ___blockmul!(y, A, x, α, β, z)
+    maps, rows, yinds, xinds = A.maps, A.rows, A.rowranges, A.colranges
+    mapind = 0
+    @views for (row, yi) in zip(rows, yinds)
+        yrow = selectdim(y, 1, yi)
+        zrow = selectdim(z, 1, yi)
+        mapind += 1
+        if MulStyle(maps[mapind]) === ThreeArg() && !iszero(β)
+            !isone(β) && rmul!(yrow, β)
+            muladd!(ThreeArg(), yrow, maps[mapind], selectdim(x, 1, xinds[mapind]), α, zrow)
+        else
+            mul!(yrow, maps[mapind], selectdim(x, 1, xinds[mapind]), α, β)
+        end
+        for _ in 2:row
+            mapind +=1
+            muladd!(MulStyle(maps[mapind]), yrow, maps[mapind], selectdim(x, 1, xinds[mapind]), α, zrow)
+        end
+    end
+    return y
+end
 
 @inline function _transblockmul!(y, A::BlockMap, x, α, β, transform)
     maps, rows, xinds, yinds = A.maps, A.rows, A.rowranges, A.colranges
-    @views @inbounds begin
-        # first block row (rowind = 1) of A, meaning first block column of A', fill all of y
-        xcol = selectdim(x, 1, first(xinds))
-        for rowind in 1:first(rows)
-            mul!(selectdim(y, 1, yinds[rowind]), transform(maps[rowind]), xcol, α, β)
-        end
-        mapind = first(rows)
-        # subsequent block rows of A (block columns of A'),
-        # add results to corresponding parts of y
-        # TODO: think about multithreading
-        for (row, xi) in zip(Base.tail(rows), Base.tail(xinds))
-            xcol = selectdim(x, 1, xi)
-            for _ in 1:row
-                mapind +=1
-                mul!(selectdim(y, 1, yinds[mapind]), transform(maps[mapind]), xcol, α, true)
+    if iszero(α)
+        iszero(β) && return fill!(y, zero(eltype(y)))
+        isone(β) && return y
+        return rmul!(y, β)
+    else
+        @views begin
+            # first block row (rowind = 1) of A, meaning first block column of A', fill all of y
+            xcol = selectdim(x, 1, first(xinds))
+            for rowind in 1:first(rows)
+                mul!(selectdim(y, 1, yinds[rowind]), transform(maps[rowind]), xcol, α, β)
+            end
+            mapind = first(rows)
+            # subsequent block rows of A (block columns of A'),
+            # add results to corresponding parts of y
+            # TODO: think about multithreading
+            for (row, xi) in zip(Base.tail(rows), Base.tail(xinds))
+                xcol = selectdim(x, 1, xi)
+                for _ in 1:row
+                    mapind +=1
+                    mul!(selectdim(y, 1, yinds[mapind]), transform(maps[mapind]), xcol, α, true)
+                end
             end
         end
     end
@@ -345,34 +383,34 @@ end
 ############
 
 Base.@propagate_inbounds A_mul_B!(y::AbstractVector, A::BlockMap, x::AbstractVector) =
-    mul!(y, A, x)
+    mul!(y, A, x, true, false)
 
 Base.@propagate_inbounds A_mul_B!(y::AbstractVector, A::TransposeMap{<:Any,<:BlockMap}, x::AbstractVector) =
-    mul!(y, A, x)
+    mul!(y, A, x, true, false)
 
 Base.@propagate_inbounds At_mul_B!(y::AbstractVector, A::BlockMap, x::AbstractVector) =
-    mul!(y, transpose(A), x)
+    mul!(y, transpose(A), x, true, false)
 
 Base.@propagate_inbounds A_mul_B!(y::AbstractVector, A::AdjointMap{<:Any,<:BlockMap}, x::AbstractVector) =
-    mul!(y, A, x)
+    mul!(y, A, x, true, false)
 
 Base.@propagate_inbounds Ac_mul_B!(y::AbstractVector, A::BlockMap, x::AbstractVector) =
-    mul!(y, adjoint(A), x)
+    mul!(y, adjoint(A), x, true, false)
 
 for Atype in (AbstractVector, AbstractMatrix)
     @eval Base.@propagate_inbounds function LinearAlgebra.mul!(y::$Atype, A::BlockMap, x::$Atype,
-                        α::Number=true, β::Number=false)
+                        α::Number, β::Number)
         require_one_based_indexing(y, x)
         @boundscheck check_dim_mul(y, A, x)
-        return _blockmul!(y, A, x, α, β)
+        return @inbounds _blockmul!(y, A, x, α, β)
     end
 
     for (maptype, transform) in ((:(TransposeMap{<:Any,<:BlockMap}), :transpose), (:(AdjointMap{<:Any,<:BlockMap}), :adjoint))
         @eval Base.@propagate_inbounds function LinearAlgebra.mul!(y::$Atype, wrapA::$maptype, x::$Atype,
-                        α::Number=true, β::Number=false)
+                        α::Number, β::Number)
             require_one_based_indexing(y, x)
             @boundscheck check_dim_mul(y, wrapA, x)
-            return _transblockmul!(y, wrapA.lmap, x, α, β, $transform)
+            return @inbounds _transblockmul!(y, wrapA.lmap, x, α, β, $transform)
         end
     end
 end
@@ -468,7 +506,7 @@ Base.@propagate_inbounds Ac_mul_B!(y::AbstractVector, A::BlockDiagonalMap, x::Ab
 
 for Atype in (AbstractVector, AbstractMatrix)
     @eval Base.@propagate_inbounds function LinearAlgebra.mul!(y::$Atype, A::BlockDiagonalMap, x::$Atype,
-                        α::Number=true, β::Number=false)
+                        α::Number, β::Number)
         require_one_based_indexing(y, x)
         @boundscheck check_dim_mul(y, A, x)
         return _blockscaling!(y, A, x, α, β)
diff --git a/src/linearcombination.jl b/src/linearcombination.jl
@@ -66,7 +66,7 @@ LinearAlgebra.adjoint(A::LinearCombination)   = LinearCombination{eltype(A)}(map
 # multiplication with vectors & matrices
 for Atype in (AbstractVector, AbstractMatrix)
     @eval Base.@propagate_inbounds function LinearAlgebra.mul!(y::$Atype, A::LinearCombination, x::$Atype,
-                             α::Number=true, β::Number=false)
+                             α::Number, β::Number)
         @boundscheck check_dim_mul(y, A, x)
         if iszero(α) # trivial cases
             iszero(β) && (fill!(y, zero(eltype(y))); return y)
@@ -117,8 +117,8 @@ end
     return y
 end
 
-A_mul_B!(y::AbstractVector, A::LinearCombination, x::AbstractVector) = mul!(y, A, x)
+A_mul_B!(y::AbstractVector, A::LinearCombination, x::AbstractVector) = mul!(y, A, x, true, false)
 
-At_mul_B!(y::AbstractVector, A::LinearCombination, x::AbstractVector) = mul!(y, transpose(A), x)
+At_mul_B!(y::AbstractVector, A::LinearCombination, x::AbstractVector) = mul!(y, transpose(A), x, true, false)
 
-Ac_mul_B!(y::AbstractVector, A::LinearCombination, x::AbstractVector) = mul!(y, adjoint(A), x)
+Ac_mul_B!(y::AbstractVector, A::LinearCombination, x::AbstractVector) = mul!(y, adjoint(A), x, true, false)
diff --git a/src/uniformscalingmap.jl b/src/uniformscalingmap.jl
@@ -43,7 +43,7 @@ Base.:(*)(A::UniformScalingMap, x::AbstractVector) =
 # multiplication with vector/matrix
 for Atype in (AbstractVector, AbstractMatrix)
     @eval Base.@propagate_inbounds function LinearAlgebra.mul!(y::$Atype, J::UniformScalingMap, x::$Atype,
-                α::Number=true, β::Number=false)
+                α::Number, β::Number)
         @boundscheck check_dim_mul(y, J, x)
         _scaling!(y, J.λ, x, α, β)
         return y
@@ -88,11 +88,10 @@ function _scaling!(y, λ::Number, x, α::Number, β::Number)
     end # α-cases
 end # function _scaling!
 
-A_mul_B!(y::AbstractVector, A::UniformScalingMap, x::AbstractVector) = mul!(y, A, x)
+A_mul_B!(y::AbstractVector, A::UniformScalingMap, x::AbstractVector) = mul!(y, A, x, true, false)
 At_mul_B!(y::AbstractVector, A::UniformScalingMap, x::AbstractVector) = A_mul_B!(y, transpose(A), x)
 Ac_mul_B!(y::AbstractVector, A::UniformScalingMap, x::AbstractVector) = A_mul_B!(y, adjoint(A), x)
 
-
 # combine LinearMap and UniformScaling objects in linear combinations
 Base.:(+)(A₁::LinearMap, A₂::UniformScaling) = A₁ + UniformScalingMap(A₂.λ, size(A₁, 1))
 Base.:(+)(A₁::UniformScaling, A₂::LinearMap) = UniformScalingMap(A₁.λ, size(A₂, 1)) + A₂
diff --git a/src/wrappedmap.jl b/src/wrappedmap.jl
@@ -49,7 +49,7 @@ Ac_mul_B!(y::AbstractVector, A::WrappedMap, x::AbstractVector) =
 if VERSION ≥ v"1.3.0-alpha.115"
     for Atype in (AbstractVector, AbstractMatrix)
         @eval Base.@propagate_inbounds LinearAlgebra.mul!(y::$Atype, A::WrappedMap, x::$Atype,
-                        α::Number=true, β::Number=false) =
+                        α::Number, β::Number) =
             mul!(y, A.lmap, x, α, β)
     end
 else
diff --git a/test/blockmap.jl b/test/blockmap.jl
diff --git a/test/linearmaps.jl b/test/linearmaps.jl