SciML
diff --git a/‎src/common.jl
Lines changed: 17 additions & 4 deletions b/‎src/common.jl
Lines changed: 17 additions & 4 deletions
diff --git a/‎src/default.jl
Lines changed: 65 additions & 165 deletions b/‎src/default.jl
Lines changed: 65 additions & 165 deletions
@@ -1,4 +1,13 @@
-struct LinearCache{TA, Tb, Tu, Tp, Talg, Tc, Tl, Tr, Ttol}
+"""
+    OperatorAssumptions(issquare = nothing)
+
+Singleton tag whose type parameter records what is assumed about the operator.
+`issquare` may be passed as a `Bool`, a `Val`, or `nothing`; it is normalized by
+`_unwrap_val` and stored as the type parameter.
+"""
+struct OperatorAssumptions{issquare} end
+function OperatorAssumptions(issquare = nothing)
+    return OperatorAssumptions{_unwrap_val(issquare)}()
+end
+
+# Normalize the constructor argument to the plain value used as the type parameter.
+_unwrap_val(::Val{B}) where {B} = B
+# Return the value `nothing`, not the type `Nothing`: the `defaultalg` methods
+# dispatch on `OperatorAssumptions{nothing}`.
+_unwrap_val(B::Nothing) = nothing
+_unwrap_val(B::Bool) = B
+
+struct LinearCache{TA, Tb, Tu, Tp, Talg, Tc, Tl, Tr, Ttol, issquare}
     A::TA
     b::Tb
     u::Tu
@@ -12,6 +21,7 @@ struct LinearCache{TA, Tb, Tu, Tp, Talg, Tc, Tl, Tr, Ttol}
     reltol::Ttol
     maxiters::Int
     verbose::Bool
+    assumptions::OperatorAssumptions{issquare}
 end
 
 """
@@ -86,6 +96,7 @@ function SciMLBase.init(prob::LinearProblem, alg::Union{SciMLLinearSolveAlgorith
                         verbose = false,
                         Pl = Identity(),
                         Pr = Identity(),
+                        assumptions = OperatorAssumptions(),
                         kwargs...)
     @unpack A, b, u0, p = prob
 
@@ -96,7 +107,7 @@ function SciMLBase.init(prob::LinearProblem, alg::Union{SciMLLinearSolveAlgorith
         fill!(u0, false)
     end
 
-    cacheval = init_cacheval(alg, A, b, u0, Pl, Pr, maxiters, abstol, reltol, verbose)
+    cacheval = init_cacheval(alg, A, b, u0, Pl, Pr, maxiters, abstol, reltol, verbose, assumptions)
     isfresh = true
     Tc = typeof(cacheval)
 
@@ -112,7 +123,8 @@ function SciMLBase.init(prob::LinearProblem, alg::Union{SciMLLinearSolveAlgorith
                         Tc,
                         typeof(Pl),
                         typeof(Pr),
-                        typeof(reltol)
+                        typeof(reltol),
+                        typeof(assumptions)
                         }(A,
                           b,
                           u0,
@@ -125,7 +137,8 @@ function SciMLBase.init(prob::LinearProblem, alg::Union{SciMLLinearSolveAlgorith
                           abstol,
                           reltol,
                           maxiters,
-                          verbose)
+                          verbose,
+                          assumptions)
     return cache
 end
 
 
@@ -1,209 +1,109 @@
-## Default algorithm
+# Unwrap a `DiffEqArrayOperator` and pick the default for the matrix stored in `A.A`.
+function defaultalg(A::DiffEqArrayOperator, b, assumptions::OperatorAssumptions)
+    return defaultalg(A.A, b, assumptions)
+end
 
-# Allows A === nothing as a stand-in for dense matrix
-function defaultalg(A, b)
-    if A isa DiffEqArrayOperator
-        A = A.A
-    end
-
-    # Special case on Arrays: avoid BLAS for RecursiveFactorization.jl when
-    # it makes sense according to the benchmarks, which is dependent on
-    # whether MKL or OpenBLAS is being used
-    if (A === nothing && !(b isa GPUArraysCore.AbstractGPUArray)) || A isa Matrix
-        if (A === nothing || eltype(A) <: Union{Float32, Float64, ComplexF32, ComplexF64}) &&
-           ArrayInterfaceCore.can_setindex(b)
-            if length(b) <= 10
-                alg = GenericLUFactorization()
-            elseif (length(b) <= 100 || (isopenblas() && length(b) <= 500)) &&
-                   eltype(A) <: Union{Float32, Float64}
-                alg = RFLUFactorization()
-                #elseif A === nothing || A isa Matrix
-                #    alg = FastLUFactorization()
-            else
-                alg = LUFactorization()
-            end
-        else
-            alg = LUFactorization()
-        end
+# Ambiguity handling: a `DiffEqArrayOperator` combined with
+# `OperatorAssumptions{nothing}` is unwrapped first.
+function defaultalg(A::DiffEqArrayOperator, b, assumptions::OperatorAssumptions{nothing})
+    return defaultalg(A.A, b, assumptions)
+end
 
-        # These few cases ensure the choice is optimal without the
-        # dynamic dispatching of factorize
-    elseif A isa Tridiagonal
-        alg = GenericFactorization(; fact_alg = lu!)
-    elseif A isa SymTridiagonal
-        alg = GenericFactorization(; fact_alg = ldlt!)
-    elseif A isa SparseMatrixCSC
-        if length(b) <= 10_000
-            alg = KLUFactorization()
-        else
-            alg = UMFPACKFactorization()
-        end
+# No shape assumption supplied: determine squareness from `A` and re-dispatch.
+# `A === nothing` stands in for a dense matrix and is treated as square, because
+# `size(nothing, 1)` has no method.
+function defaultalg(A, b, ::OperatorAssumptions{nothing})
+    issquare = A === nothing || size(A, 1) == size(A, 2)
+    return defaultalg(A, b, OperatorAssumptions(Val(issquare)))
+end
 
-        # This catches the cases where a factorization overload could exist
-        # For example, BlockBandedMatrix
-    elseif A !== nothing && ArrayInterfaceCore.isstructured(A)
-        alg = GenericFactorization()
+# Tridiagonal-type matrices: the factorization routine is fixed by dispatch.
+defaultalg(::Tridiagonal, b, ::OperatorAssumptions{true}) = GenericFactorization(fact_alg = lu!)
+defaultalg(::Tridiagonal, b, ::OperatorAssumptions{false}) = GenericFactorization(fact_alg = qr!)
+defaultalg(::SymTridiagonal, b, ::OperatorAssumptions{true}) = GenericFactorization(fact_alg = ldlt!)
 
-        # This catches the case where A is a CuMatrix
-        # Which does not have LU fully defined
-    elseif A isa GPUArraysCore.AbstractGPUArray || b isa GPUArraysCore.AbstractGPUArray
-        if VERSION >= v"1.8-"
-            alg = LUFactorization()
-        else
-            alg = QRFactorization()
-        end
+# Sparse square systems: KLU when `length(b) <= 10_000`, UMFPACK otherwise.
+function defaultalg(A::SparseMatrixCSC, b, ::OperatorAssumptions{true})
+    return length(b) <= 10_000 ? KLUFactorization() : UMFPACKFactorization()
+end
 
-        # Not factorizable operator, default to only using A*x
+# Square system with a GPU-array `A`: LU when `VERSION >= v"1.8-"`, QR on older versions.
+function defaultalg(A::GPUArraysCore.AbstractGPUArray, b, ::OperatorAssumptions{true})
+    if VERSION >= v"1.8-"
+        LUFactorization()
     else
-        alg = KrylovJL_GMRES()
+        QRFactorization()
     end
-    alg
 end
 
-## Other dispatches are to decrease the dispatch cost
+# Square system whose `b` is a GPU array: LU when `VERSION >= v"1.8-"`, otherwise QR.
+function defaultalg(A, b::GPUArraysCore.AbstractGPUArray, ::OperatorAssumptions{true})
+    return VERSION >= v"1.8-" ? LUFactorization() : QRFactorization()
+end
 
-function SciMLBase.solve(cache::LinearCache, alg::Nothing,
-                         args...; kwargs...)
-    @unpack A = cache
-    if A isa DiffEqArrayOperator
-        A = A.A
+# Handle ambiguity: both `A` and `b` are GPU arrays, which would otherwise match
+# the GPU-`A` method and the GPU-`b` method equally well.
+function defaultalg(A::GPUArraysCore.AbstractGPUArray, b::GPUArraysCore.AbstractGPUArray, ::OperatorAssumptions{true})
+    if VERSION >= v"1.8-"
+        LUFactorization()
+    else
+        QRFactorization()
     end
+end
+
+# Non-square systems involving a GPU array use QR.
+defaultalg(A::GPUArraysCore.AbstractGPUArray, b, ::OperatorAssumptions{false}) = QRFactorization()
+
+defaultalg(A, b::GPUArraysCore.AbstractGPUArray, ::OperatorAssumptions{false}) = QRFactorization()
+
+# Handle ambiguity
+defaultalg(A::GPUArraysCore.AbstractGPUArray, b::GPUArraysCore.AbstractGPUArray, ::OperatorAssumptions{false}) = QRFactorization()
+
+# Generic default for square systems.
+# Allows A === nothing as a stand-in for dense matrix
+function defaultalg(A, b, ::OperatorAssumptions{true})
     # Special case on Arrays: avoid BLAS for RecursiveFactorization.jl when
     # it makes sense according to the benchmarks, which is dependent on
     # whether MKL or OpenBLAS is being used
-    if A isa Matrix
-        b = cache.b
+    if (A === nothing && !(b isa GPUArraysCore.AbstractGPUArray)) || A isa Matrix
         if (A === nothing || eltype(A) <: Union{Float32, Float64, ComplexF32, ComplexF64}) &&
            ArrayInterfaceCore.can_setindex(b)
             if length(b) <= 10
                 alg = GenericLUFactorization()
-                SciMLBase.solve(cache, alg, args...; kwargs...)
             elseif (length(b) <= 100 || (isopenblas() && length(b) <= 500)) &&
                    eltype(A) <: Union{Float32, Float64}
                 alg = RFLUFactorization()
-                SciMLBase.solve(cache, alg, args...; kwargs...)
-                #elseif A isa Matrix
+                #elseif A === nothing || A isa Matrix
                 #    alg = FastLUFactorization()
-                #    SciMLBase.solve(cache, alg, args...; kwargs...)
             else
                 alg = LUFactorization()
-                SciMLBase.solve(cache, alg, args...; kwargs...)
             end
         else
             alg = LUFactorization()
-            SciMLBase.solve(cache, alg, args...; kwargs...)
-        end
-
-        # These few cases ensure the choice is optimal without the
-        # dynamic dispatching of factorize
-    elseif A isa Tridiagonal
-        alg = GenericFactorization(; fact_alg = lu!)
-        SciMLBase.solve(cache, alg, args...; kwargs...)
-    elseif A isa SymTridiagonal
-        alg = GenericFactorization(; fact_alg = ldlt!)
-        SciMLBase.solve(cache, alg, args...; kwargs...)
-    elseif A isa SparseMatrixCSC
-        b = cache.b
-        if length(b) <= 10_000
-            alg = KLUFactorization()
-            SciMLBase.solve(cache, alg, args...; kwargs...)
-        else
-            alg = UMFPACKFactorization()
-            SciMLBase.solve(cache, alg, args...; kwargs...)
         end
 
         # This catches the cases where a factorization overload could exist
         # For example, BlockBandedMatrix
-    elseif ArrayInterfaceCore.isstructured(A)
+    elseif A !== nothing && ArrayInterfaceCore.isstructured(A)
         alg = GenericFactorization()
-        SciMLBase.solve(cache, alg, args...; kwargs...)
 
-        # This catches the case where A is a CuMatrix
-        # Which does not have LU fully defined
-    elseif A isa GPUArraysCore.AbstractGPUArray
-        if VERSION >= v"1.8-"
-            alg = LUFactorization()
-            SciMLBase.solve(cache, alg, args...; kwargs...)
-        else
-            alg = QRFactorization()
-            SciMLBase.solve(cache, alg, args...; kwargs...)
-        end
         # Not factorizable operator, default to only using A*x
-        # IterativeSolvers is faster on CPU but not GPU-compatible
     else
         alg = KrylovJL_GMRES()
-        SciMLBase.solve(cache, alg, args...; kwargs...)
     end
+    alg
 end
 
-function init_cacheval(alg::Nothing, A, b, u, Pl, Pr, maxiters, abstol, reltol, verbose)
-    if A isa DiffEqArrayOperator
-        A = A.A
-    end
-
-    # Special case on Arrays: avoid BLAS for RecursiveFactorization.jl when
-    # it makes sense according to the benchmarks, which is dependent on
-    # whether MKL or OpenBLAS is being used
-    if A isa Matrix
-        if (A === nothing || eltype(A) <: Union{Float32, Float64, ComplexF32, ComplexF64}) &&
-           ArrayInterfaceCore.can_setindex(b)
-            if length(b) <= 10
-                alg = GenericLUFactorization()
-                init_cacheval(alg, A, b, u, Pl, Pr, maxiters, abstol, reltol, verbose)
-            elseif (length(b) <= 100 || (isopenblas() && length(b) <= 500)) &&
-                   eltype(A) <: Union{Float32, Float64}
-                alg = RFLUFactorization()
-                init_cacheval(alg, A, b, u, Pl, Pr, maxiters, abstol, reltol, verbose)
-                #elseif A isa Matrix
-                #    alg = FastLUFactorization()
-                #    init_cacheval(alg, A, b, u, Pl, Pr, maxiters, abstol, reltol, verbose)
-            else
-                alg = LUFactorization()
-                init_cacheval(alg, A, b, u, Pl, Pr, maxiters, abstol, reltol, verbose)
-            end
-        else
-            alg = LUFactorization()
-            init_cacheval(alg, A, b, u, Pl, Pr, maxiters, abstol, reltol, verbose)
-        end
+# Generic fallback for non-square systems: QR. Dispatches on
+# `OperatorAssumptions{false}`, the tag type every other `defaultalg` method uses.
+function defaultalg(A, b, ::OperatorAssumptions{false})
+    return QRFactorization()
+end
 
-        # These few cases ensure the choice is optimal without the
-        # dynamic dispatching of factorize
-    elseif A isa Tridiagonal
-        alg = GenericFactorization(; fact_alg = lu!)
-        init_cacheval(alg, A, b, u, Pl, Pr, maxiters, abstol, reltol, verbose)
-    elseif A isa SymTridiagonal
-        alg = GenericFactorization(; fact_alg = ldlt!)
-        init_cacheval(alg, A, b, u, Pl, Pr, maxiters, abstol, reltol, verbose)
-    elseif A isa SparseMatrixCSC
-        if length(b) <= 10_000
-            alg = KLUFactorization()
-            init_cacheval(alg, A, b, u, Pl, Pr, maxiters, abstol, reltol, verbose)
-        else
-            alg = UMFPACKFactorization()
-            init_cacheval(alg, A, b, u, Pl, Pr, maxiters, abstol, reltol, verbose)
-        end
+## Catch high level interface
 
-        # This catches the cases where a factorization overload could exist
-        # For example, BlockBandedMatrix
-    elseif ArrayInterfaceCore.isstructured(A)
-        alg = GenericFactorization()
-        init_cacheval(alg, A, b, u, Pl, Pr, maxiters, abstol, reltol, verbose)
+# `alg === nothing`: choose the default algorithm from the cached `A` and `b`
+# under `assumptions`, then forward to the algorithm-specific `solve`.
+function SciMLBase.solve(cache::LinearCache, alg::Nothing,
+                         args...; assumptions::OperatorAssumptions = OperatorAssumptions(), kwargs...)
+    @unpack A, b = cache
+    SciMLBase.solve(cache, defaultalg(A, b, assumptions), args...; kwargs...)
+end
 
-        # This catches the case where A is a CuMatrix
-        # Which does not have LU fully defined
-    elseif A isa GPUArraysCore.AbstractGPUArray
-        if VERSION >= v"1.8-"
-            alg = LUFactorization()
-            init_cacheval(alg, A, b, u, Pl, Pr, maxiters, abstol, reltol, verbose)
-        else
-            alg = QRFactorization()
-            init_cacheval(alg, A, b, u, Pl, Pr, maxiters, abstol, reltol, verbose)
-        end
-        # Not factorizable operator, default to only using A*x
-        # IterativeSolvers is faster on CPU but not GPU-compatible
-    else
-        alg = KrylovJL_GMRES()
-        init_cacheval(alg, A, b, u, Pl, Pr, maxiters, abstol, reltol, verbose)
-    end
+# `alg === nothing`: build the cache value for the default algorithm selected
+# from `A`, `b` and `assumptions`.
+function init_cacheval(alg::Nothing, A, b, u, Pl, Pr, maxiters::Int, abstol, reltol, verbose::Bool, assumptions::OperatorAssumptions)
+    init_cacheval(defaultalg(A, b, assumptions), A, b, u, Pl, Pr, maxiters, abstol, reltol, verbose, assumptions)
 end