subroutine driver and interface (in-place and out-of-place)

loiseaujc · loiseaujc · commit a381d0bc8c9b · 2025-07-09T10:43:19.000+02:00
diff --git a/src/stdlib_linalg.fypp b/src/stdlib_linalg.fypp
@@ -28,7 +28,7 @@ module stdlib_linalg
   public :: eigh
   public :: eigvals
   public :: eigvalsh
-  public :: expm
+  public :: expm, matrix_exp
   public :: eye
   public :: inv
   public :: invert
@@ -1713,19 +1713,74 @@ module stdlib_linalg
     !! ```
     !!
     #:for rk,rt,ri in RC_KINDS_TYPES
-    module function stdlib_expm_${ri}$(A, order, err) result(E)
+    module function stdlib_linalg_${ri}$_expm_fun(A, order) result(E)
         !> Input matrix a(n, n).
         ${rt}$, intent(in) :: A(:, :)
         !> [optional] Order of the Pade approximation (default `order=10`)
         integer(ilp), optional, intent(in) :: order
-        !> [optional] State return flag. On error, if not requested, the code will stop.
-        type(linalg_state_type), optional, intent(out) :: err
         !> Exponential of the input matrix E = exp(A).
         ${rt}$, allocatable :: E(:, :)
-    end function stdlib_expm_${ri}$
+    end function stdlib_linalg_${ri}$_expm_fun
     #:endfor
   end interface expm
 
+  !> Matrix exponential: subroutine interface
+  interface matrix_exp
+    !! version : experimental
+    !!
+    !! Computes the exponential of a matrix using a rational Pade approximation.
+    !! ([Specification](../page/specs/stdlib_linalg.html#matrix_exp))
+    !!
+    !! ### Description
+    !!
+    !! This interface provides in-place and out-of-place subroutines computing the
+    !! exponential of a matrix represented as a standard Fortran rank-2 array.
+    !! Supported data types include `real` and `complex`.
+    !!
+    !! By default, the order of the Pade approximation is set to 10. It can be changed
+    !! via the `order` argument which must be non-negative.
+    !!
+    !! If the input matrix is non-square or the order of the Pade approximation is
+    !! negative, an error state is raised and handed back through `err` if present.
+    !!
+    !! ### Example
+    !!
+    !! ```fortran
+    !!  real(dp) :: A(3, 3), E(3, 3)
+    !!
+    !!  A = reshape([1, 2, 3, 4, 5, 6, 7, 8, 9], [3, 3])
+    !!
+    !!  ! Default Pade approximation of the matrix exponential.
+    !!  call matrix_exp(A, E) ! Out-of-place
+    !!  ! Use `call matrix_exp(A)` instead to overwrite A with exp(A) in place.
+    !!
+    !!  ! Pade approximation with specified order.
+    !!  call matrix_exp(A, E, order=12)
+    !! ```
+    !!
+    #:for rk,rt,ri in RC_KINDS_TYPES
+    module subroutine stdlib_linalg_${ri}$_expm_inplace(A, order, err)
+        !> On entry: input matrix A(n, n). On exit: overwritten by E = exp(A).
+        ${rt}$, intent(inout) :: A(:, :)
+        !> [optional] Order of the Pade approximation (default `order=10`)
+        integer(ilp), optional, intent(in) :: order
+        !> [optional] State return flag.
+        type(linalg_state_type), optional, intent(out) :: err
+    end subroutine stdlib_linalg_${ri}$_expm_inplace
+
+    module subroutine stdlib_linalg_${ri}$_expm(A, E, order, err)
+        !> Input matrix A(n, n)
+        ${rt}$, intent(in) :: A(:, :)
+        !> Output matrix exponential E = exp(A)
+        ${rt}$, intent(out) :: E(:, :)
+        !> [optional] Order of the Pade approximation (default `order=10`)
+        integer(ilp), optional, intent(in) :: order
+        !> [optional] State return flag.
+        type(linalg_state_type), optional, intent(out) :: err
+    end subroutine stdlib_linalg_${ri}$_expm
+    #:endfor
+  end interface matrix_exp
+
 contains
 
 
diff --git a/src/stdlib_linalg_matrix_functions.fypp b/src/stdlib_linalg_matrix_functions.fypp
@@ -15,22 +15,62 @@ submodule (stdlib_linalg) stdlib_linalg_matrix_functions
 contains
 
     #:for rk,rt,ri in RC_KINDS_TYPES 
-    module function stdlib_expm_${ri}$(A, order, err) result(E)
+    module function stdlib_linalg_${ri}$_expm_fun(A, order) result(E)
+        !> Matrix to exponentiate, A(n, n); it is left unmodified.
+        ${rt}$, intent(in) :: A(:, :)
+        !> [optional] Pade approximation order, forwarded to the in-place driver.
+        integer(ilp), optional, intent(in) :: order
+        !> Result E = exp(A), obtained by running the in-place driver on a copy of A.
+        ${rt}$, allocatable :: E(:, :)
+        allocate (E, source=A)
+        call stdlib_linalg_${ri}$_expm_inplace(E, order)
+    end function stdlib_linalg_${ri}$_expm_fun
+
+    module subroutine stdlib_linalg_${ri}$_expm(A, E, order, err)
         !> Input matrix A(n, n).
         ${rt}$, intent(in) :: A(:, :)
         !> [optional] Order of the Pade approximation.
         integer(ilp), optional, intent(in) :: order
         !> [optional] State return flag.
         type(linalg_state_type), optional, intent(out) :: err
         !> Exponential of the input matrix E = exp(A).
-        ${rt}$, allocatable :: E(:, :)
+        ${rt}$, intent(out) :: E(:, :)
+
+        type(linalg_state_type) :: err0
+        integer(ilp) :: lda, n, lde, ne
+
+        ! A must be square and non-empty, and E must have exactly the shape of A.
+        lda = size(A, 1, kind=ilp) ; n = size(A, 2, kind=ilp)
+        lde = size(E, 1, kind=ilp) ; ne = size(E, 2, kind=ilp)
+
+        if (lda<1 .or. n<1 .or. lda/=n .or. lde/=n .or. ne/=n) then
+            err0 = linalg_state_type(this,LINALG_VALUE_ERROR, &
+                                     'invalid matrix sizes: A=',[lda,n], &
+                                                          ' E=',[lde,ne])
+        else
+            ! Collect the in-place driver's status in err0 (not err), so that the
+            ! final error handling call below reports it instead of discarding it.
+            E = A ; call stdlib_linalg_${ri}$_expm_inplace(E, order, err0)
+        endif
+
+        ! Single exit point: forward the collected state (size check or driver).
+        call linalg_error_handling(err0,err)
+    end subroutine stdlib_linalg_${ri}$_expm
+
+    module subroutine stdlib_linalg_${ri}$_expm_inplace(A, order, err)
+        !> On entry: square matrix A(n, n). On exit: overwritten by the computed exp(A).
+        ${rt}$, intent(inout) :: A(:, :)
+        !> [optional] Order of the Pade approximation.
+        integer(ilp), optional, intent(in) :: order
+        !> [optional] State return flag.
+        type(linalg_state_type), optional, intent(out) :: err
 
         ! Internal variables.
-        ${rt}$, allocatable :: A2(:, :), Q(:, :), X(:, :)
-        real(${rk}$)        :: a_norm, c
-        integer(ilp)        :: m, n, ee, k, s, order_, i, j
-        logical(lk)         :: p
-        type(linalg_state_type)     :: err0
+        ${rt}$, allocatable     :: A2(:, :), Q(:, :), X(:, :)
+        real(${rk}$)            :: a_norm, c
+        integer(ilp)            :: m, n, ee, k, s, order_, i, j
+        logical(lk)             :: p
+        type(linalg_state_type) :: err0
 
         ! Deal with optional args.
         order_ = 10 ; if (present(order)) order_ = order
@@ -40,82 +80,80 @@ contains
 
         if (m /= n) then
             err0 = linalg_state_type(this,LINALG_VALUE_ERROR,'Invalid matrix size A=',[m, n])
-            call linalg_error_handling(err0, err)
-            return
         else if (order_ < 0) then
             err0 = linalg_state_type(this, LINALG_VALUE_ERROR, 'Order of Pade approximation &
                                     needs to be positive, order=', order_)
-            call linalg_error_handling(err0, err)
-            return
-        endif
+        else
+            ! Compute the L-infinity norm.
+            a_norm = mnorm(A, "inf")
 
-        ! Compute the L-infinity norm.
-        a_norm = mnorm(A, "inf")
-
-        ! Determine scaling factor for the matrix.
-        ee = int(log(a_norm) / log2_${rk}$, kind=ilp) + 1
-        s  = max(0, ee+1)
-
-        ! Scale the input matrix & initialize polynomial.
-        A2 = A/2.0_${rk}$**s ; X = A2
-
-        ! First step of the Pade approximation.
-        c = 0.5_${rk}$
-        allocate (E, source=A2) ; allocate (Q, source=A2)
-        do concurrent(i=1:n, j=1:n)
-            E(i, j) = merge(1.0_${rk}$ + c*E(i, j), c*E(i, j), i == j)
-            Q(i, j) = merge(1.0_${rk}$ - c*Q(i, j), -c*Q(i, j), i == j)
-        enddo
-
-        ! Iteratively compute the Pade approximation.
-        block
-            ${rt}$ :: X_tmp(n, n)
-            p = .true.
-            do k = 2, order_
-                c = c * (order_ - k + 1) / (k * (2*order_ - k + 1))
-                X_tmp = X
-                #:if rt.startswith('complex')
-                call gemm("N", "N", n, n, n, one_c${rk}$, A2, n, X_tmp, n, zero_c${rk}$, X, n)
-                #:else
-                call gemm("N", "N", n, n, n, one_${rk}$, A2, n, X_tmp, n, zero_${rk}$, X, n)
-                #:endif
-                do concurrent(i=1:n, j=1:n)
-                    E(i, j) = E(i, j) + c*X(i, j)       ! E = E + c*X
-                enddo
-                if (p) then
-                    do concurrent(i=1:n, j=1:n)
-                        Q(i, j) = Q(i, j) + c*X(i, j)   ! Q = Q + c*X
-                    enddo
-                else
+            ! Choose s: A is divided by 2**s below and the result is squared s times at the end.
+            ee = int(log(a_norm) / log2_${rk}$, kind=ilp) + 1
+            s  = max(0, ee+1)
+
+            ! Scale the input matrix & initialize polynomial.
+            A2 = A/2.0_${rk}$**s ; X = A2
+
+            ! Order-1 terms: A now holds the numerator I + c*A2, Q the denominator I - c*A2.
+            c = 0.5_${rk}$
+            allocate (Q, source=A2) ; A = A2
+            do concurrent(i=1:n, j=1:n)
+                A(i, j) = merge(1.0_${rk}$ + c*A(i, j), c*A(i, j), i == j)
+                Q(i, j) = merge(1.0_${rk}$ - c*Q(i, j), -c*Q(i, j), i == j)
+            enddo
+
+            ! Iteratively compute the Pade approximation.
+            block
+                ${rt}$ :: X_tmp(n, n)
+                p = .true.
+                do k = 2, order_
+                    c = c * (order_ - k + 1) / (k * (2*order_ - k + 1))
+                    X_tmp = X
+                    #:if rt.startswith('complex')
+                    call gemm("N", "N", n, n, n, one_c${rk}$, A2, n, X_tmp, n, zero_c${rk}$, X, n)
+                    #:else
+                    call gemm("N", "N", n, n, n, one_${rk}$, A2, n, X_tmp, n, zero_${rk}$, X, n)
+                    #:endif
                     do concurrent(i=1:n, j=1:n)
-                        Q(i, j) = Q(i, j) - c*X(i, j)   ! Q = Q - c*X
+                        A(i, j) = A(i, j) + c*X(i, j)       ! A = A + c*X
                     enddo
-                endif
-                p = .not. p
-            enddo
-        end block
-
-        block
-            integer(ilp) :: ipiv(n), info
-            call gesv(n, n, Q, n, ipiv, E, n, info) ! E = inv(Q) @ E
-            call handle_gesv_info(this, info, n, n, n, err0)
-            call linalg_error_handling(err0, err)
-        end block
-
-        ! Matrix squaring.
-        block
-            ${rt}$ :: E_tmp(n, n)
-            do k = 1, s
-                E_tmp = E
-                #:if rt.startswith('complex')
-                call gemm("N", "N", n, n, n, one_c${rk}$, E_tmp, n, E_tmp, n, zero_c${rk}$, E, n)
-                #:else
-                call gemm("N", "N", n, n, n, one_${rk}$, E_tmp, n, E_tmp, n, zero_${rk}$, E, n)
-                #:endif
-            enddo
-        end block
+                    if (p) then
+                        do concurrent(i=1:n, j=1:n)
+                            Q(i, j) = Q(i, j) + c*X(i, j)   ! Q = Q + c*X
+                        enddo
+                    else
+                        do concurrent(i=1:n, j=1:n)
+                            Q(i, j) = Q(i, j) - c*X(i, j)   ! Q = Q - c*X
+                        enddo
+                    endif
+                    p = .not. p
+                enddo
+            end block
+
+            block
+                integer(ilp) :: ipiv(n), info
+                call gesv(n, n, Q, n, ipiv, A, n, info) ! A = inv(Q) @ A
+                call handle_gesv_info(this, info, n, n, n, err0)
+            end block
+
+            ! Undo the scaling: square the result s times (A <- A @ A).
+            block
+                ${rt}$ :: E_tmp(n, n)
+                do k = 1, s
+                    E_tmp = A
+                    #:if rt.startswith('complex')
+                    call gemm("N", "N", n, n, n, one_c${rk}$, E_tmp, n, E_tmp, n, zero_c${rk}$, A, n)
+                    #:else
+                    call gemm("N", "N", n, n, n, one_${rk}$, E_tmp, n, E_tmp, n, zero_${rk}$, A, n)
+                    #:endif
+                enddo
+            end block
+        endif
+        ! Single exit point: every branch above leaves its state in err0.
+        call linalg_error_handling(err0, err)
+
         return
-    end function stdlib_expm_${ri}$
+    end subroutine stdlib_linalg_${ri}$_expm_inplace
     #:endfor
 
 end submodule stdlib_linalg_matrix_functions
diff --git a/test/linalg/test_linalg_expm.fypp b/test/linalg/test_linalg_expm.fypp
@@ -4,7 +4,7 @@
 module test_linalg_expm
     use testdrive, only: error_type, check, new_unittest, unittest_type
     use stdlib_linalg_constants
-    use stdlib_linalg, only: expm, eye, norm
+    use stdlib_linalg, only: expm, eye, norm, matrix_exp
     use stdlib_linalg_state, only: linalg_state_type, linalg_error_handling, LINALG_ERROR, &
          LINALG_INTERNAL_ERROR, LINALG_VALUE_ERROR
 
@@ -82,13 +82,13 @@ module test_linalg_expm
         enddo
 
         ! Compute matrix exponential.
-        E = expm(A, order=-1, err=err)
+        call matrix_exp(A, E, order=-1, err=err)
         ! Check result.
         call check(error, err%error(), "Negative Pade order")
         if (allocated(error)) return
 
         ! Compute matrix exponential.
-        E = expm(A(:n, :n-1), err=err)
+        call matrix_exp(A(:n, :n-1), E, err=err)
         ! Check result.
         call check(error, err%error(), "Invalid matrix size")
         if (allocated(error)) return