-
-
Notifications
You must be signed in to change notification settings - Fork 541
Add LDL decomposition #1515
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Open
ajefweiss
wants to merge
5
commits into
dimforge:main
Choose a base branch
from
ajefweiss:ldldecomp
base: main
Could not load branches
Branch not found: {{ refName }}
Loading
Could not load tags
Nothing to show
Loading
Are you sure you want to change the base?
Some commits from the old base branch may be removed from the timeline,
and old review comments may become outdated.
+252
−1
Open
Add LDL decomposition #1515
Changes from all commits
Commits
Show all changes
5 commits
Select commit
Hold shift + click to select a range
5592c9f
basic ldl implementation, based on udu
ajefweiss b875935
test for cholesky eq
ajefweiss 00ca97b
hermitian ldl, better tests
ajefweiss d562fbd
update docs, renamed cholesky_l to lsqrt and added extra checks
ajefweiss 43fd280
in place ldl factorization
ajefweiss File filter
Filter by extension
Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
There are no files selected for viewing
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,121 @@ | ||
| #[cfg(feature = "serde-serialize-no-std")] | ||
| use serde::{Deserialize, Serialize}; | ||
|
|
||
| use crate::allocator::Allocator; | ||
| use crate::base::{Const, DefaultAllocator, OMatrix, OVector}; | ||
| use crate::dimension::Dim; | ||
| use simba::scalar::ComplexField; | ||
|
|
||
| /// The LDL / LDL^T factorization of a Hermitian matrix A = LDL^T where L is a lower unit-triangular matrix and D is diagonal matrix. | ||
| #[cfg_attr(feature = "serde-serialize-no-std", derive(Serialize, Deserialize))] | ||
| #[cfg_attr( | ||
| feature = "serde-serialize-no-std", | ||
| serde(bound(serialize = "OMatrix<T, D, D>: Serialize")) | ||
| )] | ||
| #[cfg_attr( | ||
| feature = "serde-serialize-no-std", | ||
| serde(bound(deserialize = "OMatrix<T, D, D>: Deserialize<'de>")) | ||
| )] | ||
| #[derive(Clone, Debug)] | ||
| pub struct LDL<T: ComplexField, D: Dim>(OMatrix<T, D, D>) | ||
| where | ||
| DefaultAllocator: Allocator<D> + Allocator<D, D>; | ||
|
|
||
| impl<T: ComplexField, D: Dim> Copy for LDL<T, D> | ||
| where | ||
| DefaultAllocator: Allocator<D> + Allocator<D, D>, | ||
| OMatrix<T, D, D>: Copy, | ||
| { | ||
| } | ||
|
|
||
| impl<T: ComplexField, D: Dim> LDL<T, D> | ||
| where | ||
| DefaultAllocator: Allocator<D> + Allocator<D, D>, | ||
| { | ||
| /// Returns the diagonal elements as a vector. | ||
| #[must_use] | ||
| pub fn d(&self) -> OVector<T, D> { | ||
| self.0.diagonal() | ||
| } | ||
|
|
||
| /// Returns the diagonal elements as a matrix. | ||
| #[must_use] | ||
| pub fn d_matrix(&self) -> OMatrix<T, D, D> { | ||
| OMatrix::from_diagonal(&self.0.diagonal()) | ||
| } | ||
|
|
||
| /// Returns the lower triangular matrix. | ||
| #[must_use] | ||
| pub fn l_matrix(&self) -> OMatrix<T, D, D> { | ||
| let mut l = self.0.clone(); | ||
|
|
||
| l.column_iter_mut() | ||
| .enumerate() | ||
| .for_each(|(idx, mut column)| { | ||
| column[idx] = T::one(); | ||
| }); | ||
|
|
||
| l | ||
| } | ||
|
|
||
| /// Returns the matrix L * sqrt(D). | ||
| /// This function returns `None` if the square root of any of the values in the diagonal matrix D is not finite. | ||
| /// | ||
| /// This function can be used to generate a lower triangular matrix as if it were generated by the Cholesky decomposition, without the requirement of positive definiteness. | ||
| pub fn lsqrtd(&self) -> Option<OMatrix<T, D, D>> { | ||
| let n_dim = self.0.shape_generic().1; | ||
|
|
||
| let lsqrtd: crate::Matrix<T, D, D, <DefaultAllocator as Allocator<D, D>>::Buffer<T>> = &self | ||
| .l_matrix() | ||
| * OMatrix::from_diagonal(&OVector::from_iterator_generic( | ||
| n_dim, | ||
| Const::<1>, | ||
| self.d().iter().map(|value| value.clone().sqrt()), | ||
| )); | ||
|
|
||
| // Check for any non-finite numbers in lsqrtd and return None if necessary. | ||
| if !lsqrtd.iter().fold(true, |acc, next| acc & next.is_finite()) { | ||
| None | ||
| } else { | ||
| Some(lsqrtd) | ||
| } | ||
| } | ||
|
|
||
| /// Computes the LDL / LDL^T factorization. | ||
| pub fn new(mut matrix: OMatrix<T, D, D>) -> Option<Self> { | ||
| for j in 0..matrix.ncols() { | ||
| let mut d_j: T = matrix[(j, j)].clone(); | ||
|
|
||
| if j > 0 { | ||
| for k in 0..j { | ||
| d_j -= matrix[(j, k)].clone() | ||
| * matrix[(j, k)].clone().conjugate() | ||
| * matrix[(k, k)].clone(); | ||
| } | ||
| } | ||
|
|
||
| matrix[(j, j)] = d_j; | ||
|
|
||
| for i in (j + 1)..matrix.ncols() { | ||
| let mut l_ij = matrix[(i, j)].clone(); | ||
|
|
||
| for k in 0..j { | ||
| l_ij -= matrix[(j, k)].clone().conjugate() | ||
| * matrix[(i, k)].clone() | ||
| * matrix[(k, k)].clone(); | ||
| } | ||
|
|
||
| if matrix[(j, j)] == T::zero() { | ||
| matrix[(i, j)] = T::zero(); | ||
| } else { | ||
| matrix[(i, j)] = l_ij / matrix[(j, j)].clone(); | ||
| } | ||
|
|
||
| // Zero out the upper triangular part. | ||
| matrix[(j, i)] = T::zero(); | ||
| } | ||
| } | ||
|
|
||
| Some(Self(matrix)) | ||
| } | ||
| } |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,115 @@ | ||
| use na::{Complex, Matrix3}; | ||
| use num::Zero; | ||
|
|
||
| #[test] | ||
| #[rustfmt::skip] | ||
| fn ldl_simple() { | ||
| let m = Matrix3::new( | ||
| Complex::new(2.0, 0.0), Complex::new(-1.0, 0.5), Complex::zero(), | ||
| Complex::new(-1.0, -0.5), Complex::new(2.0, 0.0), Complex::new(-1.0, 0.0), | ||
| Complex::zero(), Complex::new(-1.0, 0.0), Complex::new(2.0, 0.0)); | ||
|
|
||
| let ldl = m.ldl().unwrap(); | ||
|
|
||
| println!("{:}", &m); | ||
| println!("{:}", ldl.l_matrix()); | ||
| println!("{:}", ldl.d()); | ||
|
|
||
| // Rebuild | ||
| let p = ldl.l_matrix() * ldl.d_matrix() * ldl.l_matrix().adjoint(); | ||
|
|
||
|
|
||
| println!("{:}", &p); | ||
|
|
||
| assert!(relative_eq!(m, p, epsilon = 3.0e-12)); | ||
| } | ||
|
|
||
| #[test] | ||
| #[rustfmt::skip] | ||
| fn ldl_partial() { | ||
| let m = Matrix3::new( | ||
| Complex::new(2.0, 0.0), Complex::zero(), Complex::zero(), | ||
| Complex::zero(), Complex::zero(), Complex::zero(), | ||
| Complex::zero(), Complex::zero(), Complex::new(2.0, 0.0)); | ||
|
|
||
| let ldl = m.lower_triangle().ldl().unwrap(); | ||
|
|
||
| // Rebuild | ||
| let p = ldl.l_matrix() * ldl.d_matrix() * ldl.l_matrix().adjoint(); | ||
|
|
||
| assert!(relative_eq!(m, p, epsilon = 3.0e-12)); | ||
| } | ||
|
|
||
| #[test] | ||
| #[rustfmt::skip] | ||
| fn ldl_lsqrtd() { | ||
| let m = Matrix3::new( | ||
| Complex::new(2.0, 0.0), Complex::new(-1.0, 0.5), Complex::zero(), | ||
| Complex::new(-1.0, -0.5), Complex::new(2.0, 0.0), Complex::new(-1.0, 0.0), | ||
| Complex::zero(), Complex::new(-1.0, 0.0), Complex::new(2.0, 0.0)); | ||
|
|
||
| let chol= m.cholesky().unwrap(); | ||
| let ldl = m.ldl().unwrap(); | ||
|
|
||
| assert!(relative_eq!(ldl.lsqrtd().unwrap(), chol.l(), epsilon = 3.0e-16)); | ||
| } | ||
|
|
||
| #[test] | ||
| #[should_panic] | ||
| #[rustfmt::skip] | ||
| fn ldl_non_sym_panic() { | ||
| let m = Matrix3::new( | ||
| 2.0, -1.0, 0.0, | ||
| 1.0, -2.0, 3.0, | ||
| -2.0, 1.0, 0.3); | ||
|
|
||
| let ldl = m.ldl().unwrap(); | ||
|
|
||
| // Rebuild | ||
| let p = ldl.l_matrix() * ldl.d_matrix() * ldl.l_matrix().transpose(); | ||
|
|
||
| assert!(relative_eq!(m, p, epsilon = 3.0e-16)); | ||
| } | ||
|
|
||
| #[cfg(feature = "proptest-support")] | ||
| mod proptest_tests { | ||
| #[allow(unused_imports)] | ||
| use crate::core::helper::{RandComplex, RandScalar}; | ||
|
|
||
| macro_rules! gen_tests( | ||
| ($module: ident, $scalar: expr) => { | ||
| mod $module { | ||
| #[allow(unused_imports)] | ||
| use crate::core::helper::{RandScalar, RandComplex}; | ||
| use crate::proptest::*; | ||
| use proptest::{prop_assert, proptest}; | ||
|
|
||
| proptest! { | ||
| #[test] | ||
| fn ldl(m in dmatrix_($scalar)) { | ||
| let m = &m * m.adjoint(); | ||
|
|
||
| if let Some(ldl) = m.clone().ldl() { | ||
| let p = &ldl.l * &ldl.d_matrix() * &ldl.l.transpose(); | ||
| println!("m: {}, p: {}", m, p); | ||
|
|
||
| prop_assert!(relative_eq!(m, p, epsilon = 1.0e-7)); | ||
| } | ||
| } | ||
|
|
||
| #[test] | ||
| fn ldl_static(m in matrix4_($scalar)) { | ||
| let m = m.hermitian_part(); | ||
|
|
||
| if let Some(ldl) = m.ldl() { | ||
| let p = ldl.l * ldl.d_matrix() * ldl.l.transpose(); | ||
| prop_assert!(relative_eq!(m, p, epsilon = 1.0e-7)); | ||
| } | ||
| } | ||
| } | ||
| } | ||
| } | ||
| ); | ||
|
|
||
| gen_tests!(f64, PROPTEST_F64); | ||
| } | ||
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -8,6 +8,7 @@ mod exp; | |
| mod full_piv_lu; | ||
| mod hessenberg; | ||
| mod inverse; | ||
| mod ldl; | ||
| mod lu; | ||
| mod pow; | ||
| mod qr; | ||
|
|
||
Add this suggestion to a batch that can be applied as a single commit.
This suggestion is invalid because no changes were made to the code.
Suggestions cannot be applied while the pull request is closed.
Suggestions cannot be applied while viewing a subset of changes.
Only one suggestion per line can be applied in a batch.
Add this suggestion to a batch that can be applied as a single commit.
Applying suggestions on deleted lines is not supported.
You must change the existing code in this line in order to create a valid suggestion.
Outdated suggestions cannot be applied.
This suggestion has been applied or marked resolved.
Suggestions cannot be applied from pending reviews.
Suggestions cannot be applied on multi-line comments.
Suggestions cannot be applied while the pull request is queued to merge.
Suggestion cannot be applied right now. Please check back later.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
If I understood correctly what you said in the comment, then this implementation of the LDL^T decomposition requires the matrix to be symmetric positive definite (not semi definite), right? However, using
M M^Twill only give us pos. semidefinite, so we should expect some spurious failures here. I've actually run into the same problem innalgebra-lapackand you can see my solution here. I've added a proptest function that gives a spd matrix in a bit of a hacky, but sound way: The idea is to useM' = M M^T + alpha * Id, where alpha is chosen suitably large to make we don't get into numerical trouble. You should be able to easily adapt the functions to return complex matrices.Uh oh!
There was an error while loading. Please reload this page.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
just wanted to weigh in - i'm a little confused actually... the 'point' of LDL is that it's a generalisation of the Cholesky algorithm to all symmetric/Hermitian matrices, with no requirements on positive definiteness/semi-definiteness. If it only works for definite/semidefinite matrices then there's no benefit to using LDL over Cholesky, which is a simpler decomposition and a more efficient algorithm.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Sorry if the above text is slightly confusing. But no, the LDL/LDL^T decomposition only requires the matrix to be symmetric. It does NOT require it to be positive definite. This is stated in both textbooks referenced here.
The problem is that, in both cases, the algorithms that are shown DO require the matrix to be positive OR negative definite. I'd have to look deeper into this, but I think this is because in the semi-positive/negative definite cases the solution is not unique. I think there is a choice for the particular column where the corresponding value in the D matrix is zero.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Thanks for working on this! Having an LDL-like factorization in nalgebra would be genuinely useful.
As written, this looks to me like the standard no-pivot, strictly diagonal LDLᵀ/LDLᴴ recursion, rather than the more general symmetric-indefinite factorization many users may expect from an
LDLAPI.To handle symmetric/Hermitian-indefinite factorizations, you have to use the Bunch–Kaufman family (or equivalent): symmetric pivoting/permutations, with
Dallowed to have 1×1 and 2×2 blocks. That extra machinery matters for general Hermitian/symmetric indefinite matrices.In particular, without pivoting and with
Dforced to be strictly diagonal, this does not cover all symmetric matrices. For example, [[0, 1], [1, 0]] does not admit a factorization of the formA = L D Lᵀwith unit-lower-triangularLand diagonalDin that fixed ordering.Because of that, I’d be hesitant to expose this as a general-purpose
LDLfor Hermitian matrices unless the contract is made very explicit in the docs.I do think this could still be useful, but I think it would help to choose one of two directions explicitly:
LDL, aim for a pivoted/block-diagonal factorization closer to Bunch–Kaufman.There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Hey @awinick, thanks for weighing in! Do you have a source for the symmetric indefinite LDL decomposition that you mentioned?
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
The original '77 paper is openly available here https://www.ams.org/journals/mcom/1977-31-137/S0025-5718-1977-0428694-0/S0025-5718-1977-0428694-0.pdf. Also see the comment here #1515 (comment)
Personally I would prefer continuing with option (1) for the time being as it seems to cover most practical use cases that I have run into. I can clean up the code / docs a bit more at some later time when I have more free time.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
thank you!
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Hey @geo-ant you might be interested in the PR I just opened.