abacusmodeling
diff --git a/‎include/RI/global/Blas_Interface.h‎
Lines changed: 0 additions & 1 deletion b/‎include/RI/global/Blas_Interface.h‎
Lines changed: 0 additions & 1 deletion
diff --git a/‎include/RI/global/Lapack-Fortran.h‎
Lines changed: 43 additions & 0 deletions b/‎include/RI/global/Lapack-Fortran.h‎
Lines changed: 43 additions & 0 deletions
diff --git a/‎include/RI/global/Lapack_Interface-Contiguous.h‎
Lines changed: 39 additions & 0 deletions b/‎include/RI/global/Lapack_Interface-Contiguous.h‎
Lines changed: 39 additions & 0 deletions
diff --git a/‎include/RI/global/Lapack_Interface-Tensor.h‎
Lines changed: 48 additions & 0 deletions b/‎include/RI/global/Lapack_Interface-Tensor.h‎
Lines changed: 48 additions & 0 deletions
diff --git a/‎include/RI/global/Lapack_Interface.h‎
Lines changed: 157 additions & 0 deletions b/‎include/RI/global/Lapack_Interface.h‎
Lines changed: 157 additions & 0 deletions
diff --git a/‎include/RI/global/Tensor.h‎
Lines changed: 20 additions & 5 deletions b/‎include/RI/global/Tensor.h‎
Lines changed: 20 additions & 5 deletions
@@ -10,7 +10,6 @@
 #include <string>
 #include <stdexcept>
 
-
 #ifdef __MKL_RI
 #include <mkl_trans.h>
 #endif
 
@@ -0,0 +1,43 @@
+// ===================
+//  Author: Peize Lin
+//  date: 2022.12.25
+// ===================
+
+#pragma once
+
+#include <complex>
+
+namespace RI
+{
+
+extern "C"
+{
+	// potrf: LAPACK Cholesky factorization of a positive definite matrix (real symmetric for s/d, complex Hermitian for c/z); the status code is written to *info
+	void spotrf_(const char*const uplo, const int*const n, float*const A, const int*const lda, int*const info);
+	void dpotrf_(const char*const uplo, const int*const n, double*const A, const int*const lda, int*const info);
+	void cpotrf_(const char*const uplo, const int*const n, std::complex<float>*const A, const int*const lda, int*const info);
+	void zpotrf_(const char*const uplo, const int*const n, std::complex<double>*const A, const int*const lda, int*const info);
+
+	// potri: takes potrf's output (the Cholesky factor left in A) to perform matrix inversion; same argument list as potrf
+	void spotri_(const char*const uplo, const int*const n, float*const A, const int*const lda, int*const info);
+	void dpotri_(const char*const uplo, const int*const n, double*const A, const int*const lda, int*const info);
+	void cpotri_(const char*const uplo, const int*const n, std::complex<float>*const A, const int*const lda, int*const info);
+	void zpotri_(const char*const uplo, const int*const n, std::complex<double>*const A, const int*const lda, int*const info);		
+
+	// syev: solve the eigenproblem Ax=ex, where A is real symmetric; WORK/lwork is caller-supplied scratch space (the wrappers in this project pass lwork=-1 first to query its size)
+	void ssyev_(const char*const jobz, const char*const uplo,
+		const int*const n, float*const A, const int*const lda, float*const W,
+		float*const WORK, const int*const lwork, int*const info);
+	void dsyev_(const char*const jobz, const char*const uplo,
+		const int*const n, double*const A, const int*const lda, double*const W,
+		double*const WORK, const int*const lwork, int*const info);
+	// heev: solve the eigenproblem Ax=ex, where A is complex Hermitian; W is real-valued and an additional real scratch array RWORK is required
+	void cheev_(const char*const jobz, const char*const uplo,
+		const int*const n, std::complex<float>*const A, const int*const lda, float*const W,
+		std::complex<float>*const WORK, const int*const lwork, float*const RWORK, int*const info);
+	void zheev_(const char*const jobz, const char*const uplo,
+		const int*const n, std::complex<double>*const A, const int*const lda, double*const W,
+		std::complex<double>*const WORK, const int*const lwork, double*const RWORK, int*const info);
+}
+
+}
@@ -0,0 +1,39 @@
+// ===================
+//  Author: Peize Lin
+//  date: 2022.12.25
+// ===================
+
+#pragma once
+
+#include "Lapack_Interface.h"
+#include "Global_Func-2.h"
+
+namespace RI
+{
+
+namespace Lapack_Interface
+{
+	// Cholesky factorization (potrf) for a matrix stored contiguously, i.e. whose
+	// leading dimension equals n. Forwards to the four-argument potrf overload
+	// with lda = n and returns that overload's result unchanged.
+	template<typename T>
+	inline int potrf( const char &uplo, const int &n, T*const A )
+	{
+		const int &lda = n;		// contiguous storage: the leading dimension is n itself
+		return potrf(uplo, n, A, lda);
+	}
+	
+	// Matrix inversion from potrf's output (potri) for a matrix stored contiguously,
+	// i.e. whose leading dimension equals n. Forwards to the four-argument potri
+	// overload with lda = n and returns that overload's result unchanged.
+	template<typename T>
+	inline int potri( const char &uplo, const int &n, T*const A )
+	{
+		const int &lda = n;		// contiguous storage: the leading dimension is n itself
+		return potri(uplo, n, A, lda);
+	}
+
+	// Eigenproblem Ax=ex for Hermitian A stored contiguously, i.e. whose leading
+	// dimension equals n. W points to values of the real type associated with T.
+	// Forwards to the six-argument heev overload with lda = n and returns its result.
+	template<typename T>
+	inline int heev(const char &jobz, const char &uplo,
+		const int &n, T*const A, Global_Func::To_Real_t<T>*const W)
+	{
+		const int &lda = n;		// contiguous storage: the leading dimension is n itself
+		return heev(jobz, uplo, n, A, lda, W);
+	}
+}
+
+}
@@ -0,0 +1,48 @@
+// ===================
+//  Author: Peize Lin
+//  date: 2022.12.25
+// ===================
+
+#pragma once
+
+#include "Lapack_Interface-Contiguous.h"
+#include "Tensor.h"
+#include <cassert>
+#include <string>
+
+namespace RI
+{
+
+namespace Lapack_Interface
+{
+	// Cholesky factorization (potrf) applied directly to a Tensor.
+	// Asserts that A has exactly two dimensions of equal extent, then hands
+	// A.shape[0] and A.ptr() to the pointer-based overload and returns its result.
+	template<typename T>
+	inline int potrf( const char &uplo, Tensor<T> &A )
+	{
+		assert(A.shape.size()==2);
+		assert(A.shape[0]==A.shape[1]);
+		const auto order = A.shape[0];		// read only after the shape checks above
+		return potrf(uplo, order, A.ptr());
+	}
+
+	// Matrix inversion from potrf's output (potri) applied directly to a Tensor.
+	// Asserts that A has exactly two dimensions of equal extent, then hands
+	// A.shape[0] and A.ptr() to the pointer-based overload and returns its result.
+	template<typename T>
+	inline int potri( const char &uplo, Tensor<T> &A )
+	{
+		assert(A.shape.size()==2);
+		assert(A.shape[0]==A.shape[1]);
+		const auto order = A.shape[0];		// read only after the shape checks above
+		return potri(uplo, order, A.ptr());
+	}
+
+	// Eigenproblem Ax=ex for Hermitian A, applied directly to a Tensor.
+	// Asserts that A has exactly two dimensions of equal extent and that W already
+	// holds A.shape[0] elements (W is not resized here), then forwards the raw
+	// pointers to the pointer-based overload and returns its result.
+	template<typename T>
+	inline int heev(const char &jobz, const char &uplo,
+		Tensor<T> &A, std::vector<Global_Func::To_Real_t<T>> &W)
+	{
+		assert(A.shape.size()==2);
+		assert(A.shape[0]==A.shape[1]);
+		assert(A.shape[0]==W.size());
+		auto *const w_data = W.data();
+		return heev(jobz, uplo, A.shape[0], A.ptr(), w_data);
+	}
+}
+
+}
@@ -0,0 +1,157 @@
+// ===================
+//  Author: Peize Lin
+//  date: 2022.12.25
+// ===================
+
+#pragma once
+
+#include "Lapack-Fortran.h"
+#include "Blas_Interface.h"
+
+#include <algorithm>
+#include <complex>
+#include <stdexcept>
+#include <string>
+#include <type_traits>
+#include <vector>
+
+
+#ifdef __MKL_RI
+#include <mkl_trans.h>
+#endif
+
+#define LAPACK_INFO_CHECK(x) if(const int info=(x))	throw std::runtime_error("info="+std::to_string(info)+".\n"+std::string(__FILE__)+" line "+std::to_string(__LINE__));
+
+namespace RI
+{
+
+namespace Lapack_Interface
+{
+	// potrf computes the Cholesky factorization of a positive definite matrix.
+	// One overload per element type (float, double, complex<float>, complex<double>).
+	// Each one passes uplo through Blas_Interface::change_uplo before calling the
+	// Fortran routine (presumably to translate the triangle convention -- confirm
+	// in Blas_Interface) and returns the info value LAPACK reported.
+	inline int potrf( const char &uplo, const int &n, float*const A, const int &lda )
+	{
+		const char lapack_uplo = Blas_Interface::change_uplo(uplo);
+		int status = 0;
+		spotrf_( &lapack_uplo, &n, A, &lda, &status );
+		return status;
+	}
+	inline int potrf( const char &uplo, const int &n, double*const A, const int &lda )
+	{
+		const char lapack_uplo = Blas_Interface::change_uplo(uplo);
+		int status = 0;
+		dpotrf_( &lapack_uplo, &n, A, &lda, &status );
+		return status;
+	}
+	inline int potrf( const char &uplo, const int &n, std::complex<float>*const A, const int &lda )
+	{
+		const char lapack_uplo = Blas_Interface::change_uplo(uplo);
+		int status = 0;
+		cpotrf_( &lapack_uplo, &n, A, &lda, &status );
+		return status;
+	}
+	inline int potrf( const char &uplo, const int &n, std::complex<double>*const A, const int &lda )
+	{
+		const char lapack_uplo = Blas_Interface::change_uplo(uplo);
+		int status = 0;
+		zpotrf_( &lapack_uplo, &n, A, &lda, &status );
+		return status;
+	}
+
+	// potri takes potrf's output to perform matrix inversion.
+	// One overload per element type (float, double, complex<float>, complex<double>).
+	// Each one passes uplo through Blas_Interface::change_uplo before calling the
+	// Fortran routine (presumably to translate the triangle convention -- confirm
+	// in Blas_Interface) and returns the info value LAPACK reported.
+	inline int potri( const char &uplo, const int &n, float*const A, const int &lda )
+	{
+		const char lapack_uplo = Blas_Interface::change_uplo(uplo);
+		int status = 0;
+		spotri_( &lapack_uplo, &n, A, &lda, &status );
+		return status;
+	}
+	inline int potri( const char &uplo, const int &n, double*const A, const int &lda )
+	{
+		const char lapack_uplo = Blas_Interface::change_uplo(uplo);
+		int status = 0;
+		dpotri_( &lapack_uplo, &n, A, &lda, &status );
+		return status;
+	}
+	inline int potri( const char &uplo, const int &n, std::complex<float>*const A, const int &lda )
+	{
+		const char lapack_uplo = Blas_Interface::change_uplo(uplo);
+		int status = 0;
+		cpotri_( &lapack_uplo, &n, A, &lda, &status );
+		return status;
+	}
+	inline int potri( const char &uplo, const int &n, std::complex<double>*const A, const int &lda )
+	{
+		const char lapack_uplo = Blas_Interface::change_uplo(uplo);
+		int status = 0;
+		zpotri_( &lapack_uplo, &n, A, &lda, &status );
+		return status;
+	}
+
+	// solve the eigenproblem Ax=ex, where A is Symmetric (float and double overloads).
+	// The caller supplies the scratch buffer WORK and its length lwork.
+	// uplo is passed through Blas_Interface::change_uplo before the Fortran call;
+	// jobz is forwarded as given. Returns the info value LAPACK reported.
+	inline int syev(const char &jobz, const char &uplo,
+		const int &n, float*const A, const int &lda, float*const W,
+		float*const WORK, const int &lwork)
+	{
+		const char lapack_uplo = Blas_Interface::change_uplo(uplo);
+		int status = 0;
+		ssyev_(&jobz, &lapack_uplo, &n, A, &lda, W, WORK, &lwork, &status);
+		return status;
+	}
+	inline int syev(const char &jobz, const char &uplo,
+		const int &n, double*const A, const int &lda, double*const W,
+		double*const WORK, const int &lwork)
+	{
+		const char lapack_uplo = Blas_Interface::change_uplo(uplo);
+		int status = 0;
+		dsyev_(&jobz, &lapack_uplo, &n, A, &lda, W, WORK, &lwork, &status);
+		return status;
+	}
+	// solve the eigenproblem Ax=ex, where A is Hermitian (complex<float> and complex<double> overloads).
+	// The caller supplies the complex scratch buffer WORK (length lwork) and the real
+	// scratch buffer RWORK. uplo is passed through Blas_Interface::change_uplo before
+	// the Fortran call; jobz is forwarded as given. Returns the info value LAPACK reported.
+	inline int heev(const char &jobz, const char &uplo,
+		const int &n, std::complex<float>*const A, const int &lda, float*const W,
+		std::complex<float>*const WORK, const int &lwork, float*const RWORK)
+	{
+		const char lapack_uplo = Blas_Interface::change_uplo(uplo);
+		int status = 0;
+		cheev_(&jobz, &lapack_uplo, &n, A, &lda, W, WORK, &lwork, RWORK, &status);
+		return status;
+	}
+	inline int heev(const char &jobz, const char &uplo,
+		const int &n, std::complex<double>*const A, const int &lda, double*const W,
+		std::complex<double>*const WORK, const int &lwork, double*const RWORK)
+	{
+		const char lapack_uplo = Blas_Interface::change_uplo(uplo);
+		int status = 0;
+		zheev_(&jobz, &lapack_uplo, &n, A, &lda, W, WORK, &lwork, RWORK, &status);
+		return status;
+	}
+
+	// heev for real element types: solves Ax=ex through syev while managing the workspace itself.
+	// Step 1 calls syev with lwork=-1 so that the required workspace length is written
+	// into a single scalar; a nonzero info from that query throws std::runtime_error
+	// (via LAPACK_INFO_CHECK). Step 2 allocates the workspace and runs syev for real.
+	// Returns the info value of the second call; that one is NOT turned into an exception.
+	template<typename T,
+		typename std::enable_if< std::is_arithmetic<T>::value,int>::type =0>
+	inline int heev(const char &jobz, const char &uplo,
+		const int &n, T*const A, const int &lda, T*const W)
+	{
+		constexpr int workspace_query = -1;
+		T reported_size=100;
+		LAPACK_INFO_CHECK(syev(jobz, uplo, n, A, lda, W, &reported_size, workspace_query));		// get best lwork
+
+		const int lwork = static_cast<int>(reported_size);
+		std::vector<T> workspace(std::max(1,lwork));		// never allocate an empty buffer
+		return syev(jobz, uplo, n, A, lda, W, workspace.data(), lwork);
+	}
+	// heev for complex element types: solves Ax=ex for Hermitian A while managing both workspaces itself.
+	// The real scratch array holds max(1, 3*n-2) elements. Step 1 calls the raw heev
+	// with lwork=-1 so that the required complex workspace length is written into a
+	// single scalar; a nonzero info from that query throws std::runtime_error (via
+	// LAPACK_INFO_CHECK). Step 2 allocates the workspace and runs heev for real.
+	// Returns the info value of the second call; that one is NOT turned into an exception.
+	template<typename T,
+		typename std::enable_if< std::is_arithmetic<T>::value,int>::type =0>
+	inline int heev(const char &jobz, const char &uplo,
+		const int &n, std::complex<T>*const A, const int &lda, T*const W)
+	{
+		std::vector<T> real_workspace(std::max(1,3*n-2));
+
+		constexpr int workspace_query = -1;
+		std::complex<T> reported_size;
+		LAPACK_INFO_CHECK(heev(jobz, uplo, n, A, lda, W, &reported_size, workspace_query, real_workspace.data()));		// get best lwork
+
+		const int lwork = static_cast<int>(std::real(reported_size));		// the size comes back in the real part
+		std::vector<std::complex<T>> workspace(std::max(1,lwork));		// never allocate an empty buffer
+		return heev(jobz, uplo, n, A, lda, W, workspace.data(), lwork, real_workspace.data());
+	}
+}
+
+}
+
+#undef LAPACK_INFO_CHECK
@@ -60,16 +60,16 @@ class Tensor
 
 
 template<typename T>
-Tensor<T> operator+ (const Tensor<T> &t1, const Tensor<T> &t2);
+extern Tensor<T> operator+ (const Tensor<T> &t1, const Tensor<T> &t2);
 template<typename T>
-Tensor<T> operator- (const Tensor<T> &t1, const Tensor<T> &t2);
+extern Tensor<T> operator- (const Tensor<T> &t1, const Tensor<T> &t2);
 
 template<typename T>
-Tensor<T> operator* (const Tensor<T> &t1, const Tensor<T> &t2);
+extern Tensor<T> operator* (const Tensor<T> &t1, const Tensor<T> &t2);
 template<typename T>
-Tensor<T> operator* (const T &t1, const Tensor<T> &t2);
+extern Tensor<T> operator* (const T &t1, const Tensor<T> &t2);
 template<typename T>
-Tensor<T> operator* (const Tensor<T> &t1, const T &t2);
+extern Tensor<T> operator* (const Tensor<T> &t1, const T &t2);
 
 
 namespace Global_Func
@@ -78,6 +78,21 @@ namespace Global_Func
 	Tensor<Tout> convert(const Tensor<Tin> &t);
 }
 
+
+template<typename T, std::size_t N0>
+extern Tensor<T> to_Tensor(const std::array<T,N0> &a);		// declaration only (defined elsewhere): takes a std::array<T,N0>, returns a Tensor<T>
+template<typename T, std::size_t N0, std::size_t N1>
+extern Tensor<T> to_Tensor(const std::array<std::array<T,N1>,N0> &a);		// declaration only: same, for a two-level nested std::array (N0 outer, N1 inner)
+template<typename T, std::size_t N0, std::size_t N1, std::size_t N2>
+extern Tensor<T> to_Tensor(const std::array<std::array<std::array<T,N2>,N1>,N0> &a);		// declaration only: same, for a three-level nested std::array
+
+template<typename T, std::size_t N0>
+extern std::array<T,N0> to_array(const Tensor<T> &t);		// declaration only: N0 appears only in the return type, so callers must spell it out explicitly
+template<typename T, std::size_t N0, std::size_t N1>
+extern std::array<std::array<T,N1>,N0> to_array(const Tensor<T> &t);		// declaration only: two-level result; N0 and N1 must be given explicitly
+template<typename T, std::size_t N0, std::size_t N1, std::size_t N2>
+extern std::array<std::array<std::array<T,N2>,N1>,N0> to_array(const Tensor<T> &t);		// declaration only: three-level result; N0, N1 and N2 must be given explicitly
+
 }
 
 #include "Blas_Interface-Tensor.h"