Skip to content

Commit 0801fcc

Browse files
Update lapack.cu
1 parent 1bed146 commit 0801fcc

File tree

1 file changed

+5
-3
lines changed
  • source/source_base/module_container/ATen/kernels/cuda

1 file changed

+5
-3
lines changed

source/source_base/module_container/ATen/kernels/cuda/lapack.cu

Lines changed: 5 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -70,8 +70,10 @@ struct lapack_trtri<T, DEVICE_GPU> {
70 70
{
71 71
// TODO: trtri is not implemented in this method yet
72 72
// Cause the trtri in cuSolver is not stable for ABACUS!
73-
//cuSolverConnector::trtri(cusolver_handle, uplo, diag, dim, Mat, lda);
74-
cuSolverConnector::potri(cusolver_handle, uplo, diag, dim, Mat, lda);
73+
// But why?! trtri and potri are different routines for different job!
74+
// How can BPCG work without using a proper routine?
75+
cuSolverConnector::trtri(cusolver_handle, uplo, diag, dim, Mat, lda);
76+
// cuSolverConnector::potri(cusolver_handle, uplo, diag, dim, Mat, lda);
75 77
}
76 78
};
77 79

@@ -201,4 +203,4 @@ template struct lapack_getrs<std::complex<float>, DEVICE_GPU>;
201 203
template struct lapack_getrs<std::complex<double>, DEVICE_GPU>;
202 204

203 205
} // namespace kernels
204-
} // namespace container
206+
} // namespace container

0 commit comments

Comments
 (0)