From e2bd8623f88c3e7aa1c4a2eaa5dc7ab351219a33 Mon Sep 17 00:00:00 2001 From: Gael Guennebaud Date: Mon, 13 Oct 2008 13:14:43 +0000 Subject: [PATCH] Solve the issue found by Timothy in solveTriangular: => row-major rhs are now evaluated to a column-major temporary before the computations. Add solveInPlace in Cholesky* --- Eigen/src/Cholesky/Cholesky.h | 34 ++++++++++++++++- .../src/Cholesky/CholeskyWithoutSquareRoot.h | 37 +++++++++++++++++-- Eigen/src/Core/MatrixBase.h | 9 +++-- Eigen/src/Core/Product.h | 17 +-------- Eigen/src/Core/SolveTriangular.h | 37 +++++++++++++------ Eigen/src/Core/util/XprHelper.h | 12 ++++++ Eigen/src/SVD/SVD.h | 23 ++++++------ test/sparse.cpp | 4 ++ test/triangular.cpp | 1 + 9 files changed, 129 insertions(+), 45 deletions(-) diff --git a/Eigen/src/Cholesky/Cholesky.h b/Eigen/src/Cholesky/Cholesky.h index a64ab7c70..b94fea8dc 100644 --- a/Eigen/src/Cholesky/Cholesky.h +++ b/Eigen/src/Cholesky/Cholesky.h @@ -74,6 +74,9 @@ template class Cholesky template typename Derived::Eval solve(const MatrixBase &b) const; + template + bool solveInPlace(MatrixBase &bAndX) const; + void compute(const MatrixType& matrix); protected: @@ -141,8 +144,37 @@ typename Derived::Eval Cholesky::solve(const MatrixBase &b) { const int size = m_matrix.rows(); ei_assert(size==b.rows()); + typename ei_eval_to_column_major::type x(b); + solveInPlace(x); + return x; + //return m_matrix.adjoint().template part().solveTriangular(matrixL().solveTriangular(b)); +} - return m_matrix.adjoint().template part().solveTriangular(matrixL().solveTriangular(b)); +/** Computes the solution x of \f$ A x = b \f$ using the current decomposition of A. + * The result is stored in \a bAndX + * + * \returns true in case of success, false otherwise. + * + * In other words, it computes \f$ b = A^{-1} b \f$ with + * \f$ {L^{*}}^{-1} L^{-1} b \f$ from right to left.
+ * \param bAndX stores both the matrix \f$ b \f$ and the result \f$ x \f$ + * + * Example: \include Cholesky_solve.cpp + * Output: \verbinclude Cholesky_solve.out + * + * \sa MatrixBase::cholesky(), Cholesky::solve() + */ +template +template +bool Cholesky::solveInPlace(MatrixBase &bAndX) const +{ + const int size = m_matrix.rows(); + ei_assert(size==bAndX.rows()); + if (!m_isPositiveDefinite) + return false; + matrixL().solveTriangularInPlace(bAndX); + m_matrix.adjoint().template part().solveTriangularInPlace(bAndX); + return true; } /** \cholesky_module diff --git a/Eigen/src/Cholesky/CholeskyWithoutSquareRoot.h b/Eigen/src/Cholesky/CholeskyWithoutSquareRoot.h index 4040869b0..fd111fb1f 100644 --- a/Eigen/src/Cholesky/CholeskyWithoutSquareRoot.h +++ b/Eigen/src/Cholesky/CholeskyWithoutSquareRoot.h @@ -71,6 +71,9 @@ template class CholeskyWithoutSquareRoot template typename Derived::Eval solve(const MatrixBase &b) const; + template + bool solveInPlace(MatrixBase &bAndX) const; + void compute(const MatrixType& matrix); protected: @@ -101,7 +104,7 @@ void CholeskyWithoutSquareRoot::compute(const MatrixType& a) m_matrix = a; return; } - + // Let's preallocate a temporay vector to evaluate the matrix-vector product into it. // Unlike the standard Cholesky decomposition, here we cannot evaluate it to the destination // matrix because it a sub-row which is not compatible suitable for efficient packet evaluation. @@ -144,8 +147,8 @@ void CholeskyWithoutSquareRoot::compute(const MatrixType& a) * \param b the column vector \f$ b \f$, which can also be a matrix. * * See Cholesky::solve() for a example. - * - * \sa MatrixBase::choleskyNoSqrt() + * + * \sa CholeskyWithoutSquareRoot::solveInPlace(), MatrixBase::choleskyNoSqrt() */ template template @@ -161,6 +164,34 @@ typename Derived::Eval CholeskyWithoutSquareRoot::solve(const Matrix ); } +/** Computes the solution x of \f$ A x = b \f$ using the current decomposition of A. 
+ * The result is stored in \a bAndX + * + * \returns true in case of success, false otherwise. + * + * In other words, it computes \f$ b = A^{-1} b \f$ with + * \f$ {L^{*}}^{-1} D^{-1} L^{-1} b \f$ from right to left. + * \param bAndX stores both the matrix \f$ b \f$ and the result \f$ x \f$ + * + * Example: \include Cholesky_solve.cpp + * Output: \verbinclude Cholesky_solve.out + * + * \sa MatrixBase::choleskyNoSqrt(), CholeskyWithoutSquareRoot::solve() + */ +template +template +bool CholeskyWithoutSquareRoot::solveInPlace(MatrixBase &bAndX) const +{ + const int size = m_matrix.rows(); + ei_assert(size==bAndX.rows()); + if (!m_isPositiveDefinite) + return false; + matrixL().solveTriangularInPlace(bAndX); + bAndX *= m_matrix.cwise().inverse().template part(); + m_matrix.adjoint().template part().solveTriangularInPlace(bAndX); + return true; +} + /** \cholesky_module * \returns the Cholesky decomposition without square root of \c *this */ diff --git a/Eigen/src/Core/MatrixBase.h b/Eigen/src/Core/MatrixBase.h index 2e8355f77..944d353d8 100644 --- a/Eigen/src/Core/MatrixBase.h +++ b/Eigen/src/Core/MatrixBase.h @@ -320,7 +320,8 @@ template class MatrixBase Derived& operator*=(const MatrixBase& other); template - typename OtherDerived::Eval solveTriangular(const MatrixBase& other) const; + typename ei_eval_to_column_major::type + solveTriangular(const MatrixBase& other) const; template void solveTriangularInPlace(MatrixBase& other) const; @@ -544,11 +545,11 @@ template class MatrixBase const Select select(const MatrixBase& thenMatrix, const MatrixBase& elseMatrix) const; - + template inline const Select > select(const MatrixBase& thenMatrix, typename ThenDerived::Scalar elseScalar) const; - + template inline const Select, ElseDerived > select(typename ElseDerived::Scalar thenScalar, const MatrixBase& elseMatrix) const; @@ -581,7 +582,7 @@ template class MatrixBase template EvalType cross(const MatrixBase& other) const; EvalType unitOrthogonal(void) const; - + #ifdef
EIGEN_MATRIXBASE_PLUGIN #include EIGEN_MATRIXBASE_PLUGIN #endif diff --git a/Eigen/src/Core/Product.h b/Eigen/src/Core/Product.h index 04deae0ab..429cdc0e9 100644 --- a/Eigen/src/Core/Product.h +++ b/Eigen/src/Core/Product.h @@ -36,8 +36,6 @@ struct ei_product_coeff_impl; template struct ei_product_packet_impl; -template struct ei_product_eval_to_column_major; - /** \class ProductReturnType * * \brief Helper class to get the correct and optimized returned type of operator* @@ -70,7 +68,7 @@ struct ProductReturnType typedef typename ei_nested::type LhsNested; typedef typename ei_nested::type + typename ei_eval_to_column_major::type >::type RhsNested; typedef Product Type; @@ -706,23 +704,12 @@ inline Derived& MatrixBase::lazyAssign(const Product struct ei_product_eval_to_column_major -{ - typedef Matrix::Scalar, - ei_traits::RowsAtCompileTime, - ei_traits::ColsAtCompileTime, - ColMajor, - ei_traits::MaxRowsAtCompileTime, - ei_traits::MaxColsAtCompileTime - > type; -}; - template struct ei_product_copy_rhs { typedef typename ei_meta_if< (ei_traits::Flags & RowMajorBit) || (!(ei_traits::Flags & DirectAccessBit)), - typename ei_product_eval_to_column_major::type, + typename ei_eval_to_column_major::type, const T& >::ret type; }; diff --git a/Eigen/src/Core/SolveTriangular.h b/Eigen/src/Core/SolveTriangular.h index e77d9e238..ea0956ab3 100755 --- a/Eigen/src/Core/SolveTriangular.h +++ b/Eigen/src/Core/SolveTriangular.h @@ -88,12 +88,12 @@ struct ei_solve_triangular_selector other.coeffRef(i,c) = tmp/lhs.coeff(i,i); } - // now let process the remaining rows 4 at once + // now let's process the remaining rows 4 at once for(int i=blockyStart; IsLower ? i0; ) { int startBlock = i; int endBlock = startBlock + (IsLower ? 4 : -4); - + /* Process the i cols times 4 rows block, and keep the result in a temporary vector */ // FIXME use fixed size block but take care to small fixed size matrices... 
Matrix btmp(4); @@ -101,7 +101,7 @@ struct ei_solve_triangular_selector btmp = lhs.block(startBlock,0,4,i) * other.col(c).start(i); else btmp = lhs.block(i-3,i+1,4,size-1-i) * other.col(c).end(size-1-i); - + /* Let's process the 4x4 sub-matrix as usual. * btmp stores the diagonal coefficients used to update the remaining part of the result. */ @@ -191,6 +191,12 @@ struct ei_solve_triangular_selector &(lhs.const_cast_derived().coeffRef(IsLower ? endBlock : 0, IsLower ? startBlock : endBlock+1)), lhs.stride(), btmp, &(other.coeffRef(IsLower ? endBlock : 0, c))); +// if (IsLower) +// other.col(c).end(size-endBlock) += (lhs.block(endBlock, startBlock, size-endBlock, endBlock-startBlock) +// * other.col(c).block(startBlock,endBlock-startBlock)).lazy(); +// else +// other.col(c).end(size-endBlock) += (lhs.block(endBlock, startBlock, size-endBlock, endBlock-startBlock) +// * other.col(c).block(startBlock,endBlock-startBlock)).lazy(); } /* Now we have to process the remaining part as usual */ @@ -227,7 +233,15 @@ void MatrixBase::solveTriangularInPlace(MatrixBase& other ei_assert(!(Flags & ZeroDiagBit)); ei_assert(Flags & (UpperTriangularBit|LowerTriangularBit)); - ei_solve_triangular_selector::run(derived(), other.derived()); + const bool copy = ei_traits::Flags&RowMajorBit; + typedef typename ei_meta_if::type, OtherDerived&>::ret OtherCopy; + OtherCopy otherCopy(other.derived()); + + ei_solve_triangular_selector::type>::run(derived(), otherCopy); + + if (copy) + other = otherCopy; } /** \returns the product of the inverse of \c *this with \a other, \a *this being triangular. @@ -240,17 +254,17 @@ void MatrixBase::solveTriangularInPlace(MatrixBase& other * It is required that \c *this be marked as either an upper or a lower triangular matrix, which * can be done by marked(), and that is automatically the case with expressions such as those returned * by extract(). - * + * * \addexample SolveTriangular \label How to solve a triangular system (aka. 
how to multiply the inverse of a triangular matrix by another one) - * + * * Example: \include MatrixBase_marked.cpp * Output: \verbinclude MatrixBase_marked.out - * + * * This function is essentially a wrapper to the faster solveTriangularInPlace() function creating * a temporary copy of \a other, calling solveTriangularInPlace() on the copy and returning it. * Therefore, if \a other is not needed anymore, it is quite faster to call solveTriangularInPlace() * instead of solveTriangular(). - * + * * For users coming from BLAS, this function (and more specifically solveTriangularInPlace()) offer * all the operations supported by the \c *TRSV and \c *TRSM BLAS routines. * @@ -258,14 +272,15 @@ void MatrixBase::solveTriangularInPlace(MatrixBase& other * \code * M * T^1 <=> T.transpose().solveTriangularInPlace(M.transpose()); * \endcode - * + * * \sa solveTriangularInPlace(), marked(), extract() */ template template -typename OtherDerived::Eval MatrixBase::solveTriangular(const MatrixBase& other) const +typename ei_eval_to_column_major::type +MatrixBase::solveTriangular(const MatrixBase& other) const { - typename OtherDerived::Eval res(other); + typename ei_eval_to_column_major::type res(other); solveTriangularInPlace(res); return res; } diff --git a/Eigen/src/Core/util/XprHelper.h b/Eigen/src/Core/util/XprHelper.h index 00f1a39ea..5b8a2c021 100644 --- a/Eigen/src/Core/util/XprHelper.h +++ b/Eigen/src/Core/util/XprHelper.h @@ -121,6 +121,18 @@ template struct ei_eval > type; }; + +template struct ei_eval_to_column_major +{ + typedef Matrix::Scalar, + ei_traits::RowsAtCompileTime, + ei_traits::ColsAtCompileTime, + ColMajor, + ei_traits::MaxRowsAtCompileTime, + ei_traits::MaxColsAtCompileTime + > type; +}; + template struct ei_must_nest_by_value { enum { ret = false }; }; template struct ei_must_nest_by_value > { enum { ret = true }; }; diff --git a/Eigen/src/SVD/SVD.h b/Eigen/src/SVD/SVD.h index 39020fdfc..c3f3bb235 100644 --- a/Eigen/src/SVD/SVD.h +++ 
b/Eigen/src/SVD/SVD.h @@ -50,16 +50,16 @@ template class SVD AlignmentMask = int(PacketSize)-1, MinSize = EIGEN_ENUM_MIN(MatrixType::RowsAtCompileTime, MatrixType::ColsAtCompileTime) }; - + typedef Matrix ColVector; typedef Matrix RowVector; - + typedef Matrix MatrixUType; typedef Matrix MatrixVType; typedef Matrix SingularValuesType; public: - + SVD(const MatrixType& matrix) : m_matU(matrix.rows(), std::min(matrix.rows(), matrix.cols())), m_matV(matrix.cols(),matrix.cols()), @@ -69,7 +69,7 @@ template class SVD } template - void solve(const MatrixBase &b, ResultType* result) const; + bool solve(const MatrixBase &b, ResultType* result) const; const MatrixUType& matrixU() const { return m_matU; } const SingularValuesType& singularValues() const { return m_sigma; } @@ -97,7 +97,7 @@ void SVD::compute(const MatrixType& matrix) const int m = matrix.rows(); const int n = matrix.cols(); const int nu = std::min(m,n); - + m_matU.resize(m, nu); m_matU.setZero(); m_sigma.resize(std::min(m,n)); @@ -130,7 +130,7 @@ void SVD::compute(const MatrixType& matrix) } m_sigma[k] = -m_sigma[k]; } - + for (j = k+1; j < n; j++) { if ((k < nct) && (m_sigma[k] != 0.0)) @@ -468,18 +468,18 @@ void SVD::compute(const MatrixType& matrix) template SVD& SVD::sort() { - int mu = m_matU.rows(); - int mv = m_matV.rows(); + int mu = m_matU.rows(); + int mv = m_matV.rows(); int n = m_matU.cols(); for (int i=0; i p) + if (m_sigma.coeff(j) > p) { k = j; p = m_sigma.coeff(j); @@ -509,7 +509,7 @@ SVD& SVD::sort() */ template template -void SVD::solve(const MatrixBase &b, ResultType* result) const +bool SVD::solve(const MatrixBase &b, ResultType* result) const { const int rows = m_matU.rows(); ei_assert(b.rows() == rows); @@ -530,6 +530,7 @@ void SVD::solve(const MatrixBase &b, ResultType* resul result->col(j) = m_matV * aux; } + return true; } /** \svd_module diff --git a/test/sparse.cpp b/test/sparse.cpp index 040f889cb..39ea05b8b 100644 --- a/test/sparse.cpp +++ b/test/sparse.cpp @@ -217,6 +217,10 @@ 
template void sparse(int rows, int cols) // TODO test row major } + // test Cholesky + { + } + } void test_sparse() diff --git a/test/triangular.cpp b/test/triangular.cpp index 2ada0dd90..34afa7b3c 100644 --- a/test/triangular.cpp +++ b/test/triangular.cpp @@ -125,5 +125,6 @@ void test_triangular() CALL_SUBTEST( triangular(MatrixXcf(4, 4)) ); CALL_SUBTEST( triangular(Matrix,8, 8>()) ); CALL_SUBTEST( triangular(MatrixXd(17,17)) ); + CALL_SUBTEST( triangular(Matrix(5, 5)) ); } }