From e9e5261664cc77049f8b77a2c36c535fbd44889c Mon Sep 17 00:00:00 2001 From: Gael Guennebaud Date: Sat, 26 Jul 2008 23:05:44 +0000 Subject: [PATCH] Fix a couple issues introduced in the previous commit: * removed DirectAccessBit from Part * use a template specialization in inverseProduct() to transform a Part xpr to a Flagged xpr --- Eigen/src/Core/InverseProduct.h | 29 +++++++++++++++++++++++------ Eigen/src/Core/MatrixBase.h | 4 ++-- Eigen/src/Core/Part.h | 5 ++++- Eigen/src/Core/Product.h | 16 ++++++++++++++-- Eigen/src/Geometry/OrthoMethods.h | 8 ++++---- 5 files changed, 47 insertions(+), 15 deletions(-) diff --git a/Eigen/src/Core/InverseProduct.h b/Eigen/src/Core/InverseProduct.h index 87f426af5..cfab54228 100755 --- a/Eigen/src/Core/InverseProduct.h +++ b/Eigen/src/Core/InverseProduct.h @@ -25,8 +25,12 @@ #ifndef EIGEN_INVERSEPRODUCT_H #define EIGEN_INVERSEPRODUCT_H +template struct ei_is_part { enum {value=false}; }; +template struct ei_is_part > { enum {value=true}; }; + template::value ? -1 // this is to solve ambiguous specializations + : (int(Lhs::Flags) & LowerTriangularBit) ? Lower : (int(Lhs::Flags) & UpperTriangularBit) ? Upper @@ -35,6 +39,16 @@ template struct ei_trisolve_selector; +// transform a Part xpr to a Flagged xpr +template +struct ei_trisolve_selector,Rhs,TriangularPart,StorageOrder> +{ + static void run(const Part& lhs, Rhs& other) + { + ei_trisolve_selector,Rhs>::run(lhs._expression(), other); + } +}; + // forward substitution, row-major template struct ei_trisolve_selector @@ -102,12 +116,12 @@ struct ei_trisolve_selector int blockyEnd = (std::max(size-5,0)/4)*4; for(int i=0; i btmp; /* Let's process the 4x4 sub-matrix as usual. * btmp stores the diagonal coefficients used to update the remaining part of the result. */ + int startBlock = i; + int endBlock = startBlock+4; + Matrix btmp; for (;i { if(!(Lhs::Flags & UnitDiagBit)) other.coeffRef(i,c) /= lhs.coeff(i,i); - // NOTE we cannot use lhs.col(i).end(size-i-1) because Part::coeffRef gets called by .col() to - // get the address of the start of the row + + /* NOTE we cannot use lhs.col(i).end(size-i-1) because Part::coeffRef gets called by .col() to + * get the address of the start of the row + */ other.col(c).end(size-i-1) -= other.coeffRef(i,c) * Block(lhs, i+1,i, size-i-1,1); } if(!(Lhs::Flags & UnitDiagBit)) @@ -146,6 +162,7 @@ struct ei_trisolve_selector }; // backward substitution, col-major +// see the previous specialization for details on the algorithm template struct ei_trisolve_selector { diff --git a/Eigen/src/Core/MatrixBase.h b/Eigen/src/Core/MatrixBase.h index dbc251199..1e9d0d958 100644 --- a/Eigen/src/Core/MatrixBase.h +++ b/Eigen/src/Core/MatrixBase.h @@ -32,7 +32,7 @@ * This class is the base that is inherited by all matrix, vector, and expression * types. Most of the Eigen API is contained in this class. Other important classes for * the Eigen API are Matrix, Cwise, and PartialRedux. - * + * * Note that some methods are defined in the \ref Array module. * * \param Derived is the derived type, e.g. a matrix type, or an expression, etc. @@ -550,7 +550,7 @@ template class MatrixBase template typename ei_eval::type cross(const MatrixBase& other) const; - typename ei_eval::type perpendicular(void) const; + typename ei_eval::type someOrthogonal(void) const; }; #endif // EIGEN_MATRIXBASE_H diff --git a/Eigen/src/Core/Part.h b/Eigen/src/Core/Part.h index 1a7c7f82a..871e27427 100644 --- a/Eigen/src/Core/Part.h +++ b/Eigen/src/Core/Part.h @@ -53,7 +53,7 @@ struct ei_traits > ColsAtCompileTime = MatrixType::ColsAtCompileTime, MaxRowsAtCompileTime = MatrixType::MaxRowsAtCompileTime, MaxColsAtCompileTime = MatrixType::MaxColsAtCompileTime, - Flags = (_MatrixTypeNested::Flags & (HereditaryBits | DirectAccessBit) & (~(PacketAccessBit | LinearAccessBit))) | Mode, + Flags = (_MatrixTypeNested::Flags & (HereditaryBits) & (~(PacketAccessBit | DirectAccessBit | LinearAccessBit))) | Mode, CoeffReadCost = _MatrixTypeNested::CoeffReadCost }; }; @@ -109,6 +109,9 @@ template class Part return m_matrix.const_cast_derived().coeffRef(row, col); } + /** \internal */ + const MatrixType& _expression() const { return m_matrix; } + /** discard any writes to a row */ const Block row(int i) { return Base::row(i); } const Block row(int i) const { return Base::row(i); } diff --git a/Eigen/src/Core/Product.h b/Eigen/src/Core/Product.h index bf491b765..9a0365939 100644 --- a/Eigen/src/Core/Product.h +++ b/Eigen/src/Core/Product.h @@ -378,7 +378,7 @@ struct ei_product_coeff_vectorized_dyn_selector } }; -// NOTE the 2 following specializations are because taking .col(0) on a vector is a bit slower +// NOTE the 3 following specializations are because taking .col(0) on a vector is a bit slower template struct ei_product_coeff_vectorized_dyn_selector { @@ -403,6 +403,18 @@ struct ei_product_coeff_vectorized_dyn_selector } }; +template +struct ei_product_coeff_vectorized_dyn_selector +{ + inline static void run(int row, int /*col*/, const Lhs& lhs, const Rhs& rhs, typename Lhs::Scalar &res) + { + res = ei_dot_impl< + Lhs, + Rhs, + LinearVectorization, NoUnrolling>::run(lhs, rhs); + } +}; + template struct ei_product_coeff_impl { @@ -518,7 +530,7 @@ struct ei_cache_friendly_product_selector struct ei_cache_friendly_product_selector { diff --git a/Eigen/src/Geometry/OrthoMethods.h b/Eigen/src/Geometry/OrthoMethods.h index 5955ce223..ea71c12d2 100644 --- a/Eigen/src/Geometry/OrthoMethods.h +++ b/Eigen/src/Geometry/OrthoMethods.h @@ -23,8 +23,8 @@ // License and a copy of the GNU General Public License along with // Eigen. If not, see . -#ifndef EIGEN_CROSS_H -#define EIGEN_CROSS_H +#ifndef EIGEN_ORTHOMETHODS_H +#define EIGEN_ORTHOMETHODS_H /** \geometry_module * \returns the cross product of \c *this and \a other */ @@ -34,7 +34,7 @@ inline typename ei_eval::type MatrixBase::cross(const MatrixBase& other) const { EIGEN_STATIC_ASSERT_VECTOR_SPECIFIC_SIZE(Derived,3); - + // Note that there is no need for an expression here since the compiler // optimize such a small temporary very well (even within a complex expression) const typename ei_nested::type lhs(derived()); @@ -107,4 +107,4 @@ MatrixBase::someOrthogonal() const return ei_perpendicular_selector::run(derived()); } -#endif // EIGEN_CROSS_H +#endif // EIGEN_ORTHOMETHODS_H