* vectorize dot product, copying code from sum.

* make the conj functor vectorizable: it is just identity in real case, and complex doesn't use the vectorized path anyway. * fix bug in Block: a 3x1 block in a 4x4 matrix (all fixed-size) should not be vectorizable, since in fixed-size we are assuming the size to be a multiple of packet size. (Or would you prefer Vector3d to be flagged "packetaccess" even though no packet access is possible on vectors of that type?) * rename: isOrtho for vectors ---> isOrthogonal isOrtho for matrices ---> isUnitary * add normalize() * reimplement normalized with quotient1 functor
2025-03-31 19:00:35 +08:00 · 2008-06-24 15:13:00 +00:00 · 2008-06-24 15:13:00 +00:00 · 3b94436d2f
commit 3b94436d2f
parent c9560df4a0
12 changed files with 270 additions and 69 deletions
--- a/Eigen/src/Core/Block.h
+++ b/Eigen/src/Core/Block.h
@ -67,14 +67,18 @@ struct ei_traits<Block<MatrixType, BlockRows, BlockCols> >
      : (BlockRows==Dynamic ? MatrixType::MaxRowsAtCompileTime : BlockRows),
    MaxColsAtCompileTime = ColsAtCompileTime == 1 ? 1
      : (BlockCols==Dynamic ? MatrixType::MaxColsAtCompileTime : BlockCols),
-    FlagsMaskLargeBit = ((RowsAtCompileTime != Dynamic && MatrixType::RowsAtCompileTime == Dynamic)
-                      || (ColsAtCompileTime != Dynamic && MatrixType::ColsAtCompileTime == Dynamic))
-                      ? ~LargeBit
-                      : ~(unsigned int)0,
+    MaskLargeBit = ((RowsAtCompileTime != Dynamic && MatrixType::RowsAtCompileTime == Dynamic)
+                  || (ColsAtCompileTime != Dynamic && MatrixType::ColsAtCompileTime == Dynamic))
+                   ? ~LargeBit
+                   : ~(unsigned int)0,
+    MaskPacketAccessBit = ei_corrected_matrix_flags<
+                            Scalar, RowsAtCompileTime, ColsAtCompileTime,
+                            MaxRowsAtCompileTime, MaxColsAtCompileTime, MatrixType::Flags
+                          >::ret & PacketAccessBit,
    FlagsLinearAccessBit = MatrixType::Flags & RowMajorBit
                        ? (RowsAtCompileTime == 1 ? LinearAccessBit : 0)
                        : (ColsAtCompileTime == 1 ? LinearAccessBit : 0),
-    Flags = (MatrixType::Flags & (HereditaryBits | PacketAccessBit | DirectAccessBit) & FlagsMaskLargeBit)
+    Flags = (MatrixType::Flags & (HereditaryBits | MaskPacketAccessBit | DirectAccessBit) & MaskLargeBit)
          | FlagsLinearAccessBit,
    CoeffReadCost = MatrixType::CoeffReadCost
  };
--- a/Eigen/src/Core/Dot.h
+++ b/Eigen/src/Core/Dot.h
@ -25,43 +25,222 @@
 #ifndef EIGEN_DOT_H
 #define EIGEN_DOT_H

-template<int Index, int Size, typename Derived1, typename Derived2>
-struct ei_dot_impl
+/***************************************************************************
+* Part 1 : the logic deciding a strategy for vectorization and unrolling
+***************************************************************************/
+
+template<typename Derived1, typename Derived2>
+struct ei_dot_traits
 {
-  inline static void run(const Derived1 &v1, const Derived2& v2, typename Derived1::Scalar &dot)
+public:
+  enum {
+    Vectorization = (int(Derived1::Flags)&int(Derived2::Flags)&PacketAccessBit)
+                 && (int(Derived1::Flags)&int(Derived2::Flags)&LinearAccessBit)
+                  ? LinearVectorization
+                  : NoVectorization
+  };
+
+private:
+  typedef typename Derived1::Scalar Scalar;
+  enum {
+    PacketSize = ei_packet_traits<Scalar>::size,
+    Cost = Derived1::SizeAtCompileTime * (Derived1::CoeffReadCost + Derived2::CoeffReadCost + NumTraits<Scalar>::MulCost)
+           + (Derived1::SizeAtCompileTime-1) * NumTraits<Scalar>::AddCost,
+    UnrollingLimit = EIGEN_UNROLLING_LIMIT * (int(Vectorization) == int(NoVectorization) ? 1 : int(PacketSize))
+  };
+
+public:
+  enum {
+    Unrolling = Cost <= UnrollingLimit
+              ? CompleteUnrolling
+              : NoUnrolling
+  };
+};
+
+/***************************************************************************
+* Part 2 : unrollers
+***************************************************************************/
+
+/*** no vectorization ***/
+
+template<typename Derived1, typename Derived2, int Start, int Length>
+struct ei_dot_novec_unroller
+{
+  enum {
+    HalfLength = Length/2
+  };
+
+  typedef typename Derived1::Scalar Scalar;
+
+  inline static Scalar run(const Derived1& v1, const Derived2& v2)
  {
-    ei_dot_impl<Index-1, Size, Derived1, Derived2>::run(v1, v2, dot);
-    dot += v1.coeff(Index) * ei_conj(v2.coeff(Index));
+    return ei_dot_novec_unroller<Derived1, Derived2, Start, HalfLength>::run(v1, v2)
+         + ei_dot_novec_unroller<Derived1, Derived2, Start+HalfLength, Length-HalfLength>::run(v1, v2);
  }
 };

-template<int Size, typename Derived1, typename Derived2>
-struct ei_dot_impl<0, Size, Derived1, Derived2>
+template<typename Derived1, typename Derived2, int Start>
+struct ei_dot_novec_unroller<Derived1, Derived2, Start, 1>
 {
-  inline static void run(const Derived1 &v1, const Derived2& v2, typename Derived1::Scalar &dot)
+  typedef typename Derived1::Scalar Scalar;
+
+  inline static Scalar run(const Derived1& v1, const Derived2& v2)
  {
-    dot = v1.coeff(0) * ei_conj(v2.coeff(0));
+    return v1.coeff(Start) * ei_conj(v2.coeff(Start));
+  }
+};
+
+/*** vectorization ***/
+
+template<typename Derived1, typename Derived2, int Index, int Stop,
+         bool LastPacket = (Stop-Index == ei_packet_traits<typename Derived1::Scalar>::size)>
+struct ei_dot_vec_unroller
+{
+  typedef typename Derived1::Scalar Scalar;
+  typedef typename ei_packet_traits<Scalar>::type PacketScalar;
+
+  enum {
+    row1 = Derived1::RowsAtCompileTime == 1 ? 0 : Index,
+    col1 = Derived1::RowsAtCompileTime == 1 ? Index : 0,
+    row2 = Derived2::RowsAtCompileTime == 1 ? 0 : Index,
+    col2 = Derived2::RowsAtCompileTime == 1 ? Index : 0
+  };
+
+  inline static PacketScalar run(const Derived1& v1, const Derived2& v2)
+  {
+    return ei_padd(
+      ei_pmul(v1.template packet<Aligned>(row1, col1), v2.template packet<Aligned>(row2, col2)),
+      ei_dot_vec_unroller<Derived1, Derived2, Index+ei_packet_traits<Scalar>::size, Stop>::run(v1, v2)
+    );
+  }
+};
+
+template<typename Derived1, typename Derived2, int Index, int Stop>
+struct ei_dot_vec_unroller<Derived1, Derived2, Index, Stop, true>
+{
+  enum {
+    row1 = Derived1::RowsAtCompileTime == 1 ? 0 : Index,
+    col1 = Derived1::RowsAtCompileTime == 1 ? Index : 0,
+    row2 = Derived2::RowsAtCompileTime == 1 ? 0 : Index,
+    col2 = Derived2::RowsAtCompileTime == 1 ? Index : 0
+  };
+
+  typedef typename Derived1::Scalar Scalar;
+  typedef typename ei_packet_traits<Scalar>::type PacketScalar;
+
+  inline static PacketScalar run(const Derived1& v1, const Derived2& v2)
+  {
+    return ei_pmul(v1.template packet<Aligned>(row1, col1), v2.template packet<Aligned>(row2, col2));
+  }
+};
+
+/***************************************************************************
+* Part 3 : implementation of all cases
+***************************************************************************/
+
+template<typename Derived1, typename Derived2,
+         int Vectorization = ei_dot_traits<Derived1, Derived2>::Vectorization,
+         int Unrolling = ei_dot_traits<Derived1, Derived2>::Unrolling
+>
+struct ei_dot_impl;
+
+template<typename Derived1, typename Derived2>
+struct ei_dot_impl<Derived1, Derived2, NoVectorization, NoUnrolling>
+{
+  typedef typename Derived1::Scalar Scalar;
+  static Scalar run(const Derived1& v1, const Derived2& v2)
+  {
+    Scalar res;
+    res = v1.coeff(0) * ei_conj(v2.coeff(0));
+    for(int i = 1; i < v1.size(); i++)
+      res += v1.coeff(i) * ei_conj(v2.coeff(i));
+    return res;
  }
 };

 template<typename Derived1, typename Derived2>
-struct ei_dot_impl<Dynamic, Dynamic, Derived1, Derived2>
+struct ei_dot_impl<Derived1, Derived2, NoVectorization, CompleteUnrolling>
+  : public ei_dot_novec_unroller<Derived1, Derived2, 0, Derived1::SizeAtCompileTime>
+{};
+
+template<typename Derived1, typename Derived2>
+struct ei_dot_impl<Derived1, Derived2, LinearVectorization, NoUnrolling>
 {
-  inline static void run(const Derived1& v1, const Derived2& v2, typename Derived1::Scalar& dot)
+  typedef typename Derived1::Scalar Scalar;
+  typedef typename ei_packet_traits<Scalar>::type PacketScalar;
+
+  static Scalar run(const Derived1& v1, const Derived2& v2)
  {
-    dot = v1.coeff(0) * ei_conj(v2.coeff(0));
-    for(int i = 1; i < v1.size(); i++)
-      dot += v1.coeff(i)* ei_conj(v2.coeff(i));
+    const int size = v1.size();
+    const int packetSize = ei_packet_traits<Scalar>::size;
+    const int alignedSize = (size/packetSize)*packetSize;
+    const bool rowVector1 = Derived1::RowsAtCompileTime == 1;
+    const bool rowVector2 = Derived2::RowsAtCompileTime == 1;
+    Scalar res;
+
+    // do the vectorizable part of the sum
+    if(size >= packetSize)
+    {
+      PacketScalar packet_res;
+      packet_res = ei_pmul(
+                         v1.template packet<Aligned>(0, 0),
+                         v2.template packet<Aligned>(0, 0)
+                   );
+      for(int index = packetSize; index<alignedSize; index += packetSize)
+      {
+        const int row1 = rowVector1 ? 0 : index;
+        const int col1 = rowVector1 ? index : 0;
+        const int row2 = rowVector2 ? 0 : index;
+        const int col2 = rowVector2 ? index : 0;
+        packet_res = ei_padd(
+                       packet_res,
+                       ei_pmul(
+                         v1.template packet<Aligned>(row1, col1),
+                         v2.template packet<Aligned>(row2, col2)
+                       )
+                     );
+      }
+      res = ei_predux(packet_res);
+
+      // now we must do the rest without vectorization.
+      if(alignedSize == size) return res;
+    }
+    else // too small to vectorize anything.
+         // since this is dynamic-size hence inefficient anyway for such small sizes, don't try to optimize.
+    {
+      res = Scalar(0);
+    }
+
+    // do the remainder of the vector
+    for(int index = alignedSize; index < size; index++)
+    {
+      const int row1 = rowVector1 ? 0 : index;
+      const int col1 = rowVector1 ? index : 0;
+      const int row2 = rowVector2 ? 0 : index;
+      const int col2 = rowVector2 ? index : 0;
+      res += v1.coeff(row1, col1) * v2.coeff(row2, col2);
+    }
+
+    return res;
  }
 };

-// prevent buggy user code from causing an infinite recursion
-template<int Index, typename Derived1, typename Derived2>
-struct ei_dot_impl<Index, 0, Derived1, Derived2>
+template<typename Derived1, typename Derived2>
+struct ei_dot_impl<Derived1, Derived2, LinearVectorization, CompleteUnrolling>
 {
-  inline static void run(const Derived1&, const Derived2&, typename Derived1::Scalar&) {}
+  typedef typename Derived1::Scalar Scalar;
+  static Scalar run(const Derived1& v1, const Derived2& v2)
+  {
+    return ei_predux(
+      ei_dot_vec_unroller<Derived1, Derived2, 0, Derived1::SizeAtCompileTime>::run(v1, v2)
+    );
+  }
 };

+/***************************************************************************
+* Part 4 : implementation of MatrixBase methods
+***************************************************************************/
+
 /** \returns the dot product of *this with other.
  *
  * \only_for_vectors
@ -81,24 +260,13 @@ MatrixBase<Derived>::dot(const MatrixBase<OtherDerived>& other) const
  typedef typename OtherDerived::Nested OtherNested;
  typedef typename ei_unref<Nested>::type _Nested;
  typedef typename ei_unref<OtherNested>::type _OtherNested;
-  Nested nested(derived());
-  OtherNested otherNested(other.derived());

  EIGEN_STATIC_ASSERT_VECTOR_ONLY(_Nested);
  EIGEN_STATIC_ASSERT_VECTOR_ONLY(_OtherNested);
  EIGEN_STATIC_ASSERT_SAME_VECTOR_SIZE(_Nested,_OtherNested);
-  ei_assert(nested.size() == otherNested.size());
-  const bool unroll = SizeAtCompileTime
-                      * (_Nested::CoeffReadCost + _OtherNested::CoeffReadCost + NumTraits<Scalar>::MulCost)
-                      + (int(SizeAtCompileTime) - 1) * NumTraits<Scalar>::AddCost
-                      <= EIGEN_UNROLLING_LIMIT;
+  ei_assert(size() == other.size());

-  Scalar res;
-  ei_dot_impl<unroll ? int(SizeAtCompileTime)-1 : Dynamic,
-              unroll ? int(SizeAtCompileTime) : Dynamic,
-              _Nested, _OtherNested>
-    ::run(nested, otherNested, res);
-  return res;
+  return ei_dot_impl<_Nested, _OtherNested>::run(derived(), other.derived());
 }

 /** \returns the squared norm of *this, i.e. the dot product of *this with itself.
@ -129,24 +297,36 @@ inline typename NumTraits<typename ei_traits<Derived>::Scalar>::Real MatrixBase<
  *
  * \only_for_vectors
  *
-  * \sa norm()
+  * \sa norm(), normalize()
  */
 template<typename Derived>
-inline const typename MatrixBase<Derived>::ScalarMultipleReturnType
+inline const typename MatrixBase<Derived>::ScalarQuotient1ReturnType
 MatrixBase<Derived>::normalized() const
 {
-  return (*this) * (RealScalar(1)/norm());
+  return *this / norm();
+}
+
+/** Normalizes the vector, i.e. divides it by its own norm.
+  *
+  * \only_for_vectors
+  *
+  * \sa norm(), normalized()
+  */
+template<typename Derived>
+inline void MatrixBase<Derived>::normalize()
+{
+  *this /= norm();
 }

 /** \returns true if *this is approximately orthogonal to \a other,
  *          within the precision given by \a prec.
  *
-  * Example: \include MatrixBase_isOrtho_vector.cpp
-  * Output: \verbinclude MatrixBase_isOrtho_vector.out
+  * Example: \include MatrixBase_isOrthogonal.cpp
+  * Output: \verbinclude MatrixBase_isOrthogonal.out
  */
 template<typename Derived>
 template<typename OtherDerived>
-bool MatrixBase<Derived>::isOrtho
+bool MatrixBase<Derived>::isOrthogonal
 (const MatrixBase<OtherDerived>& other, RealScalar prec) const
 {
  typename ei_nested<Derived,2>::type nested(derived());
@ -159,14 +339,14 @@ bool MatrixBase<Derived>::isOrtho
  *          type is real numbers, a unitary matrix is an orthogonal matrix, whence the name.
  *
  * \note This can be used to check whether a family of vectors forms an orthonormal basis.
-  *       Indeed, \c m.isOrtho() returns true if and only if the columns of m form an
+  *       Indeed, \c m.isUnitary() returns true if and only if the columns (equivalently, the rows) of m form an
  *       orthonormal basis.
  *
-  * Example: \include MatrixBase_isOrtho_matrix.cpp
-  * Output: \verbinclude MatrixBase_isOrtho_matrix.out
+  * Example: \include MatrixBase_isUnitary.cpp
+  * Output: \verbinclude MatrixBase_isUnitary.out
  */
 template<typename Derived>
-bool MatrixBase<Derived>::isOrtho(RealScalar prec) const
+bool MatrixBase<Derived>::isUnitary(RealScalar prec) const
 {
  typename Derived::Nested nested(derived());
  for(int i = 0; i < cols(); i++)
--- a/Eigen/src/Core/Functors.h
+++ b/Eigen/src/Core/Functors.h
@ -169,7 +169,12 @@ template<typename Scalar> struct ei_scalar_abs_op EIGEN_EMPTY_STRUCT {
 };
 template<typename Scalar>
 struct ei_functor_traits<ei_scalar_abs_op<Scalar> >
-{ enum { Cost = NumTraits<Scalar>::AddCost, PacketAccess = false }; };
+{
+  enum {
+    Cost = NumTraits<Scalar>::AddCost,
+    PacketAccess = false // this could actually be vectorized with SSSE3.
+  };
+};

 /** \internal
  * \brief Template functor to compute the squared absolute value of a scalar
@ -194,10 +199,17 @@ struct ei_functor_traits<ei_scalar_abs2_op<Scalar> >
  */
 template<typename Scalar> struct ei_scalar_conjugate_op EIGEN_EMPTY_STRUCT {
  inline const Scalar operator() (const Scalar& a) const { return ei_conj(a); }
+  template<typename PacketScalar>
+  inline const PacketScalar packetOp(const PacketScalar& a) const { return a; }
 };
 template<typename Scalar>
 struct ei_functor_traits<ei_scalar_conjugate_op<Scalar> >
-{ enum { Cost = NumTraits<Scalar>::IsComplex ? NumTraits<Scalar>::AddCost : 0, PacketAccess = false }; };
+{
+  enum {
+    Cost = NumTraits<Scalar>::IsComplex ? NumTraits<Scalar>::AddCost : 0,
+    PacketAccess = int(ei_packet_traits<Scalar>::size)>1
+  };
+};

 /** \internal
  * \brief Template functor to cast a scalar to another type
--- a/Eigen/src/Core/MatrixBase.h
+++ b/Eigen/src/Core/MatrixBase.h
@ -168,8 +168,11 @@ template<typename Derived> class MatrixBase
      typedef Block<Derived, (ei_traits<Derived>::RowsAtCompileTime == 1 ? 1 : Size),
                             (ei_traits<Derived>::ColsAtCompileTime == 1 ? 1 : Size)> Type;
    };
-    /** Represents a product scalar-matrix */
+    /** Represents a scalar multiple of a matrix */
    typedef CwiseUnaryOp<ei_scalar_multiple_op<Scalar>, Derived> ScalarMultipleReturnType;
+    /** Represents a quotient of a matrix by a scalar*/
+    typedef CwiseUnaryOp<ei_scalar_quotient1_op<Scalar>, Derived> ScalarQuotient1ReturnType;
+
    /** the return type of MatrixBase::conjugate() */
    typedef typename ei_meta_if<NumTraits<Scalar>::IsComplex,
                        CwiseUnaryOp<ei_scalar_conjugate_op<Scalar>, Derived>,
@ -280,7 +283,8 @@ template<typename Derived> class MatrixBase
    Scalar dot(const MatrixBase<OtherDerived>& other) const;
    RealScalar norm2() const;
    RealScalar norm()  const;
-    const ScalarMultipleReturnType normalized() const;
+    const ScalarQuotient1ReturnType normalized() const;
+    void normalize();

    Transpose<Derived> transpose();
    const Transpose<Derived> transpose() const;
@ -391,9 +395,9 @@ template<typename Derived> class MatrixBase
    bool isLower(RealScalar prec = precision<Scalar>()) const;

    template<typename OtherDerived>
-    bool isOrtho(const MatrixBase<OtherDerived>& other,
-                 RealScalar prec = precision<Scalar>()) const;
-    bool isOrtho(RealScalar prec = precision<Scalar>()) const;
+    bool isOrthogonal(const MatrixBase<OtherDerived>& other,
+                      RealScalar prec = precision<Scalar>()) const;
+    bool isUnitary(RealScalar prec = precision<Scalar>()) const;

    template<typename OtherDerived>
    inline bool operator==(const MatrixBase<OtherDerived>& other) const
--- a/Eigen/src/Core/Sum.h
+++ b/Eigen/src/Core/Sum.h
@ -184,7 +184,7 @@ struct ei_sum_impl<Derived, LinearVectorization, NoUnrolling>
  static Scalar run(const Derived& mat)
  {
    const int size = mat.size();
-    const int packetSize = ei_packet_traits<typename Derived::Scalar>::size;
+    const int packetSize = ei_packet_traits<Scalar>::size;
    const int alignedSize = (size/packetSize)*packetSize;
    const bool rowMajor = Derived::Flags&RowMajorBit;
    const int innerSize = rowMajor ? mat.cols() : mat.rows();
@ -284,5 +284,4 @@ MatrixBase<Derived>::trace() const
  return diagonal().sum();
 }

-
 #endif // EIGEN_SUM_H
--- a/Eigen/src/Core/util/Constants.h
+++ b/Eigen/src/Core/util/Constants.h
@ -143,10 +143,10 @@ enum DirectionType { Vertical, Horizontal };
 enum ProductEvaluationMode { NormalProduct, CacheFriendlyProduct, DiagonalProduct };

 enum {
-  NoVectorization,
  InnerVectorization,
  LinearVectorization,
-  SliceVectorization
+  SliceVectorization,
+  NoVectorization
 };

 enum {
--- a/doc/snippets/MatrixBase_isOrtho_matrix.cpp
+++ b/doc/snippets/MatrixBase_isOrtho_matrix.cpp
@ -1,5 +0,0 @@
-Matrix3d m = Matrix3d::identity();
-m(0,2) = 1e-4;
-cout << "Here's the matrix m:" << endl << m << endl;
-cout << "m.isOrtho() returns: " << m.isOrtho() << endl;
-cout << "m.isOrtho(1e-3) returns: " << m.isOrtho(1e-3) << endl;
--- a/doc/snippets/MatrixBase_isOrtho_vector.cpp
+++ b/doc/snippets/MatrixBase_isOrtho_vector.cpp
@ -2,5 +2,5 @@ Vector3d v(1,0,0);
 Vector3d w(1e-4,0,1);
 cout << "Here's the vector v:" << endl << v << endl;
 cout << "Here's the vector w:" << endl << w << endl;
-cout << "v.isOrtho(w) returns: " << v.isOrtho(w) << endl;
-cout << "v.isOrtho(w,1e-3) returns: " << v.isOrtho(w,1e-3) << endl;
+cout << "v.isOrthogonal(w) returns: " << v.isOrthogonal(w) << endl;
+cout << "v.isOrthogonal(w,1e-3) returns: " << v.isOrthogonal(w,1e-3) << endl;
--- a/doc/snippets/MatrixBase_isUnitary.cpp
+++ b/doc/snippets/MatrixBase_isUnitary.cpp
@ -0,0 +1,5 @@
+Matrix3d m = Matrix3d::identity();
+m(0,2) = 1e-4;
+cout << "Here's the matrix m:" << endl << m << endl;
+cout << "m.isUnitary() returns: " << m.isUnitary() << endl;
+cout << "m.isUnitary(1e-3) returns: " << m.isUnitary(1e-3) << endl;
--- a/test/adjoint.cpp
+++ b/test/adjoint.cpp
@ -56,9 +56,6 @@ template<typename MatrixType> void adjoint(const MatrixType& m)
  VERIFY_IS_APPROX(m1.adjoint().conjugate().transpose(),    m1);

  // check multiplicative behavior
-  std::cout << (m1.adjoint() * m2).adjoint() << std::endl;
-  std::cout << "------------------------------" << std::endl;
-  std::cout << m2.adjoint() * m1 << std::endl;
  VERIFY_IS_APPROX((m1.adjoint() * m2).adjoint(),           m2.adjoint() * m1);
  VERIFY_IS_APPROX((s1 * m1).adjoint(),                     ei_conj(s1) * m1.adjoint());

--- a/test/cwiseop.cpp
+++ b/test/cwiseop.cpp
@ -59,7 +59,12 @@ template<typename MatrixType> void cwiseops(const MatrixType& m)

  VERIFY_IS_APPROX(               mzero,    m1-m1);
  VERIFY_IS_APPROX(               m2,       m1+m2-m1);
-  VERIFY_IS_APPROX(               mones,    m2.cwiseQuotient(m2));
+#ifdef EIGEN_VECTORIZE
+  if(NumTraits<Scalar>::HasFloatingPoint)
+#endif
+  {
+    VERIFY_IS_APPROX(               mones,    m2.cwiseQuotient(m2));
+  }
  VERIFY_IS_APPROX(               m1.cwiseProduct(m2),    m2.cwiseProduct(m1));

  VERIFY( m1.cwiseLessThan(m1.cwise(bind2nd(plus<Scalar>(), Scalar(1)))).all() );
--- a/test/geometry.cpp
+++ b/test/geometry.cpp
@ -86,7 +86,7 @@ template<typename Scalar> void geometry(void)
  m << v0.normalized(),
      (v0.cross(v1)).normalized(),
      (v0.cross(v1).cross(v0)).normalized();
-  VERIFY(m.isOrtho());
+  VERIFY(m.isUnitary());

  // AngleAxis
  VERIFY_IS_APPROX(AngleAxis(a,v1.normalized()).toRotationMatrix(),