Temporarily turn off the NEON implementation of pfloor as it does not work for large values.

The NEON implementation mimics the SSE implementation, but didn't mention the caveat that due to the unsigned of signed integer conversions, not all values in the original floating point  represented are supported.
This commit is contained in:
Zachary Garrett 2020-08-04 16:28:23 +00:00 committed by Rasmus Munk Larsen
parent 23b7f0572b
commit 21122498ec

View File

@ -137,7 +137,7 @@ struct packet_traits<float> : default_packet_traits
HasBlend = 0, HasBlend = 0,
HasDiv = 1, HasDiv = 1,
HasFloor = 1, HasFloor = 0,
HasSin = EIGEN_FAST_MATH, HasSin = EIGEN_FAST_MATH,
HasCos = EIGEN_FAST_MATH, HasCos = EIGEN_FAST_MATH,
@ -1397,6 +1397,9 @@ template<> EIGEN_STRONG_INLINE Packet2f pcmp_lt_or_nan<Packet2f>(const Packet2f&
template<> EIGEN_STRONG_INLINE Packet4f pcmp_lt_or_nan<Packet4f>(const Packet4f& a, const Packet4f& b) template<> EIGEN_STRONG_INLINE Packet4f pcmp_lt_or_nan<Packet4f>(const Packet4f& a, const Packet4f& b)
{ return vreinterpretq_f32_u32(vmvnq_u32(vcgeq_f32(a,b))); } { return vreinterpretq_f32_u32(vmvnq_u32(vcgeq_f32(a,b))); }
// WARNING: this pfloor implementation makes sense for inputs that fit in
// signed int32 integers (up to ~2.14e9), hence this is currently only used
// by pexp and not exposed through HasFloor.
template<> EIGEN_STRONG_INLINE Packet2f pfloor<Packet2f>(const Packet2f& a) template<> EIGEN_STRONG_INLINE Packet2f pfloor<Packet2f>(const Packet2f& a)
{ {
const Packet2f cst_1 = pset1<Packet2f>(1.0f); const Packet2f cst_1 = pset1<Packet2f>(1.0f);
@ -3269,7 +3272,7 @@ template<> struct packet_traits<double> : default_packet_traits
HasBlend = 0, HasBlend = 0,
HasDiv = 1, HasDiv = 1,
HasFloor = 1, HasFloor = 0,
HasSin = 0, HasSin = 0,
HasCos = 0, HasCos = 0,
@ -3329,6 +3332,9 @@ template<> EIGEN_STRONG_INLINE Packet2d pmin<Packet2d>(const Packet2d& a, const
template<> EIGEN_STRONG_INLINE Packet2d pmax<Packet2d>(const Packet2d& a, const Packet2d& b) { return vmaxq_f64(a,b); } template<> EIGEN_STRONG_INLINE Packet2d pmax<Packet2d>(const Packet2d& a, const Packet2d& b) { return vmaxq_f64(a,b); }
// WARNING: this pfloor implementation makes sense for inputs that fit in
// signed int64 integers (up to ~9.22e18), hence this is currently only used
// by pexp and not exposed through HasFloor.
template<> EIGEN_STRONG_INLINE Packet2d pfloor<Packet2d>(const Packet2d& a) template<> EIGEN_STRONG_INLINE Packet2d pfloor<Packet2d>(const Packet2d& a)
{ {
const Packet2d cst_1 = pset1<Packet2d>(1.0); const Packet2d cst_1 = pset1<Packet2d>(1.0);