Optimize predux<Packet4d> (AVX)

This commit is contained in:
Gael Guennebaud 2016-11-22 21:41:30 +01:00
parent f3fb0a1940
commit 7dd894e40e

View File

@ -401,8 +401,7 @@ template<> EIGEN_STRONG_INLINE float predux<Packet8f>(const Packet8f& a)
}
template<> EIGEN_STRONG_INLINE double predux<Packet4d>(const Packet4d& a)
{
Packet4d tmp0 = _mm256_hadd_pd(a,_mm256_permute2f128_pd(a,a,1));
return pfirst(_mm256_hadd_pd(tmp0,tmp0));
return predux(_mm_add_pd(_mm256_castpd256_pd128(a),_mm256_extractf128_pd(a,1)));
}
template<> EIGEN_STRONG_INLINE Packet4f predux_downto4<Packet8f>(const Packet8f& a)