diff --git a/Eigen/src/Core/arch/CUDA/PacketMathHalf.h b/Eigen/src/Core/arch/CUDA/PacketMathHalf.h index 8931f4662..0bf891d24 100644 --- a/Eigen/src/Core/arch/CUDA/PacketMathHalf.h +++ b/Eigen/src/Core/arch/CUDA/PacketMathHalf.h @@ -607,7 +607,7 @@ template<> EIGEN_STRONG_INLINE Packet4h pset1(const Eigen::half& from) } template<> EIGEN_STRONG_INLINE Eigen::half pfirst(const Packet4h& from) { - return raw_uint16_to_half(static_cast(_mm_cvtsi64_si32(from.x))); + return half_impl::raw_uint16_to_half(static_cast(_mm_cvtsi64_si32(from.x))); } template<> EIGEN_STRONG_INLINE Packet4h pconj(const Packet4h& a) { return a; } @@ -618,17 +618,17 @@ template<> EIGEN_STRONG_INLINE Packet4h padd(const Packet4h& a, const Eigen::half h[4]; - Eigen::half ha = raw_uint16_to_half(static_cast(a64)); - Eigen::half hb = raw_uint16_to_half(static_cast(b64)); + Eigen::half ha = half_impl::raw_uint16_to_half(static_cast(a64)); + Eigen::half hb = half_impl::raw_uint16_to_half(static_cast(b64)); h[0] = ha + hb; - ha = raw_uint16_to_half(static_cast(a64 >> 16)); - hb = raw_uint16_to_half(static_cast(b64 >> 16)); + ha = half_impl::raw_uint16_to_half(static_cast(a64 >> 16)); + hb = half_impl::raw_uint16_to_half(static_cast(b64 >> 16)); h[1] = ha + hb; - ha = raw_uint16_to_half(static_cast(a64 >> 32)); - hb = raw_uint16_to_half(static_cast(b64 >> 32)); + ha = half_impl::raw_uint16_to_half(static_cast(a64 >> 32)); + hb = half_impl::raw_uint16_to_half(static_cast(b64 >> 32)); h[2] = ha + hb; - ha = raw_uint16_to_half(static_cast(a64 >> 48)); - hb = raw_uint16_to_half(static_cast(b64 >> 48)); + ha = half_impl::raw_uint16_to_half(static_cast(a64 >> 48)); + hb = half_impl::raw_uint16_to_half(static_cast(b64 >> 48)); h[3] = ha + hb; Packet4h result; result.x = _mm_set_pi16(h[3].x, h[2].x, h[1].x, h[0].x); @@ -641,17 +641,17 @@ template<> EIGEN_STRONG_INLINE Packet4h pmul(const Packet4h& a, const Eigen::half h[4]; - Eigen::half ha = raw_uint16_to_half(static_cast(a64)); - Eigen::half hb = raw_uint16_to_half(static_cast(b64)); + Eigen::half ha = half_impl::raw_uint16_to_half(static_cast(a64)); + Eigen::half hb = half_impl::raw_uint16_to_half(static_cast(b64)); h[0] = ha * hb; - ha = raw_uint16_to_half(static_cast(a64 >> 16)); - hb = raw_uint16_to_half(static_cast(b64 >> 16)); + ha = half_impl::raw_uint16_to_half(static_cast(a64 >> 16)); + hb = half_impl::raw_uint16_to_half(static_cast(b64 >> 16)); h[1] = ha * hb; - ha = raw_uint16_to_half(static_cast(a64 >> 32)); - hb = raw_uint16_to_half(static_cast(b64 >> 32)); + ha = half_impl::raw_uint16_to_half(static_cast(a64 >> 32)); + hb = half_impl::raw_uint16_to_half(static_cast(b64 >> 32)); h[2] = ha * hb; - ha = raw_uint16_to_half(static_cast(a64 >> 48)); - hb = raw_uint16_to_half(static_cast(b64 >> 48)); + ha = half_impl::raw_uint16_to_half(static_cast(a64 >> 48)); + hb = half_impl::raw_uint16_to_half(static_cast(b64 >> 48)); h[3] = ha * hb; Packet4h result; result.x = _mm_set_pi16(h[3].x, h[2].x, h[1].x, h[0].x);