mirror of
https://gitlab.com/libeigen/eigen.git
synced 2025-01-12 14:25:16 +08:00
Fix non-trivial Half constructor for CUDA.
Both CUDA and HIP require trivial default constructors for types used in shared memory. Otherwise failing with ``` error: initialization is not supported for __shared__ variables. ```
This commit is contained in:
parent
6045243141
commit
1296abdf82
@ -85,11 +85,12 @@ namespace half_impl {
|
||||
#if !defined(EIGEN_HAS_GPU_FP16) || !defined(EIGEN_GPU_COMPILE_PHASE)
|
||||
// Make our own __half_raw definition that is similar to CUDA's.
|
||||
struct __half_raw {
|
||||
#if (defined(EIGEN_HAS_HIP_FP16) && !defined(EIGEN_HIP_DEVICE_COMPILE))
|
||||
// Eigen::half can be used as the datatype for some shared memory declarations (in Eigen and TF)
|
||||
// (In HIP) The element type for shared memory declaration cannot have non-trivial constructors
|
||||
// and hence the following special casing (which skips the zero-initilization)
|
||||
// Note that this check gets done even in the host compilation phase, and hence the need for this
|
||||
#if (defined(EIGEN_HAS_GPU_FP16) && !defined(EIGEN_DEVICE_COMPILE_PHASE))
|
||||
// Eigen::half can be used as the datatype for shared memory declarations (in Eigen and TF)
|
||||
// The element type for shared memory cannot have non-trivial constructors
|
||||
// and hence the following special casing (which skips the zero-initilization).
|
||||
// Note that this check gets done even in the host compilation phase, and
|
||||
// hence the need for this
|
||||
EIGEN_DEVICE_FUNC __half_raw() {}
|
||||
#else
|
||||
EIGEN_DEVICE_FUNC EIGEN_CONSTEXPR __half_raw() : x(0) {}
|
||||
|
Loading…
Reference in New Issue
Block a user