about | summary | refs | log | tree | commit | diff | homepage
path: root/unsupported/Eigen/CXX11/src/Tensor/TensorMeta.h
diff options
context:
space:
mode:
author Benoit Steiner <benoit.steiner.goog@gmail.com> 2016-06-09 08:22:27 -0700
committer Benoit Steiner <benoit.steiner.goog@gmail.com> 2016-06-09 08:22:27 -0700
commit aa33446dace833fbf06632e586c80119b3d8ac11 (patch)
tree d7bc59330e69e19de37da9fffc64016ee0febec0 /unsupported/Eigen/CXX11/src/Tensor/TensorMeta.h
parent 15890c304edbccedc8a989468ed3fc475f428059 (diff)
Improved support for vectorization of 16-bit floats
Diffstat (limited to 'unsupported/Eigen/CXX11/src/Tensor/TensorMeta.h')
-rw-r--r-- unsupported/Eigen/CXX11/src/Tensor/TensorMeta.h 5
1 files changed, 5 insertions, 0 deletions
diff --git a/unsupported/Eigen/CXX11/src/Tensor/TensorMeta.h b/unsupported/Eigen/CXX11/src/Tensor/TensorMeta.h
index b1645d56f..82a905a65 100644
--- a/unsupported/Eigen/CXX11/src/Tensor/TensorMeta.h
+++ b/unsupported/Eigen/CXX11/src/Tensor/TensorMeta.h
@@ -55,6 +55,11 @@ struct PacketType {
// For CUDA packet types when using a GpuDevice
#if defined(EIGEN_USE_GPU) && defined(__CUDACC__)
template <>
+ struct PacketType<half, GpuDevice> {  // Explicit specialization of PacketType selected for half scalars on a GpuDevice.
+ typedef half2 type;  // Packet type used for half in this specialization.
+ static const int size = 2;  // NOTE(review): presumably the number of half values held by one half2 packet (mirrors float4 / size 4 in the float specialization that follows) -- confirm.
+ };
+template <>
struct PacketType<float, GpuDevice> {
typedef float4 type;
static const int size = 4;