// This file is part of Eigen, a lightweight C++ template library // for linear algebra. // // Copyright (C) 2015 Benoit Steiner // // This Source Code Form is subject to the terms of the Mozilla // Public License v. 2.0. If a copy of the MPL was not distributed // with this file, You can obtain one at http://mozilla.org/MPL/2.0/. #ifndef EIGEN_CXX11_TENSOR_TENSOR_META_H #define EIGEN_CXX11_TENSOR_TENSOR_META_H namespace Eigen { template struct Cond {}; template EIGEN_DEVICE_FUNC EIGEN_ALWAYS_INLINE const T1& choose(Cond, const T1& first, const T2&) { return first; } template EIGEN_DEVICE_FUNC EIGEN_ALWAYS_INLINE const T2& choose(Cond, const T1&, const T2& second) { return second; } template EIGEN_DEVICE_FUNC EIGEN_ALWAYS_INLINE T divup(const X x, const Y y) { return static_cast((x + y - 1) / y); } template EIGEN_DEVICE_FUNC EIGEN_ALWAYS_INLINE T divup(const T x, const T y) { return static_cast((x + y - 1) / y); } template struct max_n_1 { static const size_t size = n; }; template <> struct max_n_1<0> { static const size_t size = 1; }; // Default packet types template struct PacketType : internal::packet_traits { typedef typename internal::packet_traits::type type; }; // For CUDA packet types when using a GpuDevice #if defined(EIGEN_USE_GPU) && defined(EIGEN_HAS_GPU_FP16) typedef ulonglong2 Packet4h2; template<> struct PacketType { typedef Packet4h2 type; static const int size = 8; enum { HasAdd = 1, HasSub = 1, HasMul = 1, HasNegate = 1, HasAbs = 1, HasArg = 0, HasAbs2 = 0, HasMin = 1, HasMax = 1, HasConj = 0, HasSetLinear = 0, HasBlend = 0, HasDiv = 1, HasSqrt = 1, HasRsqrt = 1, HasExp = 1, HasExpm1 = 0, HasLog = 1, HasLog1p = 0, HasLog10 = 0, HasPow = 1, }; }; #endif #if defined(EIGEN_USE_SYCL) namespace TensorSycl { namespace internal { template struct PlusOp { static constexpr Index Value = A + B; }; template struct DivOp { static constexpr Index Value = A / B; }; template class StepOp> struct static_for { template static EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE void loop(UnaryOperator op) { op(start); static_for::Value, end, step, StepOp>::loop(op); } }; template class StepOp> struct static_for { template static EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE void loop(UnaryOperator) {} }; template struct Vectorise { static const int PacketSize = 1; typedef OutScalar PacketReturnType; }; template struct Vectorise { static const int PacketSize = Eigen::PacketType::size; typedef typename Eigen::PacketType::type PacketReturnType; }; static EIGEN_DEVICE_FUNC EIGEN_ALWAYS_INLINE Index roundUp(Index x, Index y) { return ((((x) + (y)-1) / (y)) * (y)); } } // namespace internal } // namespace TensorSycl template <> struct PacketType { typedef half type; static const int size = 1; enum { HasAdd = 0, HasSub = 0, HasMul = 0, HasNegate = 0, HasAbs = 0, HasArg = 0, HasAbs2 = 0, HasMin = 0, HasMax = 0, HasConj = 0, HasSetLinear = 0, HasBlend = 0 }; }; template struct PacketType : internal::default_packet_traits { typedef Scalar type; typedef Scalar half; enum { Vectorizable = 0, size = 1, AlignedOnScalar = 0, HasHalfPacket = 0 }; enum { HasAdd = 0, HasSub = 0, HasMul = 0, HasNegate = 0, HasAbs = 0, HasAbs2 = 0, HasMin = 0, HasMax = 0, HasConj = 0, HasSetLinear = 0 }; }; template struct PacketType : PacketType{}; #ifndef EIGEN_DONT_VECTORIZE_SYCL #define PACKET_TYPE(CVQual, Type, val, lengths, DEV)\ template<> struct PacketType : internal::sycl_packet_traits \ {\ typedef typename internal::packet_traits::type type;\ typedef typename internal::packet_traits::half half;\ }; PACKET_TYPE(const, float, 1, 4, SyclDevice) PACKET_TYPE(, float, 1, 4, SyclDevice) PACKET_TYPE(const, float, 1, 4, const SyclDevice) PACKET_TYPE(, float, 1, 4, const SyclDevice) PACKET_TYPE(const, double, 0, 2, SyclDevice) PACKET_TYPE(, double, 0, 2, SyclDevice) PACKET_TYPE(const, double, 0, 2, const SyclDevice) PACKET_TYPE(, double, 0, 2, const SyclDevice) #undef PACKET_TYPE template<> struct PacketType: PacketType{}; template<> struct PacketType: PacketType{}; #endif #endif // Tuple mimics std::pair but works on e.g. nvcc. template struct Tuple { public: U first; V second; typedef U first_type; typedef V second_type; EIGEN_CONSTEXPR EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE Tuple() : first(), second() {} EIGEN_CONSTEXPR EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE Tuple(const U& f, const V& s) : first(f), second(s) {} EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE void swap(Tuple& rhs) { using numext::swap; swap(first, rhs.first); swap(second, rhs.second); } }; template EIGEN_CONSTEXPR EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE bool operator==(const Tuple& x, const Tuple& y) { return (x.first == y.first && x.second == y.second); } template EIGEN_CONSTEXPR EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE bool operator!=(const Tuple& x, const Tuple& y) { return !(x == y); } // Can't use std::pairs on cuda devices template struct IndexPair { EIGEN_CONSTEXPR EIGEN_DEVICE_FUNC EIGEN_ALWAYS_INLINE IndexPair() : first(0), second(0) {} EIGEN_CONSTEXPR EIGEN_DEVICE_FUNC EIGEN_ALWAYS_INLINE IndexPair(Idx f, Idx s) : first(f), second(s) {} EIGEN_DEVICE_FUNC void set(IndexPair val) { first = val.first; second = val.second; } Idx first; Idx second; }; #ifdef EIGEN_HAS_SFINAE namespace internal { template EIGEN_CONSTEXPR EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE array customIndices2Array(IndexType& idx, numeric_list) { return { idx[Is]... }; } template EIGEN_CONSTEXPR EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE array customIndices2Array(IndexType&, numeric_list) { return array(); } /** Make an array (for index/dimensions) out of a custom index */ template EIGEN_CONSTEXPR EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE array customIndices2Array(IndexType& idx) { return customIndices2Array(idx, typename gen_numeric_list::type{}); } template struct is_base_of { typedef char (&yes)[1]; typedef char (&no)[2]; template struct Host { operator BB*() const; operator DD*(); }; template static yes check(D*, T); static no check(B*, int); static const bool value = sizeof(check(Host(), int())) == sizeof(yes); }; } #endif } // namespace Eigen #endif // EIGEN_CXX11_TENSOR_TENSOR_META_H