diff options
author | Rasmus Munk Larsen <rmlarsen@google.com> | 2020-10-09 20:05:49 +0000 |
---|---|---|
committer | Rasmus Munk Larsen <rmlarsen@google.com> | 2020-10-09 20:05:49 +0000 |
commit | 4e4d3f32d168ed9ce09d950f099a60ddcd11240f (patch) | |
tree | 3e52ae5b43c238679f69f3caf4d908d4afb16f13 /Eigen/src/Core/arch/NEON/PacketMath.h | |
parent | 7a8d3d5b81cb528f7f084b63686ffb20494053f6 (diff) |
Clean up packetmath tests and fix various bugs to make bfloat16 pass (almost) all packetmath tests with SSE, AVX, and AVX512.
Diffstat (limited to 'Eigen/src/Core/arch/NEON/PacketMath.h')
-rw-r--r-- | Eigen/src/Core/arch/NEON/PacketMath.h | 5 |
1 files changed, 5 insertions, 0 deletions
diff --git a/Eigen/src/Core/arch/NEON/PacketMath.h b/Eigen/src/Core/arch/NEON/PacketMath.h index 1246abeaa..6dbae8cee 100644 --- a/Eigen/src/Core/arch/NEON/PacketMath.h +++ b/Eigen/src/Core/arch/NEON/PacketMath.h @@ -3373,6 +3373,11 @@ template <> EIGEN_STRONG_INLINE Packet4bf pmax<Packet4bf>(const Packet4bf &a, return F32ToBf16(pmax<Packet4f>(Bf16ToF32(a), Bf16ToF32(b))); } +template<> EIGEN_STRONG_INLINE Packet4bf plset<Packet4bf>(const bfloat16& a) +{ + return F32ToBf16(plset<Packet4f>(static_cast<float>(a))); +} + template<> EIGEN_STRONG_INLINE Packet4bf por(const Packet4bf& a,const Packet4bf& b) { return por<Packet4us>(a, b); } |