diff options
author | Gael Guennebaud <g.gael@free.fr> | 2014-04-25 10:56:18 +0200 |
---|---|---|
committer | Gael Guennebaud <g.gael@free.fr> | 2014-04-25 10:56:18 +0200 |
commit | 3d8d0f6269478a06f4fcbd4b838c8e9b9d7e9d62 (patch) | |
tree | 9f55e81498c1acc61ea0c10bce0ead69a71875d1 /Eigen/src/Core/arch/AltiVec | |
parent | b0e19db1cf462a07e25429d4f04f7d8e858f670f (diff) |
Enable vectorization of pack_rhs with a column-major RHS.
Rename and generalize Kernel<*> to PacketBlock<*,N>.
Diffstat (limited to 'Eigen/src/Core/arch/AltiVec')
-rw-r--r-- | Eigen/src/Core/arch/AltiVec/Complex.h | 2 | ||||
-rwxr-xr-x | Eigen/src/Core/arch/AltiVec/PacketMath.h | 4 |
2 files changed, 3 insertions, 3 deletions
diff --git a/Eigen/src/Core/arch/AltiVec/Complex.h b/Eigen/src/Core/arch/AltiVec/Complex.h
index ee1f008b1..8fdffad5e 100644
--- a/Eigen/src/Core/arch/AltiVec/Complex.h
+++ b/Eigen/src/Core/arch/AltiVec/Complex.h
@@ -229,7 +229,7 @@ template<> EIGEN_STRONG_INLINE Packet2cf pcplxflip<Packet2cf>(const Packet2cf& x
   return Packet2cf(vec_perm(x.v, x.v, p16uc_COMPLEX_REV));
 }
 
-template<> EIGEN_STRONG_INLINE void ptranspose(Kernel<Packet2cf>& kernel)
+template<> EIGEN_STRONG_INLINE void ptranspose(PacketBlock<Packet2cf,2>& kernel)
 {
   Packet4f tmp = vec_perm(kernel.packet[0].v, kernel.packet[1].v, p16uc_COMPLEX_TRANSPOSE_0);
   kernel.packet[1].v = vec_perm(kernel.packet[0].v, kernel.packet[1].v, p16uc_COMPLEX_TRANSPOSE_1);
diff --git a/Eigen/src/Core/arch/AltiVec/PacketMath.h b/Eigen/src/Core/arch/AltiVec/PacketMath.h
index e26d88382..8a67354e4 100755
--- a/Eigen/src/Core/arch/AltiVec/PacketMath.h
+++ b/Eigen/src/Core/arch/AltiVec/PacketMath.h
@@ -539,7 +539,7 @@ struct palign_impl<Offset,Packet4i>
 };
 
 template<> EIGEN_DEVICE_FUNC inline void
-ptranspose(Kernel<Packet4f>& kernel) {
+ptranspose(PacketBlock<Packet4f,4>& kernel) {
   Packet4f t0, t1, t2, t3;
   t0 = vec_mergeh(kernel.packet[0], kernel.packet[2]);
   t1 = vec_mergel(kernel.packet[0], kernel.packet[2]);
@@ -552,7 +552,7 @@ ptranspose(Kernel<Packet4f>& kernel) {
 }
 
 template<> EIGEN_DEVICE_FUNC inline void
-ptranspose(Kernel<Packet4i>& kernel) {
+ptranspose(PacketBlock<Packet4i,4>& kernel) {
   Packet4i t0, t1, t2, t3;
   t0 = vec_mergeh(kernel.packet[0], kernel.packet[2]);
   t1 = vec_mergel(kernel.packet[0], kernel.packet[2]);