/* Copyright 2015 The TensorFlow Authors. All Rights Reserved. Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. ==============================================================================*/ #ifndef TENSORFLOW_CORE_KERNELS_CWISE_OPS_GRADIENTS_H_ #define TENSORFLOW_CORE_KERNELS_CWISE_OPS_GRADIENTS_H_ #define EIGEN_USE_THREADS #include "third_party/eigen3/unsupported/Eigen/CXX11/Tensor" #include "tensorflow/core/kernels/cwise_ops.h" namespace Eigen { namespace internal { // Gradient for the tanh function template struct scalar_tanh_gradient_op { EIGEN_EMPTY_STRUCT_CTOR(scalar_tanh_gradient_op) EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const T operator()(const T& output, const T& output_gradient) const { return output_gradient * (T(1) - output * output); } template EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const Packet packetOp(const Packet& output, const Packet& output_gradient) const { return pmul(output_gradient, psub(pset1(T(1)), pmul(output, output))); } }; template struct functor_traits> { enum { Cost = NumTraits::AddCost + 2 * NumTraits::MulCost, PacketAccess = packet_traits::HasSub && packet_traits::HasMul, }; }; // Gradient for the sigmoid function template struct scalar_sigmoid_gradient_op { EIGEN_EMPTY_STRUCT_CTOR(scalar_sigmoid_gradient_op) EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const T operator()(const T& output, const T& output_gradient) const { return output_gradient * output * (T(1) - output); } template EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const Packet packetOp(const Packet& output, const Packet& output_gradient) const { return pmul(output_gradient, pmul(output, psub(pset1(T(1)), output))); } }; template struct functor_traits> { enum { Cost = NumTraits::AddCost + 2 * NumTraits::MulCost, PacketAccess = packet_traits::HasSub && packet_traits::HasMul, }; }; // Gradient for the inverse function template struct scalar_inverse_gradient_op { EIGEN_EMPTY_STRUCT_CTOR(scalar_inverse_gradient_op) EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const T operator()(const T& output, const T& output_gradient) const { const T out_conj = numext::conj(output); return -output_gradient * out_conj * out_conj; } template EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const Packet packetOp(const Packet& output, const Packet& output_gradient) const { const Packet out_conj = pconj(output); return pnegate(pmul(output_gradient, pmul(out_conj, out_conj))); } }; template struct functor_traits> { enum { Cost = NumTraits::AddCost + 2 * NumTraits::MulCost, PacketAccess = packet_traits::HasMul, }; }; // Gradient for the sqrt function template struct scalar_sqrt_gradient_op { EIGEN_EMPTY_STRUCT_CTOR(scalar_sqrt_gradient_op) EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const T operator()(const T& output, const T& output_gradient) const { const T out_conj = numext::conj(output); return static_cast(0.5) * output_gradient / out_conj; } template EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const Packet packetOp(const Packet& output, const Packet& output_gradient) const { const Packet const_half = pset1(static_cast(0.5)); const Packet out_conj = pconj(output); return pdiv(pmul(const_half, output_gradient), out_conj); } }; template struct functor_traits> { enum { PacketAccess = packet_traits::HasMul & packet_traits::HasDiv, Cost = NumTraits::MulCost + scalar_div_cost::value, }; }; // Gradient for the rsqrt function template struct scalar_rsqrt_gradient_op { EIGEN_EMPTY_STRUCT_CTOR(scalar_rsqrt_gradient_op) EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const T operator()(const T& output, const T& output_gradient) const { const T out_conj = numext::conj(output); return static_cast(-0.5) * (output_gradient * out_conj) * (out_conj * out_conj); } template EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const Packet packetOp(const Packet& output, const Packet& output_gradient) const { const Packet const_half = pset1(static_cast(-0.5)); const Packet out_conj = pconj(output); return pmul(const_half, pmul(pmul(output_gradient, out_conj), pmul(out_conj, out_conj))); } }; template struct functor_traits> { enum { Cost = 4 * NumTraits::MulCost, PacketAccess = packet_traits::HasMul, }; }; } // end namespace internal } // end namespace Eigen namespace tensorflow { namespace functor { template struct SimpleBinaryFunctor { void operator()(const Device& d, typename Functor::tout_type out, typename Functor::tin_type in0, typename Functor::tin_type in1); }; // Partial specialization of BinaryFunctor for CPU devices typedef Eigen::ThreadPoolDevice CPUDevice; template struct SimpleBinaryFunctor { void operator()(const CPUDevice& d, typename Functor::tout_type out, typename Functor::tin_type in0, typename Functor::tin_type in1) { out.device(d) = in0.binaryExpr(in1, typename Functor::func()); } }; #ifdef TENSORFLOW_USE_SYCL // Partial specialization of BinaryFunctor for SYCL devices typedef Eigen::SyclDevice SYCLDevice; template struct SimpleBinaryFunctor { void operator()(const SYCLDevice& d, typename Functor::tout_type out, typename Functor::tin_type in0, typename Functor::tin_type in1) { out.device(d) = in0.binaryExpr(in1, typename Functor::func()); } }; #endif // TENSORFLOW_USE_SYCL template struct tanh_grad : base> {}; template struct sigmoid_grad : base> { }; template struct inverse_grad : base> { }; template struct sqrt_grad : base> {}; template struct rsqrt_grad : base> {}; template struct igamma_grad_a : base> {}; } // end namespace functor } // end namespace tensorflow #endif // TENSORFLOW_CORE_KERNELS_CWISE_OPS_GRADIENTS_H_