diff options
Diffstat (limited to 'tensorflow/core/kernels/xent_op_gpu.cu.cc')
-rw-r--r-- | tensorflow/core/kernels/xent_op_gpu.cu.cc | 35 |
1 files changed, 35 insertions, 0 deletions
diff --git a/tensorflow/core/kernels/xent_op_gpu.cu.cc b/tensorflow/core/kernels/xent_op_gpu.cu.cc new file mode 100644 index 0000000000..eec6a84281 --- /dev/null +++ b/tensorflow/core/kernels/xent_op_gpu.cu.cc @@ -0,0 +1,35 @@ +#if GOOGLE_CUDA + +#define EIGEN_USE_GPU + +#include "tensorflow/core/kernels/xent_op.h" + +#include "tensorflow/core/platform/port.h" +#include "tensorflow/core/framework/tensor_types.h" + +namespace tensorflow { + +typedef Eigen::GpuDevice GPUDevice; + +// Partial specialization for a GPUDevice, that uses the Eigen implementation +// from XentEigenImpl. +namespace functor { +template <typename T> +struct XentFunctor<GPUDevice, T> { + void operator()(const GPUDevice& d, typename TTypes<T>::ConstMatrix logits, + typename TTypes<T>::ConstMatrix labels, + typename TTypes<T>::Matrix scratch, + typename TTypes<T>::Vec loss, + typename TTypes<T>::Matrix backprop) { + XentEigenImpl<GPUDevice, T>::Compute(d, logits, labels, scratch, loss, + backprop); + } +}; +} // end namespace functor + +// Instantiate the GPU implementation for float. +template struct functor::XentFunctor<GPUDevice, float>; + +} // end namespace tensorflow + +#endif // GOOGLE_CUDA |