about | summary | refs | log | tree | commit | diff | homepage
path: root/tensorflow/contrib/reduce_slice_ops
diff options
context:
space:
mode:
author: A. Unique TensorFlower <gardener@tensorflow.org> 2017-12-21 14:50:09 -0800
committer: TensorFlower Gardener <gardener@tensorflow.org> 2017-12-21 14:54:21 -0800
commit: e21952f86328d16d1a8a4ac5e100917a251d093f (patch)
tree: 1d9274230d915810cd78563f9952ee7ecf006408 /tensorflow/contrib/reduce_slice_ops
parent: 7989a3aa026f93c1f45e1baf4ac37ad2a79156f9 (diff)
Automated g4 rollback of changelist 179782067
PiperOrigin-RevId: 179861781
Diffstat (limited to 'tensorflow/contrib/reduce_slice_ops')
-rw-r--r-- tensorflow/contrib/reduce_slice_ops/kernels/reduce_slice_ops_gpu.cu.cc 11
1 files changed, 5 insertions, 6 deletions
diff --git a/tensorflow/contrib/reduce_slice_ops/kernels/reduce_slice_ops_gpu.cu.cc b/tensorflow/contrib/reduce_slice_ops/kernels/reduce_slice_ops_gpu.cu.cc
index 501cddb8c8..8e6870fadd 100644
--- a/tensorflow/contrib/reduce_slice_ops/kernels/reduce_slice_ops_gpu.cu.cc
+++ b/tensorflow/contrib/reduce_slice_ops/kernels/reduce_slice_ops_gpu.cu.cc
@@ -34,9 +34,9 @@ namespace functor {
__global__ void ReduceSliceDeviceKernel##reduceop( \
Cuda3DLaunchConfig config, Index indices_width, Index bound, \
const T begin, const Index *indices, const T *input, T *out) { \
- CUDA_AXIS_KERNEL_LOOP(x, config.virtual_thread_count.x, X) { \
- CUDA_AXIS_KERNEL_LOOP(y, config.virtual_thread_count.y, Y) { \
- CUDA_AXIS_KERNEL_LOOP(z, config.virtual_thread_count.z, Z) { \
+ CUDA_AXIS_KERNEL_LOOP(x, config.virtual_thread_count, x) { \
+ CUDA_AXIS_KERNEL_LOOP(y, config.virtual_thread_count, y) { \
+ CUDA_AXIS_KERNEL_LOOP(z, config.virtual_thread_count, z) { \
Index outidx = x * config.virtual_thread_count.y * \
config.virtual_thread_count.z + \
y * config.virtual_thread_count.z + z; \
@@ -68,9 +68,8 @@ namespace functor {
if (sizex * sizey * sizez == 0) { \
return; \
} \
- Cuda3DLaunchConfig config = GetCuda3DLaunchConfig( \
- sizex, sizey, sizez, d, ReduceSliceDeviceKernel##reduceop<T, Index>, \
- 0, 0); \
+ Cuda3DLaunchConfig config = GetCuda3DLaunchConfig(sizex, sizey, sizez, d,\
+ ReduceSliceDeviceKernel##reduceop<T, Index>, 0, 0); \
\
ReduceSliceDeviceKernel##reduceop<T, Index> \
<<<config.block_count, config.thread_per_block, 0, d.stream()>>>( \