aboutsummaryrefslogtreecommitdiffhomepage
path: root/tensorflow/core/kernels/strided_slice_op.cc
diff options
context:
space:
mode:
Diffstat (limited to 'tensorflow/core/kernels/strided_slice_op.cc')
-rw-r--r--tensorflow/core/kernels/strided_slice_op.cc67
1 files changed, 67 insertions, 0 deletions
diff --git a/tensorflow/core/kernels/strided_slice_op.cc b/tensorflow/core/kernels/strided_slice_op.cc
index 6580d271d1..10593516f7 100644
--- a/tensorflow/core/kernels/strided_slice_op.cc
+++ b/tensorflow/core/kernels/strided_slice_op.cc
@@ -451,4 +451,71 @@ REGISTER_KERNEL_BUILDER(Name("StridedSliceAssign")
#undef REGISTER_GPU
#endif // GOOGLE_CUDA
+
+#ifdef TENSORFLOW_USE_SYCL
+#define REGISTER_SYCL(type) \
+ REGISTER_KERNEL_BUILDER(Name("StridedSlice") \
+ .Device(DEVICE_SYCL) \
+ .TypeConstraint<type>("T") \
+ .HostMemory("begin") \
+ .HostMemory("end") \
+ .HostMemory("strides") \
+ .TypeConstraint<int32>("Index"), \
+ StridedSliceOp<SYCLDevice, type>) \
+ REGISTER_KERNEL_BUILDER(Name("StridedSliceGrad") \
+ .Device(DEVICE_SYCL) \
+ .TypeConstraint<type>("T") \
+ .HostMemory("shape") \
+ .HostMemory("begin") \
+ .HostMemory("end") \
+ .HostMemory("strides") \
+ .TypeConstraint<int32>("Index"), \
+ StridedSliceGradOp<SYCLDevice, type>)\
+ REGISTER_KERNEL_BUILDER(Name("StridedSliceAssign") \
+ .Device(DEVICE_SYCL) \
+ .TypeConstraint<type>("T") \
+ .HostMemory("begin") \
+ .HostMemory("end") \
+ .HostMemory("strides") \
+ .TypeConstraint<int32>("Index"), \
+ StridedSliceAssignOp<SYCLDevice, type>)
+
+REGISTER_SYCL(float);
+REGISTER_SYCL(double);
+
+// A special GPU kernel for int32.
+// TODO(b/25387198): Also enable int32 in device memory. This kernel
+// registration requires all int32 inputs and outputs to be in host memory.
+REGISTER_KERNEL_BUILDER(Name("StridedSlice")
+ .Device(DEVICE_SYCL)
+ .TypeConstraint<int32>("T")
+ .TypeConstraint<int32>("Index")
+ .HostMemory("input")
+ .HostMemory("begin")
+ .HostMemory("end")
+ .HostMemory("strides")
+ .HostMemory("output"),
+ StridedSliceOp<CPUDevice, int32>);
+REGISTER_KERNEL_BUILDER(Name("StridedSliceGrad")
+ .Device(DEVICE_SYCL)
+ .TypeConstraint<int32>("T")
+ .TypeConstraint<int32>("Index")
+ .HostMemory("shape")
+ .HostMemory("begin")
+ .HostMemory("end")
+ .HostMemory("strides")
+ .HostMemory("dy")
+ .HostMemory("output"),
+ StridedSliceGradOp<CPUDevice, int32>);
+REGISTER_KERNEL_BUILDER(Name("StridedSliceAssign")
+ .Device(DEVICE_SYCL)
+ .TypeConstraint<int32>("T")
+ .TypeConstraint<int32>("Index")
+ .HostMemory("ref")
+ .HostMemory("begin")
+ .HostMemory("end")
+ .HostMemory("strides"),
+ StridedSliceAssignOp<CPUDevice, int32>)
+#undef REGISTER_SYCL
+#endif // TENSORFLOW_USE_SYCL
} // namespace tensorflow