about | summary | refs | log | tree | commit | diff | homepage
path: root/tensorflow/core/kernels/conv_grad_input_ops.cc
diff options
context:
space:
mode:
author: Justin Lebar <jlebar@google.com> 2018-04-23 17:16:55 -0700
committer: TensorFlower Gardener <gardener@tensorflow.org> 2018-04-23 17:19:22 -0700
commit 80fc661853f9a0844faf95eb68438dc85a5879e3 (patch)
tree e7328a367c4f4db472063f96c983b70e63aa3f26 /tensorflow/core/kernels/conv_grad_input_ops.cc
parent ecd837fd0ab69cf54d920eae3b1c73602be6c626 (diff)
Use tensorflow::se instead of perftools::gputools for StreamExecutor.
PiperOrigin-RevId: 194010749
Diffstat (limited to 'tensorflow/core/kernels/conv_grad_input_ops.cc')
-rw-r--r-- tensorflow/core/kernels/conv_grad_input_ops.cc 28
1 files changed, 14 insertions, 14 deletions
diff --git a/tensorflow/core/kernels/conv_grad_input_ops.cc b/tensorflow/core/kernels/conv_grad_input_ops.cc
index 66d15c6e78..35f2676023 100644
--- a/tensorflow/core/kernels/conv_grad_input_ops.cc
+++ b/tensorflow/core/kernels/conv_grad_input_ops.cc
@@ -604,7 +604,7 @@ struct ConvBackwardDataAutoTuneGroup {
static string name() { return "ConvBwdData"; }
};
typedef AutoTuneSingleton<ConvBackwardDataAutoTuneGroup, ConvParameters,
- perftools::gputools::dnn::AlgorithmConfig>
+ se::dnn::AlgorithmConfig>
AutoTuneConvBwdData;
// Backprop for input.
@@ -705,9 +705,9 @@ void LaunchConv2DBackpropInputOp<GPUDevice, T>::operator()(
const Tensor& out_backprop, const Tensor& filter, int row_dilation,
int col_dilation, int row_stride, int col_stride, const Padding& padding,
Tensor* in_backprop, TensorFormat data_format) {
- using perftools::gputools::dnn::AlgorithmConfig;
- using perftools::gputools::dnn::AlgorithmDesc;
- using perftools::gputools::dnn::ProfileResult;
+ using se::dnn::AlgorithmConfig;
+ using se::dnn::AlgorithmDesc;
+ using se::dnn::ProfileResult;
std::vector<int32> strides(4, 1);
std::vector<int32> dilations(4, 1);
@@ -778,8 +778,8 @@ void LaunchConv2DBackpropInputOp<GPUDevice, T>::operator()(
auto c_ptr = AsDeviceMemory(in_backprop->template flat<T>().data(),
in_backprop->template flat<T>().size());
- auto transpose = perftools::gputools::blas::Transpose::kTranspose;
- auto no_transpose = perftools::gputools::blas::Transpose::kNoTranspose;
+ auto transpose = se::blas::Transpose::kTranspose;
+ auto no_transpose = se::blas::Transpose::kNoTranspose;
bool blas_launch_status =
stream
@@ -810,8 +810,8 @@ void LaunchConv2DBackpropInputOp<GPUDevice, T>::operator()(
auto c_ptr = AsDeviceMemory(in_backprop->template flat<T>().data(),
in_backprop->template flat<T>().size());
- auto transpose = perftools::gputools::blas::Transpose::kTranspose;
- auto no_transpose = perftools::gputools::blas::Transpose::kNoTranspose;
+ auto transpose = se::blas::Transpose::kTranspose;
+ auto no_transpose = se::blas::Transpose::kNoTranspose;
bool blas_launch_status =
stream
@@ -841,24 +841,24 @@ void LaunchConv2DBackpropInputOp<GPUDevice, T>::operator()(
CHECK(padding_rows >= 0 && padding_cols >= 0)
<< "Negative row or col paddings: (" << padding_rows << ", "
<< padding_cols << ")";
- perftools::gputools::dnn::BatchDescriptor input_desc;
+ se::dnn::BatchDescriptor input_desc;
input_desc.set_count(dims.batch_size)
.set_height(GetTensorDim(compatible_input_shape, data_format, 'H'))
.set_width(GetTensorDim(compatible_input_shape, data_format, 'W'))
.set_feature_map_count(dims.in_depth)
- .set_layout(perftools::gputools::dnn::DataLayout::kBatchDepthYX);
- perftools::gputools::dnn::BatchDescriptor output_desc;
+ .set_layout(se::dnn::DataLayout::kBatchDepthYX);
+ se::dnn::BatchDescriptor output_desc;
output_desc.set_count(dims.batch_size)
.set_height(dims.spatial_dims[0].output_size)
.set_width(dims.spatial_dims[1].output_size)
.set_feature_map_count(dims.out_depth)
- .set_layout(perftools::gputools::dnn::DataLayout::kBatchDepthYX);
- perftools::gputools::dnn::FilterDescriptor filter_desc;
+ .set_layout(se::dnn::DataLayout::kBatchDepthYX);
+ se::dnn::FilterDescriptor filter_desc;
filter_desc.set_input_filter_height(dims.spatial_dims[0].filter_size)
.set_input_filter_width(dims.spatial_dims[1].filter_size)
.set_input_feature_map_count(dims.in_depth)
.set_output_feature_map_count(dims.out_depth);
- perftools::gputools::dnn::ConvolutionDescriptor conv_desc;
+ se::dnn::ConvolutionDescriptor conv_desc;
conv_desc.set_vertical_dilation_rate(dims.spatial_dims[0].dilation)
.set_horizontal_dilation_rate(dims.spatial_dims[1].dilation)
.set_vertical_filter_stride(dims.spatial_dims[0].stride)