about | summary | refs | log | tree | commit | diff | homepage
path: root/tensorflow/stream_executor/stream.h
diff options
context:
space:
mode:
author: A. Unique TensorFlower <gardener@tensorflow.org> 2017-08-24 00:00:52 -0700
committer: TensorFlower Gardener <gardener@tensorflow.org> 2017-08-24 00:04:32 -0700
commit: 91b00a110feb83b7307ea9c280142007090f3cd9 (patch)
tree: 65b55fce64f9685476deca665686588def6e95b0 /tensorflow/stream_executor/stream.h
parent: 2f531b54ce51fdb9fc2b055548e534a13624ea93 (diff)
Automated g4 rollback of changelist 166276461
PiperOrigin-RevId: 166305887
Diffstat (limited to 'tensorflow/stream_executor/stream.h')
-rw-r--r-- tensorflow/stream_executor/stream.h 98
1 files changed, 24 insertions, 74 deletions
diff --git a/tensorflow/stream_executor/stream.h b/tensorflow/stream_executor/stream.h
index a418fe961c..9bd4c21a66 100644
--- a/tensorflow/stream_executor/stream.h
+++ b/tensorflow/stream_executor/stream.h
@@ -240,17 +240,15 @@ class Stream {
DeviceMemory<float> *offset_backprop);
// TODO(leary) add double-precision version of this interface.
- Stream &ThenFusedConvolve(
- const dnn::BatchDescriptor &conv_input_descriptor,
- const DeviceMemory<int8> &conv_input_data, float conv_input_scale,
- const dnn::FilterDescriptor &filter_descriptor,
- const DeviceMemory<int8> &filter_data,
- const dnn::ConvolutionDescriptor &convolution_descriptor,
- const DeviceMemory<int8> &side_input_data, float side_input_scale,
- const dnn::BatchDescriptor &bias_descriptor,
- const DeviceMemory<float> &biases, dnn::ActivationMode activation_mode,
- const dnn::BatchDescriptor &output_descriptor,
- DeviceMemory<int8> *output);
+ Stream &ThenConvolve(const dnn::BatchDescriptor &input_descriptor,
+ const DeviceMemory<float> &input_data,
+ const dnn::FilterDescriptor &filter_descriptor,
+ const DeviceMemory<float> &filter_data,
+ const dnn::ConvolutionDescriptor &convolution_descriptor,
+ const DeviceMemory<float> &biases,
+ dnn::ActivationMode activation_mode,
+ const dnn::BatchDescriptor &output_descriptor,
+ DeviceMemory<float> *output);
Stream &ThenConvolve(const dnn::BatchDescriptor &input_descriptor,
const DeviceMemory<float> &input_data,
@@ -280,39 +278,23 @@ class Stream {
const dnn::BatchDescriptor &output_descriptor,
DeviceMemory<float> *output_data);
- Stream &ThenFusedConvolveWithScratch(
- const dnn::BatchDescriptor &conv_input_descriptor,
- const DeviceMemory<int8> &conv_input_data, float conv_input_scale,
- const dnn::FilterDescriptor &filter_descriptor,
- const DeviceMemory<int8> &filter_data,
- const dnn::ConvolutionDescriptor &convolution_descriptor,
- const DeviceMemory<int8> &side_input_data, float side_input_scale,
- const dnn::BatchDescriptor &bias_descriptor,
- const DeviceMemory<float> &biases, dnn::ActivationMode activation_mode,
- const dnn::BatchDescriptor &output_descriptor, DeviceMemory<int8> *output,
- ScratchAllocator *scratch_allocator);
-
- Stream &ThenFusedConvolveWithScratch(
- const dnn::BatchDescriptor &conv_input_descriptor,
- const DeviceMemory<Eigen::half> &conv_input_data, float conv_input_scale,
+ Stream &ThenConvolveWithScratch(
+ const dnn::BatchDescriptor &input_descriptor,
+ const DeviceMemory<Eigen::half> &input_data,
const dnn::FilterDescriptor &filter_descriptor,
const DeviceMemory<Eigen::half> &filter_data,
const dnn::ConvolutionDescriptor &convolution_descriptor,
- const DeviceMemory<Eigen::half> &side_input_data, float side_input_scale,
- const dnn::BatchDescriptor &bias_descriptor,
const DeviceMemory<Eigen::half> &biases,
dnn::ActivationMode activation_mode,
const dnn::BatchDescriptor &output_descriptor,
DeviceMemory<Eigen::half> *output, ScratchAllocator *scratch_allocator);
- Stream &ThenFusedConvolveWithScratch(
- const dnn::BatchDescriptor &conv_input_descriptor,
- const DeviceMemory<float> &conv_input_data, float conv_input_scale,
+ Stream &ThenConvolveWithScratch(
+ const dnn::BatchDescriptor &input_descriptor,
+ const DeviceMemory<float> &input_data,
const dnn::FilterDescriptor &filter_descriptor,
const DeviceMemory<float> &filter_data,
const dnn::ConvolutionDescriptor &convolution_descriptor,
- const DeviceMemory<float> &side_input_data, float side_input_scale,
- const dnn::BatchDescriptor &bias_descriptor,
const DeviceMemory<float> &biases, dnn::ActivationMode activation_mode,
const dnn::BatchDescriptor &output_descriptor,
DeviceMemory<float> *output, ScratchAllocator *scratch_allocator);
@@ -341,6 +323,7 @@ class Stream {
const dnn::FilterDescriptor &filter_descriptor,
const DeviceMemory<float> &filter_data,
const dnn::ConvolutionDescriptor &convolution_descriptor,
+ const DeviceMemory<float> &biases, dnn::ActivationMode activation_mode,
const dnn::BatchDescriptor &output_descriptor,
DeviceMemory<float> *output, ScratchAllocator *scratch_allocator,
const dnn::AlgorithmConfig &algorithm_config,
@@ -352,68 +335,35 @@ class Stream {
const dnn::FilterDescriptor &filter_descriptor,
const DeviceMemory<Eigen::half> &filter_data,
const dnn::ConvolutionDescriptor &convolution_descriptor,
+ const DeviceMemory<Eigen::half> &biases,
+ dnn::ActivationMode activation_mode,
const dnn::BatchDescriptor &output_descriptor,
DeviceMemory<Eigen::half> *output, ScratchAllocator *scratch_allocator,
const dnn::AlgorithmConfig &algorithm_config,
dnn::ProfileResult *output_profile_result);
- Stream &ThenFusedConvolveWithAlgorithm(
- const dnn::BatchDescriptor &conv_input_descriptor,
- const DeviceMemory<double> &conv_input_data, double conv_input_scale,
- const dnn::FilterDescriptor &filter_descriptor,
- const DeviceMemory<double> &filter_data,
- const dnn::ConvolutionDescriptor &convolution_descriptor,
- const DeviceMemory<double> &side_input_data, double side_input_scale,
- const dnn::BatchDescriptor &bias_descriptor,
- const DeviceMemory<double> &biases, dnn::ActivationMode activation_mode,
- const dnn::BatchDescriptor &output_descriptor,
- DeviceMemory<double> *output, ScratchAllocator *scratch_allocator,
- const dnn::AlgorithmConfig &algorithm_config,
- dnn::ProfileResult *output_profile_result);
-
- Stream &ThenFusedConvolveWithAlgorithm(
- const dnn::BatchDescriptor &conv_input_descriptor,
- const DeviceMemory<float> &conv_input_data, float conv_input_scale,
+ Stream &ThenConvolveWithAlgorithm(
+ const dnn::BatchDescriptor &input_descriptor,
+ const DeviceMemory<float> &input_data,
const dnn::FilterDescriptor &filter_descriptor,
const DeviceMemory<float> &filter_data,
const dnn::ConvolutionDescriptor &convolution_descriptor,
- const DeviceMemory<float> &side_input_data, float side_input_scale,
- const dnn::BatchDescriptor &bias_descriptor,
- const DeviceMemory<float> &biases, dnn::ActivationMode activation_mode,
const dnn::BatchDescriptor &output_descriptor,
DeviceMemory<float> *output, ScratchAllocator *scratch_allocator,
const dnn::AlgorithmConfig &algorithm_config,
dnn::ProfileResult *output_profile_result);
- Stream &ThenFusedConvolveWithAlgorithm(
- const dnn::BatchDescriptor &conv_input_descriptor,
- const DeviceMemory<Eigen::half> &conv_input_data, float conv_input_scale,
+ Stream &ThenConvolveWithAlgorithm(
+ const dnn::BatchDescriptor &input_descriptor,
+ const DeviceMemory<Eigen::half> &input_data,
const dnn::FilterDescriptor &filter_descriptor,
const DeviceMemory<Eigen::half> &filter_data,
const dnn::ConvolutionDescriptor &convolution_descriptor,
- const DeviceMemory<Eigen::half> &side_input_data, float side_input_scale,
- const dnn::BatchDescriptor &bias_descriptor,
- const DeviceMemory<Eigen::half> &biases,
- dnn::ActivationMode activation_mode,
const dnn::BatchDescriptor &output_descriptor,
DeviceMemory<Eigen::half> *output, ScratchAllocator *scratch_allocator,
const dnn::AlgorithmConfig &algorithm_config,
dnn::ProfileResult *output_profile_result);
- Stream &ThenFusedConvolveWithAlgorithm(
- const dnn::BatchDescriptor &conv_input_descriptor,
- const DeviceMemory<int8> &conv_input_data, float conv_input_scale,
- const dnn::FilterDescriptor &filter_descriptor,
- const DeviceMemory<int8> &filter_data,
- const dnn::ConvolutionDescriptor &convolution_descriptor,
- const DeviceMemory<int8> &side_input_data, float side_input_scale,
- const dnn::BatchDescriptor &bias_descriptor,
- const DeviceMemory<float> &biases, dnn::ActivationMode activation_mode,
- const dnn::BatchDescriptor &output_descriptor, DeviceMemory<int8> *output,
- ScratchAllocator *scratch_allocator,
- const dnn::AlgorithmConfig &algorithm_config,
- dnn::ProfileResult *output_profile_result);
-
Stream &ThenSeparableConvolve(
const dnn::BatchDescriptor &input_descriptor,
const DeviceMemory<float> &input_data,