diff options
author | A. Unique TensorFlower <gardener@tensorflow.org> | 2017-08-24 00:00:52 -0700 |
---|---|---|
committer | TensorFlower Gardener <gardener@tensorflow.org> | 2017-08-24 00:04:32 -0700 |
commit | 91b00a110feb83b7307ea9c280142007090f3cd9 (patch) | |
tree | 65b55fce64f9685476deca665686588def6e95b0 /tensorflow/stream_executor/stream.h | |
parent | 2f531b54ce51fdb9fc2b055548e534a13624ea93 (diff) |
Automated g4 rollback of changelist 166276461
PiperOrigin-RevId: 166305887
Diffstat (limited to 'tensorflow/stream_executor/stream.h')
-rw-r--r-- | tensorflow/stream_executor/stream.h | 98 |
1 files changed, 24 insertions, 74 deletions
diff --git a/tensorflow/stream_executor/stream.h b/tensorflow/stream_executor/stream.h index a418fe961c..9bd4c21a66 100644 --- a/tensorflow/stream_executor/stream.h +++ b/tensorflow/stream_executor/stream.h @@ -240,17 +240,15 @@ class Stream { DeviceMemory<float> *offset_backprop); // TODO(leary) add double-precision version of this interface. - Stream &ThenFusedConvolve( - const dnn::BatchDescriptor &conv_input_descriptor, - const DeviceMemory<int8> &conv_input_data, float conv_input_scale, - const dnn::FilterDescriptor &filter_descriptor, - const DeviceMemory<int8> &filter_data, - const dnn::ConvolutionDescriptor &convolution_descriptor, - const DeviceMemory<int8> &side_input_data, float side_input_scale, - const dnn::BatchDescriptor &bias_descriptor, - const DeviceMemory<float> &biases, dnn::ActivationMode activation_mode, - const dnn::BatchDescriptor &output_descriptor, - DeviceMemory<int8> *output); + Stream &ThenConvolve(const dnn::BatchDescriptor &input_descriptor, + const DeviceMemory<float> &input_data, + const dnn::FilterDescriptor &filter_descriptor, + const DeviceMemory<float> &filter_data, + const dnn::ConvolutionDescriptor &convolution_descriptor, + const DeviceMemory<float> &biases, + dnn::ActivationMode activation_mode, + const dnn::BatchDescriptor &output_descriptor, + DeviceMemory<float> *output); Stream &ThenConvolve(const dnn::BatchDescriptor &input_descriptor, const DeviceMemory<float> &input_data, @@ -280,39 +278,23 @@ class Stream { const dnn::BatchDescriptor &output_descriptor, DeviceMemory<float> *output_data); - Stream &ThenFusedConvolveWithScratch( - const dnn::BatchDescriptor &conv_input_descriptor, - const DeviceMemory<int8> &conv_input_data, float conv_input_scale, - const dnn::FilterDescriptor &filter_descriptor, - const DeviceMemory<int8> &filter_data, - const dnn::ConvolutionDescriptor &convolution_descriptor, - const DeviceMemory<int8> &side_input_data, float side_input_scale, - const dnn::BatchDescriptor &bias_descriptor, - const DeviceMemory<float> &biases, dnn::ActivationMode activation_mode, - const dnn::BatchDescriptor &output_descriptor, DeviceMemory<int8> *output, - ScratchAllocator *scratch_allocator); - - Stream &ThenFusedConvolveWithScratch( - const dnn::BatchDescriptor &conv_input_descriptor, - const DeviceMemory<Eigen::half> &conv_input_data, float conv_input_scale, + Stream &ThenConvolveWithScratch( + const dnn::BatchDescriptor &input_descriptor, + const DeviceMemory<Eigen::half> &input_data, const dnn::FilterDescriptor &filter_descriptor, const DeviceMemory<Eigen::half> &filter_data, const dnn::ConvolutionDescriptor &convolution_descriptor, - const DeviceMemory<Eigen::half> &side_input_data, float side_input_scale, - const dnn::BatchDescriptor &bias_descriptor, const DeviceMemory<Eigen::half> &biases, dnn::ActivationMode activation_mode, const dnn::BatchDescriptor &output_descriptor, DeviceMemory<Eigen::half> *output, ScratchAllocator *scratch_allocator); - Stream &ThenFusedConvolveWithScratch( - const dnn::BatchDescriptor &conv_input_descriptor, - const DeviceMemory<float> &conv_input_data, float conv_input_scale, + Stream &ThenConvolveWithScratch( + const dnn::BatchDescriptor &input_descriptor, + const DeviceMemory<float> &input_data, const dnn::FilterDescriptor &filter_descriptor, const DeviceMemory<float> &filter_data, const dnn::ConvolutionDescriptor &convolution_descriptor, - const DeviceMemory<float> &side_input_data, float side_input_scale, - const dnn::BatchDescriptor &bias_descriptor, const DeviceMemory<float> &biases, dnn::ActivationMode activation_mode, const dnn::BatchDescriptor &output_descriptor, DeviceMemory<float> *output, ScratchAllocator *scratch_allocator); @@ -341,6 +323,7 @@ class Stream { const dnn::FilterDescriptor &filter_descriptor, const DeviceMemory<float> &filter_data, const dnn::ConvolutionDescriptor &convolution_descriptor, + const DeviceMemory<float> &biases, dnn::ActivationMode activation_mode, const dnn::BatchDescriptor &output_descriptor, DeviceMemory<float> *output, ScratchAllocator *scratch_allocator, const dnn::AlgorithmConfig &algorithm_config, @@ -352,68 +335,35 @@ class Stream { const dnn::FilterDescriptor &filter_descriptor, const DeviceMemory<Eigen::half> &filter_data, const dnn::ConvolutionDescriptor &convolution_descriptor, + const DeviceMemory<Eigen::half> &biases, + dnn::ActivationMode activation_mode, const dnn::BatchDescriptor &output_descriptor, DeviceMemory<Eigen::half> *output, ScratchAllocator *scratch_allocator, const dnn::AlgorithmConfig &algorithm_config, dnn::ProfileResult *output_profile_result); - Stream &ThenFusedConvolveWithAlgorithm( - const dnn::BatchDescriptor &conv_input_descriptor, - const DeviceMemory<double> &conv_input_data, double conv_input_scale, - const dnn::FilterDescriptor &filter_descriptor, - const DeviceMemory<double> &filter_data, - const dnn::ConvolutionDescriptor &convolution_descriptor, - const DeviceMemory<double> &side_input_data, double side_input_scale, - const dnn::BatchDescriptor &bias_descriptor, - const DeviceMemory<double> &biases, dnn::ActivationMode activation_mode, - const dnn::BatchDescriptor &output_descriptor, - DeviceMemory<double> *output, ScratchAllocator *scratch_allocator, - const dnn::AlgorithmConfig &algorithm_config, - dnn::ProfileResult *output_profile_result); - - Stream &ThenFusedConvolveWithAlgorithm( - const dnn::BatchDescriptor &conv_input_descriptor, - const DeviceMemory<float> &conv_input_data, float conv_input_scale, + Stream &ThenConvolveWithAlgorithm( + const dnn::BatchDescriptor &input_descriptor, + const DeviceMemory<float> &input_data, const dnn::FilterDescriptor &filter_descriptor, const DeviceMemory<float> &filter_data, const dnn::ConvolutionDescriptor &convolution_descriptor, - const DeviceMemory<float> &side_input_data, float side_input_scale, - const dnn::BatchDescriptor &bias_descriptor, - const DeviceMemory<float> &biases, dnn::ActivationMode activation_mode, const dnn::BatchDescriptor &output_descriptor, DeviceMemory<float> *output, ScratchAllocator *scratch_allocator, const dnn::AlgorithmConfig &algorithm_config, dnn::ProfileResult *output_profile_result); - Stream &ThenFusedConvolveWithAlgorithm( - const dnn::BatchDescriptor &conv_input_descriptor, - const DeviceMemory<Eigen::half> &conv_input_data, float conv_input_scale, + Stream &ThenConvolveWithAlgorithm( + const dnn::BatchDescriptor &input_descriptor, + const DeviceMemory<Eigen::half> &input_data, const dnn::FilterDescriptor &filter_descriptor, const DeviceMemory<Eigen::half> &filter_data, const dnn::ConvolutionDescriptor &convolution_descriptor, - const DeviceMemory<Eigen::half> &side_input_data, float side_input_scale, - const dnn::BatchDescriptor &bias_descriptor, - const DeviceMemory<Eigen::half> &biases, - dnn::ActivationMode activation_mode, const dnn::BatchDescriptor &output_descriptor, DeviceMemory<Eigen::half> *output, ScratchAllocator *scratch_allocator, const dnn::AlgorithmConfig &algorithm_config, dnn::ProfileResult *output_profile_result); - Stream &ThenFusedConvolveWithAlgorithm( - const dnn::BatchDescriptor &conv_input_descriptor, - const DeviceMemory<int8> &conv_input_data, float conv_input_scale, - const dnn::FilterDescriptor &filter_descriptor, - const DeviceMemory<int8> &filter_data, - const dnn::ConvolutionDescriptor &convolution_descriptor, - const DeviceMemory<int8> &side_input_data, float side_input_scale, - const dnn::BatchDescriptor &bias_descriptor, - const DeviceMemory<float> &biases, dnn::ActivationMode activation_mode, - const dnn::BatchDescriptor &output_descriptor, DeviceMemory<int8> *output, - ScratchAllocator *scratch_allocator, - const dnn::AlgorithmConfig &algorithm_config, - dnn::ProfileResult *output_profile_result); - Stream &ThenSeparableConvolve( const dnn::BatchDescriptor &input_descriptor, const DeviceMemory<float> &input_data, |