StreamExecutor: Optimize kernel argument packing

Create a single class to hold all kernel arguments, and optimize how arguments are added to it. Change: 140556725
author: Peter Hawkins <phawkins@google.com> 2016-11-29 18:55:46 -0800
committer: TensorFlower Gardener <gardener@tensorflow.org> 2016-11-29 19:05:55 -0800
commit: bada4a5339d4567419e993b7736eb23a6f3535c4 (patch)
tree: d793b3a70518a2ab63fbc24c0e41d72eb7d7d97f /tensorflow/stream_executor/stream_executor_pimpl.cc
parent: 347d3ef2a871d8212f39c7ea2b7defe63468dfbc (diff)
1 file changed, 1 insertion, 6 deletions
diff --git a/tensorflow/stream_executor/stream_executor_pimpl.cc b/tensorflow/stream_executor/stream_executor_pimpl.cc
index 2fdd1e4b49..7739d31662 100644
--- a/tensorflow/stream_executor/stream_executor_pimpl.cc
+++ b/tensorflow/stream_executor/stream_executor_pimpl.cc
@@ -394,7 +394,7 @@ rng::RngSupport *StreamExecutor::AsRng() {
 bool StreamExecutor::Launch(Stream *stream, const ThreadDim &thread_dims,
                             const BlockDim &block_dims,
                             const KernelBase &kernel,
-                            const std::vector<KernelArg> &args) {
+                            const KernelArgsArrayBase &args) {
   SubmitTrace(&TraceListener::LaunchSubmit, stream, thread_dims, block_dims,
               kernel, args);
 
@@ -659,11 +659,6 @@ bool StreamExecutor::DeviceMemoryUsage(int64 *free, int64 *total) const {
   return implementation_->DeviceMemoryUsage(free, total);
 }
 
-KernelArg StreamExecutor::DeviceMemoryToKernelArg(
-    const DeviceMemoryBase &gpu_mem) const {
-  return implementation_->DeviceMemoryToKernelArg(gpu_mem);
-}
-
 void StreamExecutor::EnqueueOnBackgroundThread(std::function<void()> task) {
   background_threads_->Schedule(task);
 }
author	Peter Hawkins <phawkins@google.com>	2016-11-29 18:55:46 -0800
committer	TensorFlower Gardener <gardener@tensorflow.org>	2016-11-29 19:05:55 -0800
commit	bada4a5339d4567419e993b7736eb23a6f3535c4 (patch)
tree	d793b3a70518a2ab63fbc24c0e41d72eb7d7d97f /tensorflow/stream_executor/stream_executor_pimpl.cc
parent	347d3ef2a871d8212f39c7ea2b7defe63468dfbc (diff)