path: root/tensorflow/compiler/jit
author: A. Unique TensorFlower <gardener@tensorflow.org> 2018-08-24 08:02:49 -0700
committer: TensorFlower Gardener <gardener@tensorflow.org> 2018-08-24 08:05:50 -0700
commit: 36ebaf71bd2ca763c2aa67fa93e3839a5119d708 (patch)
tree: 851bef6e99dd335439c5907b5df95a85b0d7be97 /tensorflow/compiler/jit
parent: 925cae2cc51f419d36b3438e693cced27b72799d (diff)
Memory ordering is enforced by streams, so we don't need to block TensorFlow's executor until transfers from host to device are complete.
PiperOrigin-RevId: 210098914
Diffstat (limited to 'tensorflow/compiler/jit')
-rw-r--r--  tensorflow/compiler/jit/xla_device_context.cc  17
1 file changed, 3 insertions, 14 deletions
diff --git a/tensorflow/compiler/jit/xla_device_context.cc b/tensorflow/compiler/jit/xla_device_context.cc
index 2027ec7737..ee07c5c964 100644
--- a/tensorflow/compiler/jit/xla_device_context.cc
+++ b/tensorflow/compiler/jit/xla_device_context.cc
@@ -184,18 +184,6 @@ void XlaTransferManager::CopyCPUTensorToDevice(const Tensor* cpu_tensor,
return;
}
status = TransferLiteralToDevice(reshaped_cpu_tensor, device_tensor);
- if (status.ok()) {
- xla_tensor->set_host_tensor(*cpu_tensor);
- host_to_device_stream_->ThenDoHostCallback([this, done]() {
- // We must not call the done closure directly from DoHostCallback
- // to avoid a deadlock. If done() is the callback that ends an
- // Executor's run, the Executor may call XlaDevice::Sync() inside the
- // callback. This deadlocks, because XlaDevice::Sync() waits for all
- // stream activity to complete.
- thread_pool_->Schedule([done]() { done(Status::OK()); });
- });
- return;
- }
} else {
se::DeviceMemoryBase dev_dst_ptr =
XlaTensor::DeviceMemoryFromTensor(*device_tensor);
@@ -208,8 +196,9 @@ void XlaTransferManager::CopyCPUTensorToDevice(const Tensor* cpu_tensor,
host_to_device_stream_.get(), block_status.error_message().c_str());
}
}
- xla_tensor->set_host_tensor(*cpu_tensor);
-
+ if (status.ok()) {
+ xla_tensor->set_host_tensor(*cpu_tensor);
+ }
done(status);
}
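Before this change, a successful TransferLiteralToDevice deferred done() until a host callback on host_to_device_stream_ fired (bounced through thread_pool_ to avoid deadlocking XlaDevice::Sync); after it, done(status) runs as soon as the copy has been enqueued, because any consumer of the device tensor is enqueued on the same stream and stream ordering guarantees the copy finishes first. The program below is a minimal sketch of that ordering property, not TensorFlow or StreamExecutor code: it models a stream as a single FIFO worker thread (ToyStream, Enqueue, and the buffer names are all illustrative assumptions), and shows a downstream op observing the completed copy even though the producer returned immediately after enqueuing.

```cpp
// Toy model of stream-ordered execution (not TensorFlow/StreamExecutor code).
// A "stream" is a single worker thread draining a FIFO queue, so work item N
// always finishes before work item N+1 starts -- the property the commit
// message relies on. All names here are illustrative assumptions.
#include <condition_variable>
#include <functional>
#include <iostream>
#include <mutex>
#include <queue>
#include <thread>
#include <vector>

class ToyStream {
 public:
  ToyStream() : worker_([this] { Run(); }) {}
  ~ToyStream() {
    {
      std::lock_guard<std::mutex> lock(mu_);
      done_ = true;
    }
    cv_.notify_one();
    worker_.join();
  }

  // Enqueue work and return immediately; the caller does not block.
  void Enqueue(std::function<void()> fn) {
    {
      std::lock_guard<std::mutex> lock(mu_);
      queue_.push(std::move(fn));
    }
    cv_.notify_one();
  }

 private:
  void Run() {
    for (;;) {
      std::function<void()> fn;
      {
        std::unique_lock<std::mutex> lock(mu_);
        cv_.wait(lock, [this] { return done_ || !queue_.empty(); });
        if (queue_.empty()) return;  // done_ is set and nothing is left to run.
        fn = std::move(queue_.front());
        queue_.pop();
      }
      fn();  // Items run strictly in enqueue order.
    }
  }

  std::mutex mu_;
  std::condition_variable cv_;
  std::queue<std::function<void()>> queue_;
  bool done_ = false;
  std::thread worker_;
};

int main() {
  std::vector<int> device_buffer(4, 0);  // Stand-in for device memory.
  ToyStream stream;                      // Stand-in for host_to_device_stream_.

  // "Host to device copy": enqueued on the stream, then we return right away,
  // mirroring CopyCPUTensorToDevice calling done(status) without blocking.
  stream.Enqueue([&] { device_buffer = {1, 2, 3, 4}; });

  // A later "compute" op on the same stream is ordered after the copy, so it
  // necessarily observes the completed transfer.
  stream.Enqueue([&] {
    int sum = 0;
    for (int v : device_buffer) sum += v;
    std::cout << "sum seen by downstream op: " << sum << "\n";  // Prints 10.
  });
  return 0;  // ~ToyStream drains the queue before joining the worker.
}
```

In this model, nothing on the host ever waits for the copy; correctness comes purely from the FIFO ordering of the stream, which is the same reasoning the commit message gives for dropping the host callback and the extra thread-pool hop.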