Do not reuse allocations which hold tuple logical buffers. This works around a GPU codegen issue which extended the live range of tuple buffers. This also addresses a potential latent bug where thread-local or custom call buffer might have been reused.

Change: 145561773
author: Mark Heffernan <meheff@google.com> 2017-01-25 10:07:46 -0800
committer: TensorFlower Gardener <gardener@tensorflow.org> 2017-01-25 10:23:34 -0800
commit: 081758b0e5efc1a1591cda068a4866099bf8a3c5 (patch)
tree: d44c5835cd768b93140e2e9354fbba5ac33d4fe7 /tensorflow/compiler/xla/service/buffer_assignment.h
parent: e521a3dfffa5ec5e6e8b942cf829dfb4c9ec473f (diff)
1 files changed, 22 insertions, 5 deletions
diff --git a/tensorflow/compiler/xla/service/buffer_assignment.h b/tensorflow/compiler/xla/service/buffer_assignment.h
index af455de298..46c2253e13 100644
--- a/tensorflow/compiler/xla/service/buffer_assignment.h
+++ b/tensorflow/compiler/xla/service/buffer_assignment.h
@@ -52,8 +52,12 @@ class BufferAllocation {
   // contiguously and can be used as array indexes.
   using Index = int64;
 
-  BufferAllocation(Index index, int64 size, bool is_thread_local)
-      : index_(index), size_(size), is_thread_local_(is_thread_local) {}
+  BufferAllocation(Index index, int64 size, bool is_thread_local,
+                   bool is_reusable)
+      : index_(index),
+        size_(size),
+        is_thread_local_(is_thread_local),
+        is_reusable_(is_reusable) {}
   ~BufferAllocation() {}
 
   // Adds a LogicalBuffer to the set assigned to this buffer.
@@ -64,6 +68,9 @@ class BufferAllocation {
   // local.
   bool is_thread_local() const { return is_thread_local_; }
 
+  // Whether this allocation can be used by more than one logical buffer.
+  bool is_reusable() const { return is_reusable_; }
+
   // Whether this allocation holds a LogicalBuffer from a parameter of the entry
   // computation. These buffers have lifetimes which may be longer than the
   // XLA computation.
@@ -138,6 +145,9 @@ class BufferAllocation {
   // Whether this buffer needs to be thread-local.
   bool is_thread_local_;
 
+  // Whether this buffer is usable by more than one logical buffer.
+  bool is_reusable_;
+
   // Whether this allocation holds an entry computation parameter. Entry
   // computation parameters are special be cause they have lifetimes which may
   // outlast the computation.
@@ -232,10 +242,13 @@ class BufferAssignment {
   // assigned to it. `is_thread_local` indicates whether this buffer needs to be
   // thread-local.
   BufferAllocation* NewAllocation(const LogicalBuffer& buffer, int64 size,
-                                  bool is_thread_local);
+                                  bool is_thread_local, bool is_reusable);
 
-  // Adds a LogicalBuffer to the set assigned to the given allocation.
-  void AddAssignment(const LogicalBuffer& buffer, BufferAllocation* allocation);
+  // Adds a LogicalBuffer to the set assigned to the given allocation. If
+  // colocated_buffer is true, then the logical buffer is an alias of another
+  // buffer assigned to this allocation.
+  void AddAssignment(const LogicalBuffer& buffer, BufferAllocation* allocation,
+                     bool colocated_buffer);
 
   // Returns the BufferLiveness object used to construct this assignment.
   const BufferLiveness& liveness() { return *liveness_; }
@@ -314,6 +327,10 @@ class BufferAssigner {
                          const LogicalBuffer& buffer,
                          BufferAssignment* assignment);
 
+  // Colocated buffers are logical buffers from different computations which
+  // alias. Explicitly handling these colocated buffers is necessary because
+  // points-to analysis is computation level scope and does not recognize
+  // aliasing across computations (b/32491382).
   using ColocatedBufferSet = std::vector<const LogicalBuffer*>;
 
   // Returns a vector of ColocatedBufferSet objects, where each
author	Mark Heffernan <meheff@google.com>	2017-01-25 10:07:46 -0800
committer	TensorFlower Gardener <gardener@tensorflow.org>	2017-01-25 10:23:34 -0800
commit	081758b0e5efc1a1591cda068a4866099bf8a3c5 (patch)
tree	d44c5835cd768b93140e2e9354fbba5ac33d4fe7 /tensorflow/compiler/xla/service/buffer_assignment.h
parent	e521a3dfffa5ec5e6e8b942cf829dfb4c9ec473f (diff)