aboutsummaryrefslogtreecommitdiffhomepage
path: root/tensorflow/python/profiler
diff options
context:
space:
mode:
authorGravatar A. Unique TensorFlower <gardener@tensorflow.org>2017-10-05 18:38:03 -0700
committerGravatar TensorFlower Gardener <gardener@tensorflow.org>2017-10-05 18:42:49 -0700
commit86238e8d09efce59de038b062a230030aa8bdd3a (patch)
tree8c58160f1bc7b2fc9649b744fac7a43971ef2b03 /tensorflow/python/profiler
parentd6513c8149d5b69faa250949c6bec6c796c553e8 (diff)
Track memory allocation/deallocation history.
PiperOrigin-RevId: 171239477
Diffstat (limited to 'tensorflow/python/profiler')
-rw-r--r--tensorflow/python/profiler/internal/run_metadata_test.py29
1 files changed, 29 insertions, 0 deletions
diff --git a/tensorflow/python/profiler/internal/run_metadata_test.py b/tensorflow/python/profiler/internal/run_metadata_test.py
index 80df44f5f5..4ff09d3800 100644
--- a/tensorflow/python/profiler/internal/run_metadata_test.py
+++ b/tensorflow/python/profiler/internal/run_metadata_test.py
@@ -121,6 +121,35 @@ class RunMetadataTest(test.TestCase):
self.assertEqual(len(ret['gpu:0']), 1)
self.assertEqual(len(ret['gpu:0/stream:all']), 1, '%s' % run_meta)
+ def testAllocationHistory(self):
+ if not test.is_gpu_available(cuda_only=True):
+ return
+
+ gpu_dev = test.gpu_device_name()
+ ops.reset_default_graph()
+ with ops.device(gpu_dev):
+ _, run_meta = _run_model()
+
+ mm = _extract_node(run_meta, 'MatMul')['gpu:0'][0]
+ mm_allocs = mm.memory[0].allocation_records
+ # has allocation and deallocation.
+ self.assertEqual(len(mm_allocs), 2)
+ # first allocated.
+ self.assertGreater(mm_allocs[1].alloc_micros, mm_allocs[0].alloc_micros)
+ self.assertGreater(mm_allocs[0].alloc_bytes, 0)
+ # Then deallocated.
+ self.assertLess(mm_allocs[1].alloc_bytes, 0)
+ # All memory deallocated.
+ self.assertEqual(mm_allocs[0].alloc_bytes + mm_allocs[1].alloc_bytes, 0)
+
+ rand = _extract_node(
+ run_meta, 'random_normal/RandomStandardNormal')['gpu:0'][0]
+ random_allocs = rand.memory[0].allocation_records
+ # random normal must be allocated first since matmul depends on it.
+ self.assertLess(random_allocs[0].alloc_micros, mm.all_start_micros)
+ # The memory is deallocated after matmul has started.
+ self.assertGreater(random_allocs[1].alloc_micros, mm.all_start_micros)
+
def testCPU(self):
ops.reset_default_graph()
with ops.device('/cpu:0'):