aboutsummaryrefslogtreecommitdiffhomepage
path: root/tensorflow/contrib/hooks/python/training/profiler_hook.py
diff options
context:
space:
mode:
Diffstat (limited to 'tensorflow/contrib/hooks/python/training/profiler_hook.py')
-rw-r--r--tensorflow/contrib/hooks/python/training/profiler_hook.py104
1 files changed, 104 insertions, 0 deletions
diff --git a/tensorflow/contrib/hooks/python/training/profiler_hook.py b/tensorflow/contrib/hooks/python/training/profiler_hook.py
new file mode 100644
index 0000000000..35aa25edfd
--- /dev/null
+++ b/tensorflow/contrib/hooks/python/training/profiler_hook.py
@@ -0,0 +1,104 @@
+# Copyright 2017 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""Additional `SessionRunHook` implementations to complement those in
+tensorflow/python/training.
+
+"""
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import os.path
+
+from tensorflow.core.protobuf import config_pb2
+from tensorflow.python.client import timeline
+from tensorflow.python.platform import gfile
+from tensorflow.python.platform import tf_logging as logging
+from tensorflow.python.training.basic_session_run_hooks import SecondOrStepTimer
+from tensorflow.python.training.session_run_hook import SessionRunArgs
+from tensorflow.python.training import session_run_hook
+from tensorflow.python.training import training_util
+
+
+class ProfilerHook(session_run_hook.SessionRunHook):
+ """Captures CPU/GPU profiling information every N steps or seconds.
+
+ This produces files called "timeline-<step>.json", which are in Chrome
+ Trace format.
+
+ For more information see:
+ https://github.com/catapult-project/catapult/blob/master/tracing/README.md"""
+
+ def __init__(self,
+ save_steps=None,
+ save_secs=None,
+ output_dir="",
+ show_dataflow=True,
+ show_memory=False):
+ """Initializes a hook that takes periodic profiling snapshots.
+
+ Args:
+ save_steps: `int`, save profile traces every N steps. Exactly one of
+ `save_secs` and `save_steps` should be set.
+ save_secs: `int`, save profile traces every N seconds.
+ output_dir: `string`, the directory to save the profile traces to.
+ Defaults to the current directory.
+ show_dataflow: `bool`, if True, add flow events to the trace connecting
+ producers and consumers of tensors.
+ show_memory: `bool`, if True, add object snapshot events to the trace
+ showing the sizes and lifetimes of tensors.
+ """
+ self._output_file = os.path.join(output_dir, "timeline-{}.json")
+ self._show_dataflow = show_dataflow
+ self._show_memory = show_memory
+ self._timer = SecondOrStepTimer(every_secs=save_secs,
+ every_steps=save_steps)
+
+ def begin(self):
+ self._next_step = None
+ self._global_step_tensor = training_util.get_global_step()
+ if self._global_step_tensor is None:
+ raise RuntimeError(
+ "Global step should be created to use ProfilerHook.")
+
+ def before_run(self, run_context):
+ self._request_summary = (
+ self._next_step is None or
+ self._timer.should_trigger_for_step(self._next_step))
+ requests = {"global_step": self._global_step_tensor}
+ opts = (config_pb2.RunOptions(trace_level=config_pb2.RunOptions.FULL_TRACE)
+ if self._request_summary else None)
+
+ return SessionRunArgs(requests, options=opts)
+
+ def after_run(self, run_context, run_values):
+ global_step = run_values.results["global_step"]
+
+ if self._request_summary:
+ self._timer.update_last_triggered_step(global_step)
+ self._save(global_step,
+ self._output_file.format(global_step),
+ run_values.run_metadata.step_stats)
+
+ self._next_step = global_step + 1
+
+ def _save(self, step, save_path, step_stats):
+ logging.info("Saving timeline for %d into '%s'.", step, save_path)
+ with gfile.Open(save_path, "w") as f:
+ trace = timeline.Timeline(step_stats)
+ f.write(trace.generate_chrome_trace_format(
+ show_dataflow=self._show_dataflow,
+ show_memory=self._show_memory))