/* Copyright 2018 The TensorFlow Authors. All Rights Reserved. Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. ==============================================================================*/ #ifndef TENSORFLOW_CORE_UTIL_STATS_CALCULATOR_H_ #define TENSORFLOW_CORE_UTIL_STATS_CALCULATOR_H_ #include #include #include #include #include #include #include #include "tensorflow/core/util/stat_summarizer_options.h" namespace tensorflow { template class Stat { public: void UpdateStat(ValueType v) { if (count_ == 0) { first_ = v; } newest_ = v; max_ = std::max(v, max_); min_ = std::min(v, min_); ++count_; sum_ += v; squared_sum_ += static_cast(v) * v; } void Reset() { new (this) Stat(); } bool empty() const { return count_ == 0; } ValueType first() const { return first_; } ValueType newest() const { return newest_; } ValueType max() const { return max_; } ValueType min() const { return min_; } int64_t count() const { return count_; } ValueType sum() const { return sum_; } HighPrecisionValueType squared_sum() const { return squared_sum_; } bool all_same() const { return (count_ == 0 || min_ == max_); } HighPrecisionValueType avg() const { return empty() ? std::numeric_limits::quiet_NaN() : static_cast(sum_) / count_; } ValueType std_deviation() const { return all_same() ? 0 : sqrt(squared_sum_ / count_ - avg() * avg()); } void OutputToStream(std::ostream* stream) const { if (empty()) { *stream << "count=0"; } else if (all_same()) { *stream << "count=" << count_ << " curr=" << newest_; if (count_ > 1) *stream << "(all same)"; } else { *stream << "count=" << count_ << " first=" << first_ << " curr=" << newest_ << " min=" << min_ << " max=" << max_ << " avg=" << avg() << " std=" << std_deviation(); } } friend std::ostream& operator<<(std::ostream& stream, const Stat& stat) { stat.OutputToStream(&stream); return stream; } private: ValueType first_ = 0; ValueType newest_ = 0; ValueType max_ = std::numeric_limits::min(); ValueType min_ = std::numeric_limits::max(); int64_t count_ = 0; ValueType sum_ = 0; HighPrecisionValueType squared_sum_ = 0; }; // A StatsCalculator assists in performance analysis of Graph executions. // // It summarizes time spent executing (on GPU/CPU), memory used etc for // graph execution. // // For example usage see StatsSummarizer. class StatsCalculator { public: enum SortingMetric { BY_NAME, BY_RUN_ORDER, BY_TIME, BY_MEMORY, BY_TYPE, }; explicit StatsCalculator(const StatSummarizerOptions& options); // Returns a string detailing the accumulated runtime stats in a tab-separated // format which can be pasted into a spreadsheet for further analysis. std::string GetOutputString() const; std::string GetShortSummary() const; void ComputeStatsByType( std::map* node_type_map_count, std::map* node_type_map_time, std::map* node_type_map_memory, std::map* node_type_map_times_called, int64_t* accumulated_us) const; std::string GetStatsByNodeType() const; std::string GetStatsByMetric(const std::string& title, SortingMetric sorting_metric, int num_stats) const; // Returns number of runs. int num_runs() const { return static_cast(run_total_us_.count()); } // Returns stats of total microseconds spent by all nodes in each run. const Stat& run_total_us() const { return run_total_us_; } void UpdateRunTotalUs(int64_t run_total_us) { run_total_us_.UpdateStat(run_total_us); } void UpdateMemoryUsed(int64_t memory) { memory_.UpdateStat(memory); } struct Detail { std::string name; std::string type; int64_t run_order; Stat start_us; Stat rel_end_us; Stat mem_used; int64_t times_called; }; const std::map& GetDetails() const { return details_; } void AddNodeStats(const std::string& name, const std::string& type, int64_t run_order, int64_t start_us, int64_t rel_end_us, int64_t mem_used); private: void OrderNodesByMetric(SortingMetric sorting_metric, std::vector* details) const; std::string HeaderString(const std::string& title) const; std::string ColumnString(const Detail& detail, const int64_t cumulative_stat_on_node, const Stat& stat) const; Stat run_total_us_; Stat memory_; std::map details_; StatSummarizerOptions options_; }; } // namespace tensorflow #endif // TENSORFLOW_CORE_UTIL_STATS_CALCULATOR_H_