author    A. Unique TensorFlower <nobody@tensorflow.org>  2016-02-25 10:37:06 -0800
committer TensorFlower Gardener <gardener@tensorflow.org>  2016-02-25 11:15:46 -0800
commit    9ccc4b6afe4defa748de89eac90ba1062232bb5a (patch)
tree      ea5f3577c2dcc0986f7ab47f97979858974075f3 /tensorflow/core/kernels/reduction_ops_common.cc
parent    63bd3efc5c9a052d605766497726120b73f5cb3c (diff)
Avoid some over-inlined routines. Reduces code size of TensorFlow binaries
considerably. Shrinks text size of example_trainer binary by ~1.5%.

Change: 115578002
Diffstat (limited to 'tensorflow/core/kernels/reduction_ops_common.cc')
-rw-r--r--  tensorflow/core/kernels/reduction_ops_common.cc | 127
1 file changed, 127 insertions, 0 deletions
diff --git a/tensorflow/core/kernels/reduction_ops_common.cc b/tensorflow/core/kernels/reduction_ops_common.cc
new file mode 100644
index 0000000000..50e0791872
--- /dev/null
+++ b/tensorflow/core/kernels/reduction_ops_common.cc
@@ -0,0 +1,127 @@
+#include "tensorflow/core/kernels/reduction_ops_common.h"
+
+namespace tensorflow {
+
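+// The shape the reduction produces; it is a reshape of the final output
+// shape returned by out_shape().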
+TensorShape ReductionHelper::out_reshape() const {
+  TensorShape shape;
+  for (auto size : out_reshape_) shape.AddDim(size);
+  return shape;
+}
+
+// The final output tensor must be allocated with this shape.
+TensorShape ReductionHelper::out_shape() const {
+  TensorShape shape;
+  for (auto size : out_shape_) shape.AddDim(size);
+  return shape;
+}
+
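+// The input shape with the collapsed dimensions arranged so that all
+// unreduced dimensions come first, followed by all reduced dimensions.
+// E.g., for data_reshape_ = {2, 3, 4, 5} with reduce_first_axis_ = true,
+// this returns [3, 5, 2, 4].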
+TensorShape ReductionHelper::shuffled_shape() {
+  const int dims = data_reshape_.size();
+  TensorShape shape;
+  for (int i = reduce_first_axis_; i < dims; i += 2) {
+    shape.AddDim(data_reshape_[i]);
+  }
+  for (int i = !reduce_first_axis_; i < dims; i += 2) {
+    shape.AddDim(data_reshape_[i]);
+  }
+  return shape;
+}
+
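+// The permutation of the collapsed dimensions that produces
+// shuffled_shape(): unreduced dimensions first, reduced dimensions last.
+// For the four-dimensional example above it returns {1, 3, 0, 2}.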
+gtl::InlinedVector<int32, 8> ReductionHelper::permutation() {
+  const int dims = data_reshape_.size();
+  const int unreduced_dims = (dims + !reduce_first_axis_) / 2;
+  gtl::InlinedVector<int32, 8> perm(dims);
+  for (int i = 0; i < unreduced_dims; i++) {
+    perm[i] = 2 * i + reduce_first_axis_;
+  }
+  for (int i = unreduced_dims; i < dims; i++) {
+    perm[i] = 2 * (i - unreduced_dims) + !reduce_first_axis_;
+  }
+  return perm;
+}
+
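+// Collapses adjacent input dimensions into runs that are either entirely
+// reduced or entirely unreduced, so that the actual reduction runs on a
+// tensor of the smallest possible rank. Fills in data_reshape_,
+// out_reshape_, and out_shape_.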
+Status ReductionHelper::Simplify(const Tensor& data, const Tensor& axis,
+                                 const bool keep_dims) {
+  // bitmap[i] indicates whether to reduce data along i-th axis.
+  gtl::InlinedVector<bool, 4> bitmap(data.dims(), false);
+  auto axis_vec = axis.flat<int32>();
+  for (int64 i = 0; i < axis.NumElements(); ++i) {
+    const int32 index = axis_vec(i);
+    if (index < 0 || index >= data.dims()) {
+      return errors::OutOfRange("Invalid reduction dimension ", index,
+                                " for input with ", data.dims(),
+                                " dimension(s)");
+    }
+    bitmap[index] = true;
+  }
+
+  // Output tensor's dim sizes.
+  out_shape_.clear();
+  for (int i = 0; i < data.dims(); ++i) {
+    if (!bitmap[i]) {
+      // If we are not reducing along dimension i.
+      out_shape_.push_back(data.dim_size(i));
+    } else if (keep_dims) {
+      // We are reducing along dimension i, but we want to keep the
+      // same number of dimensions, so we set dimension i's size to 1.
+      out_shape_.push_back(1);
+    }
+  }
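+  // E.g., reducing a [2, 3, 5] input along axis 1 yields out_shape_ =
+  // {2, 5}, or {2, 1, 5} when keep_dims is true.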
+
+  // Depending on bitmap[i] and bitmap[i-1], we can collapse adjacent
+  // axes of the input data before doing the reduction on the resulting
+  // tensor. The shape of the reduction is then a reshape of the final
+  // output.
+
+  // We'll skip the leading 1s.
+  int dim_index = 0;
+  for (; dim_index < data.dims(); ++dim_index) {
+    if (data.dim_size(dim_index) != 1) break;
+  }
+  if (dim_index >= data.dims()) {
+    // Special case. The input is essentially a scalar.
+    reduce_first_axis_ = true;
+  } else {
+    // Starting from the (dim_index)-th dimension, dimensions
+    // alternate between runs that need to be reduced and runs that
+    // don't.
+    //
+    // NOTE: If a dimension has size 1, we group it into the current
+    // run so that we minimize the number of runs.
+    //
+    // E.g., to reduce a tensor of shape [2, 1, 3, 1, 5] along
+    // axes = [1, 4], we can treat the tensor as one of shape [6, 5]
+    // and reduce along axes = [1] (i.e., the output has shape [6]).
+    reduce_first_axis_ = bitmap[dim_index];
+    data_reshape_.push_back(data.dim_size(dim_index));
+    ++dim_index;
+    for (; dim_index < data.dims(); ++dim_index) {
+      const auto size = data.dim_size(dim_index);
+      if (size == 1) {
+        bitmap[dim_index] = bitmap[dim_index - 1];
+      }
+      if (bitmap[dim_index - 1] != bitmap[dim_index]) {
+        // Starts a new run of reduce or !reduce.
+        data_reshape_.push_back(size);
+      } else {
+        // Continues a run of reduce or !reduce.
+        data_reshape_.back() *= size;
+      }
+    }
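+    // For the [2, 1, 3, 1, 5] example above, this loop leaves
+    // data_reshape_ = {6, 5} with reduce_first_axis_ = false.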
+    // If reduce_first_axis_ is true (i.e., the input's dimensions 0, 2,
+    // 4, ... are reduced), out_reshape_ is data_reshape_[1, 3, 5, ...];
+    // otherwise it is data_reshape_[0, 2, 4, ...].
+    for (size_t i = reduce_first_axis_ ? 1 : 0; i < data_reshape_.size();
+         i += 2) {
+      out_reshape_.push_back(data_reshape_[i]);
+    }
+  }
+
+  VLOG(1) << "data reshape: " << str_util::Join(data_reshape_, ",");
+  VLOG(1) << "out reshape: " << str_util::Join(out_reshape_, ",");
+  VLOG(1) << "out shape: " << str_util::Join(out_shape_, ",");
+  return Status::OK();
+}
+
+}  // namespace tensorflow
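
For reference, here is a minimal sketch (not part of the commit, with a hypothetical driver function SimplifyExample) of exercising Simplify on the [2, 1, 3, 1, 5] example from the comments above. It assumes ReductionHelper is default-constructible, as its declaration in reduction_ops_common.h suggests:

    #include "tensorflow/core/framework/tensor.h"
    #include "tensorflow/core/kernels/reduction_ops_common.h"
    #include "tensorflow/core/lib/core/status.h"

    namespace tensorflow {

    // Hypothetical driver: reduce a [2, 1, 3, 1, 5] tensor along axes 1 and 4.
    void SimplifyExample() {
      Tensor data(DT_FLOAT, TensorShape({2, 1, 3, 1, 5}));
      Tensor axis(DT_INT32, TensorShape({2}));
      axis.vec<int32>()(0) = 1;
      axis.vec<int32>()(1) = 4;

      ReductionHelper helper;
      TF_CHECK_OK(helper.Simplify(data, axis, /*keep_dims=*/false));
      // The helper now views the input as a [6, 5] tensor whose second
      // axis is reduced: out_reshape() is [6] and out_shape() is [2, 3].
    }

    }  // namespace tensorflow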