1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
|
// See docs in ../ops/attention_ops.cc.
#define EIGEN_USE_THREADS
#include "tensorflow/core/platform/port.h"
#include "tensorflow/core/framework/op.h"
#include "tensorflow/core/framework/op_kernel.h"
#include "tensorflow/core/framework/types.h"
#include "tensorflow/core/platform/logging.h"
#include "tensorflow/core/public/tensor.h"
#include "tensorflow/core/public/tensor_shape.h"
#include "third_party/eigen3/unsupported/Eigen/CXX11/NeuralNetworks"
namespace tensorflow {
class ExtractGlimpseOp : public OpKernel {
public:
explicit ExtractGlimpseOp(OpKernelConstruction* context) : OpKernel(context) {
OP_REQUIRES_OK(context, context->GetAttr("normalized", &normalized_));
OP_REQUIRES_OK(context, context->GetAttr("centered", ¢ered_));
OP_REQUIRES_OK(context, context->GetAttr("uniform_noise", &uniform_noise_));
}
// Expect input tensor of rank 4 with dimensions (batch_size, height, width,
// depth).
void Compute(OpKernelContext* context) override {
const Tensor& input = context->input(0);
const TensorShape input_shape = input.shape();
const int32 num_dims = input_shape.dims();
OP_REQUIRES(
context, num_dims == 4,
errors::InvalidArgument(
"input must be 4-dimensional (batch_size, height, width, depth)",
input_shape.ShortDebugString()));
const int64 batch_size = input_shape.dim_size(0);
const Tensor& window_size = context->input(1);
OP_REQUIRES(context, (window_size.shape().dims() == 1) &&
window_size.shape().dim_size(0) == 2,
errors::InvalidArgument(
"input must be a vector of size 2 (height, width)",
window_size.shape().ShortDebugString()));
const int64 output_height = window_size.tensor<int, 1>()(0);
const int64 output_width = window_size.tensor<int, 1>()(1);
TensorShape output_shape = input_shape;
output_shape.set_dim(1, output_height);
output_shape.set_dim(2, output_width);
const Tensor& offsets = context->input(2);
OP_REQUIRES(context, offsets.shape().dims() == 2,
errors::InvalidArgument("input must be a matrix",
offsets.shape().ShortDebugString()));
OP_REQUIRES(context, offsets.shape().dim_size(0) == batch_size,
errors::InvalidArgument("first dimension should be batch",
offsets.shape().ShortDebugString()));
OP_REQUIRES(
context, offsets.shape().dim_size(1) == 2,
errors::InvalidArgument("second dimension should be of size 2 (y,x)",
offsets.shape().ShortDebugString()));
Tensor* output = nullptr;
OP_REQUIRES_OK(context, context->allocate_output(0, output_shape, &output));
std::vector<Eigen::IndexPair<float> > offset_vec;
offset_vec.reserve(batch_size);
for (int i = 0; i < batch_size; ++i) {
float offset_y = offsets.tensor<float, 2>()(i, 0);
float offset_x = offsets.tensor<float, 2>()(i, 1);
// Eigen::ExtractGlimpses expects offsets as (x,y), whereas the
// calling TensorFlow operates with (y,x) as indices.
offset_vec.push_back(Eigen::IndexPair<float>(offset_x, offset_y));
}
output->tensor<float, 4>().swap_layout().device(
context->eigen_cpu_device()) =
Eigen::ExtractGlimpses(input.tensor<float, 4>().swap_layout(),
output_width, output_height, offset_vec,
normalized_, centered_, uniform_noise_);
}
private:
bool normalized_;
bool centered_;
bool uniform_noise_;
};
REGISTER_KERNEL_BUILDER(Name("ExtractGlimpse").Device(DEVICE_CPU),
ExtractGlimpseOp);
} // end namespace tensorflow
|