aboutsummaryrefslogtreecommitdiffhomepage
diff options
context:
space:
mode:
authorGravatar A. Unique TensorFlower <gardener@tensorflow.org>2017-04-05 17:17:49 -0800
committerGravatar TensorFlower Gardener <gardener@tensorflow.org>2017-04-05 18:31:39 -0700
commit88feb346baaf8a344f7c6b02f474277962081b58 (patch)
tree8225c4ceda7cc74db3c236bf4d7f9c1261420f85
parenta24c6b842d982de8a38ae5058ace91cb47ee3cef (diff)
Update ops-related pbtxt files.
Change: 152332812
-rw-r--r--tensorflow/core/ops/compat/ops_history.v1.pbtxt26
-rw-r--r--tensorflow/core/ops/ops.pbtxt33
2 files changed, 59 insertions, 0 deletions
diff --git a/tensorflow/core/ops/compat/ops_history.v1.pbtxt b/tensorflow/core/ops/compat/ops_history.v1.pbtxt
index c538a278a3..9a29487b82 100644
--- a/tensorflow/core/ops/compat/ops_history.v1.pbtxt
+++ b/tensorflow/core/ops/compat/ops_history.v1.pbtxt
@@ -1667,6 +1667,32 @@ op {
}
}
op {
+ name: "AudioSpectrogram"
+ input_arg {
+ name: "input"
+ type: DT_FLOAT
+ }
+ output_arg {
+ name: "spectrogram"
+ type: DT_FLOAT
+ }
+ attr {
+ name: "window_size"
+ type: "int"
+ }
+ attr {
+ name: "stride"
+ type: "int"
+ }
+ attr {
+ name: "magnitude_squared"
+ type: "bool"
+ default_value {
+ b: false
+ }
+ }
+}
+op {
name: "AudioSummary"
input_arg {
name: "tag"
diff --git a/tensorflow/core/ops/ops.pbtxt b/tensorflow/core/ops/ops.pbtxt
index 172bdf02e2..31341e714b 100644
--- a/tensorflow/core/ops/ops.pbtxt
+++ b/tensorflow/core/ops/ops.pbtxt
@@ -1904,6 +1904,39 @@ op {
summary: "Computes atan of x element-wise."
}
op {
+ name: "AudioSpectrogram"
+ input_arg {
+ name: "input"
+ description: "Float representation of audio data."
+ type: DT_FLOAT
+ }
+ output_arg {
+ name: "spectrogram"
+ description: "3D representation of the audio frequencies as an image."
+ type: DT_FLOAT
+ }
+ attr {
+ name: "window_size"
+ type: "int"
+ description: "How wide the input window is in samples. For the highest efficiency\nthis should be a power of two, but other values are accepted."
+ }
+ attr {
+ name: "stride"
+ type: "int"
+ description: "How widely apart the center of adjacent sample windows should be."
+ }
+ attr {
+ name: "magnitude_squared"
+ type: "bool"
+ default_value {
+ b: false
+ }
+ description: "Whether to return the squared magnitude or just the\nmagnitude. Using squared magnitude can avoid extra calculations."
+ }
+ summary: "Produces a visualization of audio data over time."
+ description: "Spectrograms are a standard way of representing audio information as a series of\nslices of frequency information, one slice for each window of time. By joining\nthese together into a sequence, they form a distinctive fingerprint of the sound\nover time.\n\nThis op expects to receive audio data as an input, stored as floats in the range\n-1 to 1, together with a window width in samples, and a stride specifying how\nfar to move the window between slices. From this it generates a three\ndimensional output. The lowest dimension has an amplitude value for each\nfrequency during that time slice. The next dimension is time, with successive\nfrequency slices. The final dimension is for the channels in the input, so a\nstereo audio input would have two here for example.\n\nThis means the layout when converted and saved as an image is rotated 90 degrees\nclockwise from a typical spectrogram. Time is descending down the Y axis, and\nthe frequency decreases from left to right.\n\nEach value in the result represents the square root of the sum of the real and\nimaginary parts of an FFT on the current window of samples. In this way, the\nlowest dimension represents the power of each frequency in the current window,\nand adjacent windows are concatenated in the next dimension.\n\nTo get a more intuitive and visual look at what this operation does, you can run\ntensorflow/examples/wav_to_spectrogram to read in an audio file and save out the\nresulting spectrogram as a PNG image."
+}
+op {
name: "AudioSummary"
input_arg {
name: "tag"