aboutsummaryrefslogtreecommitdiffhomepage
path: root/tensorflow/core/util/matmul_autotune.cc
diff options
context:
space:
mode:
authorGravatar Yangzihao Wang <yangzihao@google.com>2017-07-21 09:22:31 -0700
committerGravatar TensorFlower Gardener <gardener@tensorflow.org>2017-07-21 09:38:31 -0700
commit3e3306ef0009b5b21050139f9b8e5f4868c4c0c7 (patch)
treec7e25f278d93e9ce1ab9e2984df7b97c0f27c6d0 /tensorflow/core/util/matmul_autotune.cc
parent4729180d24af3126d736a7045c43fcbf031b5bef (diff)
Let GetBlasGemmAlgorithms() always return true.
PiperOrigin-RevId: 162748507
Diffstat (limited to 'tensorflow/core/util/matmul_autotune.cc')
-rw-r--r--tensorflow/core/util/matmul_autotune.cc51
1 files changed, 51 insertions, 0 deletions
diff --git a/tensorflow/core/util/matmul_autotune.cc b/tensorflow/core/util/matmul_autotune.cc
new file mode 100644
index 0000000000..741a78a193
--- /dev/null
+++ b/tensorflow/core/util/matmul_autotune.cc
@@ -0,0 +1,51 @@
+/* Copyright 2015 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#include "tensorflow/core/util/matmul_autotune.h"
+
+#include "tensorflow/core/framework/types.h"
+#include "tensorflow/core/lib/core/stringpiece.h"
+#include "tensorflow/core/util/env_var.h"
+
+namespace tensorflow {
+bool MatmulAutotuneEnable() {
+ bool value;
+ Status status =
+ ReadBoolFromEnvVar("TF_MATMUL_AUTOTUNE_ENABLE", false, &value);
+ if (!status.ok()) {
+ LOG(ERROR) << status.error_message();
+ }
+ return value;
+}
+
+bool MatmulDoFP32ComputationFP16Input() {
+ bool value;
+ // Feedback from NVIDIA: the "true floating point 16" compute capability is
+ // absent from compute capability SM 5.2. The native 16 bit floating point
+ // computation was introduced in SM 5.3 and higher compute capability. So
+ // for compatibility, set this to be true by default for now.
+ // TODO(yangzihao): In the future, we need to return three possibilities:
+ // user-set-true, user-set-false, user-no-setting. In the calling sites,
+ // check the compatibilities. Note that user-set-false with compute
+ // capability <= 5.2 will cause an error in the later cublasGemmEx() call.
+ Status status =
+ ReadBoolFromEnvVar("TF_FP16_MATMUL_USE_FP32_COMPUTE", true, &value);
+ if (!status.ok()) {
+ LOG(ERROR) << status.error_message();
+ }
+ return value;
+}
+
+} // namespace tensorflow