diff options
author | 2017-07-21 09:22:31 -0700 | |
---|---|---|
committer | 2017-07-21 09:38:31 -0700 | |
commit | 3e3306ef0009b5b21050139f9b8e5f4868c4c0c7 (patch) | |
tree | c7e25f278d93e9ce1ab9e2984df7b97c0f27c6d0 /tensorflow/core/util/matmul_autotune.cc | |
parent | 4729180d24af3126d736a7045c43fcbf031b5bef (diff) |
Let GetBlasGemmAlgorithms() always return true.
PiperOrigin-RevId: 162748507
Diffstat (limited to 'tensorflow/core/util/matmul_autotune.cc')
-rw-r--r-- | tensorflow/core/util/matmul_autotune.cc | 51 |
1 files changed, 51 insertions, 0 deletions
diff --git a/tensorflow/core/util/matmul_autotune.cc b/tensorflow/core/util/matmul_autotune.cc new file mode 100644 index 0000000000..741a78a193 --- /dev/null +++ b/tensorflow/core/util/matmul_autotune.cc @@ -0,0 +1,51 @@ +/* Copyright 2015 The TensorFlow Authors. All Rights Reserved. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. +==============================================================================*/ + +#include "tensorflow/core/util/matmul_autotune.h" + +#include "tensorflow/core/framework/types.h" +#include "tensorflow/core/lib/core/stringpiece.h" +#include "tensorflow/core/util/env_var.h" + +namespace tensorflow { +bool MatmulAutotuneEnable() { + bool value; + Status status = + ReadBoolFromEnvVar("TF_MATMUL_AUTOTUNE_ENABLE", false, &value); + if (!status.ok()) { + LOG(ERROR) << status.error_message(); + } + return value; +} + +bool MatmulDoFP32ComputationFP16Input() { + bool value; + // Feedback from NVIDIA: the "true floating point 16" compute capability is + // absent from compute capability SM 5.2. The native 16 bit floating point + // computation was introduced in SM 5.3 and higher compute capability. So + // for compatibility, set this to be true by default for now. + // TODO(yangzihao): In the future, we need to return three possibilities: + // user-set-true, user-set-false, user-no-setting. In the calling sites, + // check the compatibilities. Note that user-set-false with compute + // capability <= 5.2 will cause an error in the later cublasGemmEx() call. + Status status = + ReadBoolFromEnvVar("TF_FP16_MATMUL_USE_FP32_COMPUTE", true, &value); + if (!status.ok()) { + LOG(ERROR) << status.error_message(); + } + return value; +} + +} // namespace tensorflow |