about | summary | refs | log | tree | commit | diff | homepage
path: root/tensorflow/compiler
diff options
context:
space:
mode:
author: TensorFlower Gardener <gardener@tensorflow.org> 2018-10-01 21:18:17 -0700
committer: TensorFlower Gardener <gardener@tensorflow.org> 2018-10-01 21:18:17 -0700
commit 6161d8cc4d66b87ba198cb6a16d83ce317c77eff (patch)
tree 47b45fcd51a5bf0001afd30295fc6e236d563a4e /tensorflow/compiler
parent 350388fca9cb9509962ff393a9d21fb2879c9179 (diff)
parent 6a5090b086bc9d665eb9e65f05eb94cdb58baaa2 (diff)
Merge pull request #21958 from MattConley:CudaOccupancy
PiperOrigin-RevId: 215331087
Diffstat (limited to 'tensorflow/compiler')
-rw-r--r-- tensorflow/compiler/xla/service/gpu/partition_assignment.cc 9
1 files changed, 2 insertions, 7 deletions
diff --git a/tensorflow/compiler/xla/service/gpu/partition_assignment.cc b/tensorflow/compiler/xla/service/gpu/partition_assignment.cc
index cf9f102d31..375f68a159 100644
--- a/tensorflow/compiler/xla/service/gpu/partition_assignment.cc
+++ b/tensorflow/compiler/xla/service/gpu/partition_assignment.cc
@@ -62,13 +62,8 @@ LaunchDimensions CalculateLaunchDimensions(
//
// <num threads per block> * <max blocks per core> = <max threads per core>
- auto threads_per_core = device_desc.threads_per_core_limit();
- auto blocks_per_core = device_desc.blocks_per_core_limit();
- int64 threads_per_block;
- if (threads_per_core != 0 && blocks_per_core != 0) {
- threads_per_block = device_desc.threads_per_core_limit() /
- device_desc.blocks_per_core_limit();
- } else {
+ int64 threads_per_block = device_desc.threads_per_block_limit();
+ if (threads_per_block == 0) {
static std::atomic<int64> log_count{0};
if (log_count.fetch_add(1) < 8) {
LOG(WARNING) << "Attempting to calculate launch dimensions for GPU "