aboutsummaryrefslogtreecommitdiffhomepage
path: root/tensorflow/stream_executor/executor_cache.h
blob: f814def9cc0ab6fc5bfa611fa1acbd04b53f240e (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
/* Copyright 2015 Google Inc. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
==============================================================================*/

#ifndef TENSORFLOW_STREAM_EXECUTOR_EXECUTOR_CACHE_H_
#define TENSORFLOW_STREAM_EXECUTOR_EXECUTOR_CACHE_H_

#include "tensorflow/stream_executor/lib/status.h"
#include "tensorflow/stream_executor/lib/statusor.h"
#include "tensorflow/stream_executor/stream_executor_pimpl.h"

namespace perftools {
namespace gputools {

// Utility class to allow Platform objects to manage cached StreamExecutors.
class ExecutorCache {
 public:
  ExecutorCache() {}

  // Inserts a new StreamExecutor with the given configuration into the cache.
  // Will not overwrite if called when a matching element is already present.
  port::Status Insert(const StreamExecutorConfig& config,
                      std::unique_ptr<StreamExecutor> executor);

  // Returns a pointer to the described executor (if one with a matching config
  // has been created), or a NOT_FOUND status.
  port::StatusOr<StreamExecutor*> Get(const StreamExecutorConfig& config);

  // Destroys all Executors and clears the cache.
  // Performs no synchronization - undefined behavior may occur if any executors
  // are active!
  void DestroyAllExecutors();

 private:
  typedef std::pair<StreamExecutorConfig, std::unique_ptr<StreamExecutor>>
      Entry;

  // Maps ordinal number to a list of cached executors for that ordinal.
  // We key off of ordinal (instead of just looking up all fields in the
  // StreamExecutorConfig) for a slight improvement in lookup time.
  std::map<int, std::vector<Entry>> cache_;

  SE_DISALLOW_COPY_AND_ASSIGN(ExecutorCache);
};

}  // namespace gputools
}  // namespace perftools

#endif  // TENSORFLOW_STREAM_EXECUTOR_EXECUTOR_CACHE_H_