blob: 9675d2940c32a3a18d7d2f650a9dcd6bbdd56e62 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
|
// This file contains declarations relating to kernel cache configuration
// parameters recognized by the StreamExecutor.
#ifndef TENSORFLOW_STREAM_EXECUTOR_KERNEL_CACHE_CONFIG_H_
#define TENSORFLOW_STREAM_EXECUTOR_KERNEL_CACHE_CONFIG_H_
namespace perftools {
namespace gputools {
// This enum represents potential configurations of L1/shared memory when
// running a particular kernel. These values represent user preference, and
// the runtime is not required to respect these choices.
enum class KernelCacheConfig {
// Indicates no preference for device L1/shared memory configuration.
kNoPreference,
// Indicates a preference for more shared memory than L1 cache.
kPreferShared,
// Indicates a preference for more L1 cache than shared memory.
kPreferL1,
// Indicates a preference for equal amounts of L1 cache and shared memory.
kPreferEqual,
};
} // namespace gputools
} // namespace perftools
#endif // TENSORFLOW_STREAM_EXECUTOR_KERNEL_CACHE_CONFIG_H_
|