1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
|
# Description:
#   LIBXSMM is a library for small matrix-matrix multiplications that targets
#   Intel Architecture (x86).

# License category is "notice"; the project itself is BSD 3-clause licensed.
licenses(["notice"])

# Let other packages refer to the LICENSE file by label.
exports_files(["LICENSE"])
# Positional arguments passed to ./scripts/libxsmm_interface.py; that script
# holds the detailed description of each one. They are joined with single
# spaces into one command-line fragment.
libxsmm_interface_arguments = " ".join([
    "0",  # precision: SP & DP
    "1",  # prefetch: 1 (auto)
])
# Positional arguments passed to ./scripts/libxsmm_config.py; that script
# holds the detailed description of each one. The entries below are listed in
# the order the script receives them and are joined with single spaces.
libxsmm_config_arguments = " ".join([
    "0",  # ilp64: no
    "0",  # big: no
    "0",  # offload: no
    "64",  # alignment [b]
    "1",  # prefetch: 1 (auto)
    "0",  # threshold: fallback to BLAS if n*m*k above this
    "1",  # synchronize: yes
    "1",  # jit: yes
    "0",  # flags
    "1",  # alpha = 1
    "1",  # beta = 1
])
# Positional arguments passed to ./scripts/libxsmm_dispatch.py; that script
# holds the detailed description.
libxsmm_dispatch_arguments = " ".join([
    "0",  # (dummy argument)
])
# Generates the three public headers under include/ by running the Python
# helper tools and redirecting each tool's standard output into its header.
genrule(
    name = "libxsmm_headers",
    srcs = [
        "src/template/libxsmm.h",
        "src/template/libxsmm_config.h",
    ],
    outs = [
        "include/libxsmm.h",
        "include/libxsmm_config.h",
        "include/libxsmm_dispatch.h",
    ],
    # Three shell commands separated by ';', one per generated header. Every
    # command is built from space-separated pieces: tool, optional template,
    # tool arguments, and the stdout redirection to the output file.
    cmd = ";".join([
        " ".join([
            "$(location :libxsmm_interface)",
            "$(location src/template/libxsmm.h)",
            libxsmm_interface_arguments,
            ">",
            "$(location include/libxsmm.h)",
        ]),
        " ".join([
            "$(location :libxsmm_config)",
            "$(location src/template/libxsmm_config.h)",
            libxsmm_config_arguments,
            ">",
            "$(location include/libxsmm_config.h)",
        ]),
        # The dispatch tool takes no template file, only its arguments.
        " ".join([
            "$(location :libxsmm_dispatch)",
            libxsmm_dispatch_arguments,
            ">",
            "$(location include/libxsmm_dispatch.h)",
        ]),
    ]),
    tools = [
        ":libxsmm_config",
        ":libxsmm_dispatch",
        ":libxsmm_interface",
    ],
    # Only these two packages may depend on the generated headers directly.
    visibility = [
        "//tensorflow/core/kernels:__pkg__",
        "//third_party/eigen3:__pkg__",
    ],
)
# The LIBXSMM C library: the explicitly listed sources plus every
# src/generator_*.c file, compiled with AVX enabled and visible to all
# packages.
cc_library(
    name = "xsmm_avx",
    srcs = [
        "src/libxsmm_main.c",
        "src/libxsmm_dump.c",
        "src/libxsmm_malloc.c",
        "src/libxsmm_gemm.c",
        "src/libxsmm_timer.c",
        "src/libxsmm_trace.c",
        "src/libxsmm_trans.c",
        "src/libxsmm_sync.c",
        "src/libxsmm_perf.c",
        "src/libxsmm_spmdm.c",
        "src/libxsmm_dnn.c",
        "src/libxsmm_dnn_handle.c",
        "src/libxsmm_dnn_convolution_forward.c",
        "src/libxsmm_dnn_convolution_backward.c",
        "src/libxsmm_dnn_convolution_weight_update.c",
        "src/libxsmm_cpuid_x86.c",
    ] + glob(
        # Code generator sources are picked up by pattern.
        ["src/generator_*.c"],
    ),
    hdrs = [
        # Headers that ship with the sources.
        "include/libxsmm_cpuid.h",
        "include/libxsmm_dnn.h",
        "include/libxsmm_frontend.h",
        "include/libxsmm_generator.h",
        "include/libxsmm_intrinsics_x86.h",
        "include/libxsmm_macros.h",
        "include/libxsmm_malloc.h",
        "include/libxsmm_spmdm.h",
        "include/libxsmm_sync.h",
        "include/libxsmm_timer.h",
        "include/libxsmm_typedefs.h",
        # Generated headers.
        "include/libxsmm.h",
        "include/libxsmm_config.h",
        "include/libxsmm_dispatch.h",
    ],
    copts = [
        # JIT does not work without AVX anyway, and enabling it also silences
        # some CRC32 warnings.
        "-mavx",
        # The libxsmm convolution code relies heavily on VLAs.
        "-Wno-vla",
    ],
    defines = [
        "LIBXSMM_BUILD",
        "LIBXSMM_CPUID_X86_NOINLINE",
        "__BLAS=0",
    ],
    includes = [
        "include",
        "src",
        "src/template",
    ],
    visibility = ["//visibility:public"],
)
# All Python files under scripts/, bundled as one library together with
# version.txt as a runtime data file. The py_binary tools in this package
# depend on it.
py_library(
    name = "libxsmm_scripts",
    srcs = glob(
        ["scripts/*.py"],
    ),
    data = [
        "version.txt",
    ],
)
# Executable wrapper around scripts/libxsmm_interface.py; listed as a tool of
# the :libxsmm_headers genrule.
py_binary(
    name = "libxsmm_interface",
    srcs = [
        "scripts/libxsmm_interface.py",
    ],
    deps = [
        ":libxsmm_scripts",
    ],
)
# Executable wrapper around scripts/libxsmm_config.py; listed as a tool of
# the :libxsmm_headers genrule.
py_binary(
    name = "libxsmm_config",
    srcs = [
        "scripts/libxsmm_config.py",
    ],
    deps = [
        ":libxsmm_scripts",
    ],
)
# Executable wrapper around scripts/libxsmm_dispatch.py; listed as a tool of
# the :libxsmm_headers genrule.
py_binary(
    name = "libxsmm_dispatch",
    srcs = [
        "scripts/libxsmm_dispatch.py",
    ],
    deps = [
        ":libxsmm_scripts",
    ],
)
|