aboutsummaryrefslogtreecommitdiffhomepage
path: root/third_party/sycl/crosstool/computecpp.tpl
blob: 8b0a7a7d4ad70b7d7ae9cfdd39a930eab4957072 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
#!/usr/bin/env python

import os
import sys
import tempfile
from subprocess import call, Popen, PIPE

CPU_CXX_COMPILER = ('%{host_cxx_compiler}')
CPU_C_COMPILER = ('%{host_c_compiler}')

CURRENT_DIR = os.path.dirname(sys.argv[0])
COMPUTECPP_ROOT = CURRENT_DIR + '/../sycl/'
COMPUTECPP_DRIVER= COMPUTECPP_ROOT + 'bin/compute++'
COMPUTECPP_INCLUDE = COMPUTECPP_ROOT + 'include'

def main():
  remove_flags = ('-Wl,--no-undefined', '-Wno-unused-but-set-variable', '-Wignored-attributes')
  # remove -fsanitize-coverage from string with g++
  if 'g++' in CPU_CXX_COMPILER:
    remove_flags += ('-fsanitize-coverage',)
  compiler_flags = [flag for flag in sys.argv[1:] if not flag.startswith(remove_flags)]

  output_file_index = compiler_flags.index('-o') + 1
  output_file_name = compiler_flags[output_file_index]

  if output_file_index == 1:
    # we are linking
    return call([CPU_CXX_COMPILER] + compiler_flags + ['-Wl,--no-undefined'])

  # find what we compile
  compiling_cpp = False
  if '-c' in compiler_flags:
    compiled_file_index = compiler_flags.index('-c') + 1
    compiled_file_name = compiler_flags[compiled_file_index]
    compiling_cpp = compiled_file_name.endswith(('.cc', '.c++', '.cpp', '.CPP', '.C', '.cxx'))

  # add -D_GLIBCXX_USE_CXX11_ABI=0 to the command line if you have custom installation of GCC/Clang
  compiler_flags = compiler_flags + ['-DEIGEN_USE_SYCL=1', '-DTENSORFLOW_USE_SYCL', '-DEIGEN_HAS_C99_MATH']

  if not compiling_cpp:
    # compile for C
    return call([CPU_C_COMPILER] + compiler_flags)

  # create a blacklist of folders that will be skipped when compiling with ComputeCpp
  skip_extensions = [".cu.cc"]
  skip_folders = ["tensorflow/compiler", "tensorflow/docs_src", "third_party", "external", "hexagon"]
  skip_folders = [(folder + '/') for folder in skip_folders]
  # if compiling external project skip computecpp
  if any(compiled_file_name.endswith(_ext) for _ext in skip_extensions) or any(_folder in output_file_name for _folder in skip_folders):
    return call([CPU_CXX_COMPILER] + compiler_flags)

  # this is an optimisation that will check if compiled file has to be compiled with ComputeCpp
  flags_without_output = list(compiler_flags)
  del flags_without_output[output_file_index]   # remove output_file_name
  del flags_without_output[output_file_index - 1] # remove '-o'
  # create preprocessed of the file and store it for later use
  pipe = Popen([CPU_CXX_COMPILER] + flags_without_output + ["-E"], stdout=PIPE)
  preprocessed_file_str = pipe.communicate()[0]
  if pipe.returncode != 0:
    return pipe.returncode

  # check if it has parallel_for in it
  if not '.parallel_for' in preprocessed_file_str:
    # call CXX compiler like usual
    with tempfile.NamedTemporaryFile(suffix=".ii") as preprocessed_file: # Force '.ii' extension so that g++ does not preprocess the file again
      preprocessed_file.write(preprocessed_file_str)
      preprocessed_file.flush()
      compiler_flags[compiled_file_index] = preprocessed_file.name
      return call([CPU_CXX_COMPILER] + compiler_flags)
  del preprocessed_file_str   # save some memory as this string can be quite big

  filename, file_extension = os.path.splitext(output_file_name)
  bc_out = filename + '.sycl'

  # strip asan for the device
  computecpp_device_compiler_flags = ['-sycl-compress-name', '-Wno-unused-variable',
                                      '-I', COMPUTECPP_INCLUDE, '-isystem', COMPUTECPP_INCLUDE,
                                      '-std=c++11', '-sycl', '-emit-llvm', '-no-serial-memop',
                                      '-Xclang', '-cl-denorms-are-zero', '-Xclang', '-cl-fp32-correctly-rounded-divide-sqrt']
  # disable flags enabling SIMD instructions
  computecpp_device_compiler_flags += [flag for flag in compiler_flags if \
    not any(x in flag.lower() for x in ('-fsanitize', '-fno-canonical-system-headers', '=native', '=core2', 'msse', 'vectorize', 'mavx', 'mmmx', 'm3dnow', 'fma'))]

  x = call([COMPUTECPP_DRIVER] + computecpp_device_compiler_flags)
  if x == 0:
    # dont want that in case of compiling with computecpp first
    host_compiler_flags = [flag for flag in compiler_flags if (not flag.startswith(('-MF', '-MD',)) and not '.d' in flag)]
    host_compiler_flags[host_compiler_flags.index('-c')] = "--include"
    host_compiler_flags = ['-xc++', '-Wno-unused-variable', '-I', COMPUTECPP_INCLUDE, '-c', bc_out] + host_compiler_flags
    x = call([CPU_CXX_COMPILER] + host_compiler_flags)
  return x

if __name__ == '__main__':
  sys.exit(main())