diff options
Diffstat (limited to 'third_party/gpus')
-rw-r--r-- | third_party/gpus/crosstool/BUILD | 28 | ||||
-rw-r--r-- | third_party/gpus/crosstool/CROSSTOOL | 146 | ||||
-rw-r--r-- | third_party/gpus/crosstool/LICENSE | 203 | ||||
-rwxr-xr-x | third_party/gpus/crosstool/clang/bin/crosstool_wrapper_driver_is_not_gcc | 316 | ||||
-rw-r--r-- | third_party/gpus/cuda/BUILD | 158 | ||||
-rw-r--r-- | third_party/gpus/cuda/LICENSE | 203 | ||||
-rwxr-xr-x | third_party/gpus/cuda/cuda_config.sh | 169 |
7 files changed, 1223 insertions, 0 deletions
diff --git a/third_party/gpus/crosstool/BUILD b/third_party/gpus/crosstool/BUILD new file mode 100644 index 0000000000..eac4dc7fad --- /dev/null +++ b/third_party/gpus/crosstool/BUILD @@ -0,0 +1,28 @@ +licenses(["restricted"]) + +package(default_visibility = ["//visibility:public"]) + +filegroup( + name = "crosstool", + srcs = ["CROSSTOOL"], + output_licenses = ["unencumbered"], +) + +cc_toolchain( + name = "cc-compiler-local", + all_files = ":empty", + compiler_files = ":empty", + cpu = "local", + dwp_files = ":empty", + dynamic_runtime_libs = [":empty"], + linker_files = ":empty", + objcopy_files = ":empty", + static_runtime_libs = [":empty"], + strip_files = ":empty", + supports_param_files = 0, +) + +filegroup( + name = "empty", + srcs = [], +) diff --git a/third_party/gpus/crosstool/CROSSTOOL b/third_party/gpus/crosstool/CROSSTOOL new file mode 100644 index 0000000000..3570c5c8a2 --- /dev/null +++ b/third_party/gpus/crosstool/CROSSTOOL @@ -0,0 +1,146 @@ +major_version: "local" +minor_version: "" +default_target_cpu: "same_as_host" + +default_toolchain { + cpu: "k8" + toolchain_identifier: "local_linux" +} +default_toolchain { + cpu: "piii" + toolchain_identifier: "local_linux" +} +default_toolchain { + cpu: "darwin" + toolchain_identifier: "local_darwin" +} + +toolchain { + abi_version: "local" + abi_libc_version: "local" + builtin_sysroot: "" + compiler: "compiler" + host_system_name: "local" + needsPic: true + supports_gold_linker: false + supports_incremental_linker: false + supports_fission: false + supports_interface_shared_objects: false + supports_normalizing_ar: false + supports_start_end_lib: false + supports_thin_archives: false + target_libc: "local" + target_cpu: "local" + target_system_name: "local" + toolchain_identifier: "local_linux" + + tool_path { name: "ar" path: "/usr/bin/ar" } + tool_path { name: "compat-ld" path: "/usr/bin/ld" } + tool_path { name: "cpp" path: "/usr/bin/cpp" } + tool_path { name: "dwp" path: "/usr/bin/dwp" } + # As part of the TensorFlow release, we place some cuda-related compilation + # files in third_party/gpus/crosstool/clang/bin, and this relative + # path, combined with the rest of our Bazel configuration causes our + # compilation to use those files. + tool_path { name: "gcc" path: "clang/bin/crosstool_wrapper_driver_is_not_gcc" } + # Use "-std=c++11" for nvcc. For consistency, force both the host compiler + # and the device compiler to use "-std=c++11". + cxx_flag: "-std=c++11" + linker_flag: "-lstdc++" + linker_flag: "-B/usr/bin/" + + # TODO(bazel-team): In theory, the path here ought to exactly match the path + # used by gcc. That works because bazel currently doesn't track files at + # absolute locations and has no remote execution, yet. However, this will need + # to be fixed, maybe with auto-detection? + cxx_builtin_include_directory: "/usr/lib/gcc/" + cxx_builtin_include_directory: "/usr/local/include" + cxx_builtin_include_directory: "/usr/include" + tool_path { name: "gcov" path: "/usr/bin/gcov" } + + # C(++) compiles invoke the compiler (as that is the one knowing where + # to find libraries), but we provide LD so other rules can invoke the linker. + tool_path { name: "ld" path: "/usr/bin/ld" } + + tool_path { name: "nm" path: "/usr/bin/nm" } + tool_path { name: "objcopy" path: "/usr/bin/objcopy" } + objcopy_embed_flag: "-I" + objcopy_embed_flag: "binary" + tool_path { name: "objdump" path: "/usr/bin/objdump" } + tool_path { name: "strip" path: "/usr/bin/strip" } + + # Anticipated future default. + unfiltered_cxx_flag: "-no-canonical-prefixes" + + # Make C++ compilation deterministic. Use linkstamping instead of these + # compiler symbols. + unfiltered_cxx_flag: "-Wno-builtin-macro-redefined" + unfiltered_cxx_flag: "-D__DATE__=\"redacted\"" + unfiltered_cxx_flag: "-D__TIMESTAMP__=\"redacted\"" + unfiltered_cxx_flag: "-D__TIME__=\"redacted\"" + + # Security hardening on by default. + # Conservative choice; -D_FORTIFY_SOURCE=2 may be unsafe in some cases. + # We need to undef it before redefining it as some distributions now have + # it enabled by default. + compiler_flag: "-U_FORTIFY_SOURCE" + compiler_flag: "-D_FORTIFY_SOURCE=1" + compiler_flag: "-fstack-protector" + compiler_flag: "-fPIE" + linker_flag: "-pie" + linker_flag: "-Wl,-z,relro,-z,now" + + # Enable coloring even if there's no attached terminal. Bazel removes the + # escape sequences if --nocolor is specified. This isn't supported by gcc + # on Ubuntu 14.04. + # compiler_flag: "-fcolor-diagnostics" + + # All warnings are enabled. Maybe enable -Werror as well? + compiler_flag: "-Wall" + # Enable a few more warnings that aren't part of -Wall. + compiler_flag: "-Wunused-but-set-parameter" + # But disable some that are problematic. + compiler_flag: "-Wno-free-nonheap-object" # has false positives + + # Keep stack frames for debugging, even in opt mode. + compiler_flag: "-fno-omit-frame-pointer" + + # Anticipated future default. + linker_flag: "-no-canonical-prefixes" + # Have gcc return the exit code from ld. + linker_flag: "-pass-exit-codes" + # Stamp the binary with a unique identifier. + linker_flag: "-Wl,--build-id=md5" + linker_flag: "-Wl,--hash-style=gnu" + # Gold linker only? Can we enable this by default? + # linker_flag: "-Wl,--warn-execstack" + # linker_flag: "-Wl,--detect-odr-violations" + + compilation_mode_flags { + mode: DBG + # Enable debug symbols. + compiler_flag: "-g" + } + compilation_mode_flags { + mode: OPT + + # No debug symbols. + # Maybe we should enable https://gcc.gnu.org/wiki/DebugFission for opt or + # even generally? However, that can't happen here, as it requires special + # handling in Bazel. + compiler_flag: "-g0" + + # Conservative choice for -O + # -O3 can increase binary size and even slow down the resulting binaries. + # Profile first and / or use FDO if you need better performance than this. + compiler_flag: "-O2" + + # Disable assertions + compiler_flag: "-DNDEBUG" + + # Removal of unused code and data at link time (can this increase binary size in some cases?). + compiler_flag: "-ffunction-sections" + compiler_flag: "-fdata-sections" + linker_flag: "-Wl,--gc-sections" + } +} diff --git a/third_party/gpus/crosstool/LICENSE b/third_party/gpus/crosstool/LICENSE new file mode 100644 index 0000000000..d3da228420 --- /dev/null +++ b/third_party/gpus/crosstool/LICENSE @@ -0,0 +1,203 @@ +Copyright 2015 The TensorFlow Authors. All rights reserved. + + Apache License + Version 2.0, January 2004 + http://www.apache.org/licenses/ + + TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION + + 1. Definitions. + + "License" shall mean the terms and conditions for use, reproduction, + and distribution as defined by Sections 1 through 9 of this document. + + "Licensor" shall mean the copyright owner or entity authorized by + the copyright owner that is granting the License. + + "Legal Entity" shall mean the union of the acting entity and all + other entities that control, are controlled by, or are under common + control with that entity. For the purposes of this definition, + "control" means (i) the power, direct or indirect, to cause the + direction or management of such entity, whether by contract or + otherwise, or (ii) ownership of fifty percent (50%) or more of the + outstanding shares, or (iii) beneficial ownership of such entity. + + "You" (or "Your") shall mean an individual or Legal Entity + exercising permissions granted by this License. + + "Source" form shall mean the preferred form for making modifications, + including but not limited to software source code, documentation + source, and configuration files. + + "Object" form shall mean any form resulting from mechanical + transformation or translation of a Source form, including but + not limited to compiled object code, generated documentation, + and conversions to other media types. + + "Work" shall mean the work of authorship, whether in Source or + Object form, made available under the License, as indicated by a + copyright notice that is included in or attached to the work + (an example is provided in the Appendix below). + + "Derivative Works" shall mean any work, whether in Source or Object + form, that is based on (or derived from) the Work and for which the + editorial revisions, annotations, elaborations, or other modifications + represent, as a whole, an original work of authorship. For the purposes + of this License, Derivative Works shall not include works that remain + separable from, or merely link (or bind by name) to the interfaces of, + the Work and Derivative Works thereof. + + "Contribution" shall mean any work of authorship, including + the original version of the Work and any modifications or additions + to that Work or Derivative Works thereof, that is intentionally + submitted to Licensor for inclusion in the Work by the copyright owner + or by an individual or Legal Entity authorized to submit on behalf of + the copyright owner. For the purposes of this definition, "submitted" + means any form of electronic, verbal, or written communication sent + to the Licensor or its representatives, including but not limited to + communication on electronic mailing lists, source code control systems, + and issue tracking systems that are managed by, or on behalf of, the + Licensor for the purpose of discussing and improving the Work, but + excluding communication that is conspicuously marked or otherwise + designated in writing by the copyright owner as "Not a Contribution." + + "Contributor" shall mean Licensor and any individual or Legal Entity + on behalf of whom a Contribution has been received by Licensor and + subsequently incorporated within the Work. + + 2. Grant of Copyright License. Subject to the terms and conditions of + this License, each Contributor hereby grants to You a perpetual, + worldwide, non-exclusive, no-charge, royalty-free, irrevocable + copyright license to reproduce, prepare Derivative Works of, + publicly display, publicly perform, sublicense, and distribute the + Work and such Derivative Works in Source or Object form. + + 3. Grant of Patent License. Subject to the terms and conditions of + this License, each Contributor hereby grants to You a perpetual, + worldwide, non-exclusive, no-charge, royalty-free, irrevocable + (except as stated in this section) patent license to make, have made, + use, offer to sell, sell, import, and otherwise transfer the Work, + where such license applies only to those patent claims licensable + by such Contributor that are necessarily infringed by their + Contribution(s) alone or by combination of their Contribution(s) + with the Work to which such Contribution(s) was submitted. If You + institute patent litigation against any entity (including a + cross-claim or counterclaim in a lawsuit) alleging that the Work + or a Contribution incorporated within the Work constitutes direct + or contributory patent infringement, then any patent licenses + granted to You under this License for that Work shall terminate + as of the date such litigation is filed. + + 4. Redistribution. You may reproduce and distribute copies of the + Work or Derivative Works thereof in any medium, with or without + modifications, and in Source or Object form, provided that You + meet the following conditions: + + (a) You must give any other recipients of the Work or + Derivative Works a copy of this License; and + + (b) You must cause any modified files to carry prominent notices + stating that You changed the files; and + + (c) You must retain, in the Source form of any Derivative Works + that You distribute, all copyright, patent, trademark, and + attribution notices from the Source form of the Work, + excluding those notices that do not pertain to any part of + the Derivative Works; and + + (d) If the Work includes a "NOTICE" text file as part of its + distribution, then any Derivative Works that You distribute must + include a readable copy of the attribution notices contained + within such NOTICE file, excluding those notices that do not + pertain to any part of the Derivative Works, in at least one + of the following places: within a NOTICE text file distributed + as part of the Derivative Works; within the Source form or + documentation, if provided along with the Derivative Works; or, + within a display generated by the Derivative Works, if and + wherever such third-party notices normally appear. The contents + of the NOTICE file are for informational purposes only and + do not modify the License. You may add Your own attribution + notices within Derivative Works that You distribute, alongside + or as an addendum to the NOTICE text from the Work, provided + that such additional attribution notices cannot be construed + as modifying the License. + + You may add Your own copyright statement to Your modifications and + may provide additional or different license terms and conditions + for use, reproduction, or distribution of Your modifications, or + for any such Derivative Works as a whole, provided Your use, + reproduction, and distribution of the Work otherwise complies with + the conditions stated in this License. + + 5. Submission of Contributions. Unless You explicitly state otherwise, + any Contribution intentionally submitted for inclusion in the Work + by You to the Licensor shall be under the terms and conditions of + this License, without any additional terms or conditions. + Notwithstanding the above, nothing herein shall supersede or modify + the terms of any separate license agreement you may have executed + with Licensor regarding such Contributions. + + 6. Trademarks. This License does not grant permission to use the trade + names, trademarks, service marks, or product names of the Licensor, + except as required for reasonable and customary use in describing the + origin of the Work and reproducing the content of the NOTICE file. + + 7. Disclaimer of Warranty. Unless required by applicable law or + agreed to in writing, Licensor provides the Work (and each + Contributor provides its Contributions) on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or + implied, including, without limitation, any warranties or conditions + of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A + PARTICULAR PURPOSE. You are solely responsible for determining the + appropriateness of using or redistributing the Work and assume any + risks associated with Your exercise of permissions under this License. + + 8. Limitation of Liability. In no event and under no legal theory, + whether in tort (including negligence), contract, or otherwise, + unless required by applicable law (such as deliberate and grossly + negligent acts) or agreed to in writing, shall any Contributor be + liable to You for damages, including any direct, indirect, special, + incidental, or consequential damages of any character arising as a + result of this License or out of the use or inability to use the + Work (including but not limited to damages for loss of goodwill, + work stoppage, computer failure or malfunction, or any and all + other commercial damages or losses), even if such Contributor + has been advised of the possibility of such damages. + + 9. Accepting Warranty or Additional Liability. While redistributing + the Work or Derivative Works thereof, You may choose to offer, + and charge a fee for, acceptance of support, warranty, indemnity, + or other liability obligations and/or rights consistent with this + License. However, in accepting such obligations, You may act only + on Your own behalf and on Your sole responsibility, not on behalf + of any other Contributor, and only if You agree to indemnify, + defend, and hold each Contributor harmless for any liability + incurred by, or claims asserted against, such Contributor by reason + of your accepting any such warranty or additional liability. + + END OF TERMS AND CONDITIONS + + APPENDIX: How to apply the Apache License to your work. + + To apply the Apache License to your work, attach the following + boilerplate notice, with the fields enclosed by brackets "[]" + replaced with your own identifying information. (Don't include + the brackets!) The text should be enclosed in the appropriate + comment syntax for the file format. We also recommend that a + file or class name and description of purpose be included on the + same "printed page" as the copyright notice for easier + identification within third-party archives. + + Copyright 2015, The TensorFlow Authors. + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. diff --git a/third_party/gpus/crosstool/clang/bin/crosstool_wrapper_driver_is_not_gcc b/third_party/gpus/crosstool/clang/bin/crosstool_wrapper_driver_is_not_gcc new file mode 100755 index 0000000000..0f419a8b61 --- /dev/null +++ b/third_party/gpus/crosstool/clang/bin/crosstool_wrapper_driver_is_not_gcc @@ -0,0 +1,316 @@ +#!/usr/bin/env python2 + +"""Crosstool wrapper for compiling CUDA programs. + +SYNOPSIS: + crosstool_wrapper_is_not_gcc [options passed in by cc_library() + or cc_binary() rule] + +DESCRIPTION: + This script is expected to be called by the cc_library() or cc_binary() bazel + rules. When the option "-x cuda" is present in the list of arguments passed + to this script, it invokes the nvcc CUDA compiler. Most arguments are passed + as is as a string to --compiler-options of nvcc. When "-x cuda" is not + present, this wrapper invokes hybrid_driver_is_not_gcc with the input + arguments as is. + +NOTES: + Changes to the contents of this file must be propagated from + //third_party/gpus/crosstool/crosstool_wrapper_is_not_gcc to + //third_party/gpus/crosstool/v*/*/clang/bin/crosstool_wrapper_is_not_gcc +""" + +__author__ = 'keveman@google.com (Manjunath Kudlur)' + +from argparse import ArgumentParser +import os +import subprocess +import re +import sys +import pipes + +CURRENT_DIR = os.path.dirname(sys.argv[0]) +CPU_COMPILER = ('/usr/bin/gcc') +NVCC_PATH = CURRENT_DIR + '/../../../cuda/bin/nvcc' +GCC_HOST_COMPILER_PATH = ('/usr/bin/gcc') +LLVM_HOST_COMPILER_PATH = ('/usr/bin/gcc') +PREFIX_DIR = os.path.dirname(GCC_HOST_COMPILER_PATH) + + +def Log(s): + print 'gpus/crosstool: {0}'.format(s) + + +def GetOptionValue(argv, option): + """Extract the list of values for option from the argv list. + + Args: + argv: A list of strings, possibly the argv passed to main(). + option: The option whose value to extract, without the leading '-'. + + Returns: + A list of values, either directly following the option, + (eg., -opt val1 val2) or values collected from multiple occurrences of + the option (eg., -opt val1 -opt val2). + """ + + parser = ArgumentParser() + parser.add_argument('-' + option, nargs='*', action='append') + args, _ = parser.parse_known_args(argv) + if not args or not vars(args)[option]: + return [] + else: + return sum(vars(args)[option], []) + + +def GetHostCompilerOptions(argv): + """Collect the -isystem, -iquote, and --sysroot option values from argv. + + Args: + argv: A list of strings, possibly the argv passed to main(). + + Returns: + The string that can be used as the --compiler-options to nvcc. + """ + + parser = ArgumentParser() + parser.add_argument('-isystem', nargs='*', action='append') + parser.add_argument('-iquote', nargs='*', action='append') + parser.add_argument('--sysroot', nargs=1) + parser.add_argument('-g', nargs='*', action='append') + + args, _ = parser.parse_known_args(argv) + + opts = '' + # This is a temporary workaround for b/12960069. + # NVIDIA is going to fix this in CUDA 6.5, but until then this workaround + # will let us compile Thrust with the cuda crosstool. + # bazel passes all include directories as '-isystem dir' to the crosstool. + # This causes nvcc to think that there are kernel launches from system + # directories (which apparently is not supported by the compiler). This + # workaround changes '-isystem third_party/gpus/cuda/include' to + # '-iquote third_party/gpus/cuda/include'. + isystem_args = [x for x in args.isystem + if 'third_party/gpus/cuda/include' not in x] + iquote_args = (args.iquote + + [x for x in args.isystem + if 'third_party/gpus/cuda/include' in x]) + # This hack is needed so that we can compile eigen3. We need to include + # third_party/eigen3 with -I. Some eigen file include using the + # include <Eigen/Core> syntax, and -iquote doesn't work for that. + has_eigen = ['third_party/eigen3'] in isystem_args + if has_eigen: + isystem_args.remove(['third_party/eigen3']) + + if isystem_args: + opts += '-isystem ' + ' -isystem '.join(sum(isystem_args, [])) + if iquote_args: + opts += ' -iquote ' + ' -iquote '.join(sum(iquote_args, [])) + if args.g: + opts += ' -g' + ' -g'.join(sum(args.g, [])) + if args.sysroot: + opts += ' --sysroot ' + args.sysroot[0] + if has_eigen: + opts += ' -I third_party/eigen3' + + return opts + +def GetNvccOptions(argv): + """Collect the -nvcc_options values from argv. + + Args: + argv: A list of strings, possibly the argv passed to main(). + + Returns: + The string that can be passed directly to nvcc. + """ + + parser = ArgumentParser() + parser.add_argument('-nvcc_options', nargs='*', action='append') + + args, _ = parser.parse_known_args(argv) + + if args.nvcc_options: + return ' '.join(['--'+a for a in sum(args.nvcc_options, [])]) + return '' + + +def StripAndTransformNvccOptions(argv): + """Strips the -nvcc_options values from argv and transforms define-macros. + + Args: + argv: A list of strings, possibly the argv passed to main(). + + Returns: + A list of strings that can be passed directly to gcudacc. + """ + parser = ArgumentParser() + parser.add_argument('-nvcc_options', nargs='*', action='store') + args, leftover = parser.parse_known_args(argv) + if args.nvcc_options: + for option in args.nvcc_options: + (flag, _, value) = option.partition('=') + if 'define-macro' in flag: + leftover.append('-D' + value) + return leftover + + +def InvokeGcudacc(argv, gcudacc_version, gcudacc_flags, log=False): + """Call gcudacc with arguments assembled from argv. + + Args: + argv: A list of strings, possibly the argv passed to main(). + gcudacc_version: The version of gcudacc; this is a subdirectory name under + the gcudacc bin/ directory. + gcudacc_flags: A list of extra arguments passed just for gcudacc. + log: True if logging is requested. + + Returns: + The return value of calling os.system('gcudacc ' + args) + """ + + gcudacc_cmd = os.path.join(GCUDACC_PATH_BASE, gcudacc_version, 'gcudacc.par') + gcudacc_cmd = ( + gcudacc_cmd + + ' --google_host_compiler={0} '.format(LLVM_HOST_COMPILER_PATH) + + ' '.join(sum(gcudacc_flags, [])) + + ' -- ' + + ' '.join(StripAndTransformNvccOptions(argv))) + if log: Log(gcudacc_cmd) + return os.system(gcudacc_cmd) + + +def InvokeNvcc(argv, log=False): + """Call nvcc with arguments assembled from argv. + + Args: + argv: A list of strings, possibly the argv passed to main(). + log: True if logging is requested. + + Returns: + The return value of calling os.system('nvcc ' + args) + """ + + host_compiler_options = GetHostCompilerOptions(argv) + nvcc_compiler_options = GetNvccOptions(argv) + opt_option = GetOptionValue(argv, 'O') + m_options = GetOptionValue(argv, 'm') + m_options = ''.join([' -m' + m for m in m_options if m in ['32', '64']]) + include_options = GetOptionValue(argv, 'I') + out_file = GetOptionValue(argv, 'o') + depfiles = GetOptionValue(argv, 'MF') + defines = GetOptionValue(argv, 'D') + defines = ''.join([' -D' + define for define in defines]) + undefines = GetOptionValue(argv, 'U') + undefines = ''.join([' -U' + define for define in undefines]) + std_options = GetOptionValue(argv, 'std') + # currently only c++11 is supported by Cuda 7.0 std argument + nvcc_allowed_std_options = ["c++11"] + std_options = ''.join([' -std=' + define + for define in std_options if define in nvcc_allowed_std_options]) + + # The list of source files get passed after the -c option. I don't know of + # any other reliable way to just get the list of source files to be compiled. + src_files = GetOptionValue(argv, 'c') + + if len(src_files) == 0: + return 1 + if len(out_file) != 1: + return 1 + + opt = (' -O2' if (len(opt_option) > 0 and int(opt_option[0]) > 0) + else ' -g -G') + + includes = (' -I ' + ' -I '.join(include_options) + if len(include_options) > 0 + else '') + + # Unfortunately, there are other options that have -c prefix too. + # So allowing only those look like C/C++ files. + src_files = [f for f in src_files if + re.search('\.cpp$|\.cc$|\.c$|\.cxx$|\.C$', f)] + srcs = ' '.join(src_files) + out = ' -o ' + out_file[0] + + nvccopts = ' '.join([ + r'-gencode=arch=compute_35,\"code=sm_35,compute_35\"', + r'-gencode=arch=compute_52,\"code=sm_52,compute_52\"',]) + nvccopts += ' ' + nvcc_compiler_options + nvccopts += undefines + nvccopts += defines + nvccopts += std_options + nvccopts += m_options + + if depfiles: + # Generate the dependency file + depfile = depfiles[0] + cmd = (NVCC_PATH + ' ' + nvccopts + + ' --compiler-options "' + host_compiler_options + '"' + + ' --compiler-bindir=' + GCC_HOST_COMPILER_PATH + + ' -I .' + + ' -x cu ' + includes + ' ' + srcs + ' -M -o ' + depfile) + if log: Log(cmd) + exit_status = os.system(cmd) + if exit_status != 0: + return exit_status + + cmd = (NVCC_PATH + ' ' + nvccopts + + ' --compiler-options "' + host_compiler_options + ' -fPIC"' + + ' --compiler-bindir=' + GCC_HOST_COMPILER_PATH + + ' -I .' + + ' -x cu ' + opt + includes + ' -c ' + srcs + out) + + # TODO(zhengxq): for some reason, 'gcc' needs this help to find 'as'. + # Need to investigate and fix. + cmd = 'PATH=' + PREFIX_DIR + ' ' + cmd + if log: Log(cmd) + return os.system(cmd) + + +def main(): + parser = ArgumentParser() + parser.add_argument('-x', nargs=1) + parser.add_argument('--cuda_log', action='store_true') + parser.add_argument('--use_gcudacc', action='store_true') + parser.add_argument('--gcudacc_version', action='store', default='v8') + parser.add_argument('--gcudacc_flag', nargs='*', action='append', default=[]) + args, leftover = parser.parse_known_args(sys.argv[1:]) + + if args.x and args.x[0] == 'cuda': + if args.cuda_log: Log('-x cuda') + leftover = [pipes.quote(s) for s in leftover] + if args.use_gcudacc: + if args.cuda_log: Log('using gcudacc') + return InvokeGcudacc(argv=leftover, + gcudacc_version=args.gcudacc_version, + gcudacc_flags=args.gcudacc_flag, + log=args.cuda_log) + if args.cuda_log: Log('using nvcc') + return InvokeNvcc(leftover, log=args.cuda_log) + + # Strip our flags before passing through to the CPU compiler for files which + # are not -x cuda. We can't just pass 'leftover' because it also strips -x. + # We not only want to pass -x to the CPU compiler, but also keep it in its + # relative location in the argv list (the compiler is actually sensitive to + # this). + cpu_compiler_flags = [flag for flag in sys.argv[1:] + if not flag.startswith(('--cuda_log', + '--use_gcudacc', + '--gcudacc_version', + '--gcudacc_flag'))] + if args.use_gcudacc: + # This macro is defined for TUs that are not marked with "-x cuda" but are + # built as part of a -config=cuda --use_gcudacc compilation. They are + # compiled with the default CPU compiler. Since the objects built from + # these TUs are later linked with objects that come from gcudacc, some + # parts of the code need to be marked for these special cases. For example, + # some types have to be defined similarly for gcudacc-compiled TUs and + # default CPU compiler-compiled TUs linked with them, but differently when + # nvcc is used. + # TODO(eliben): rename to a more descriptive name. + cpu_compiler_flags.append('-D__GCUDACC_HOST__') + + return subprocess.call([CPU_COMPILER] + cpu_compiler_flags) + +if __name__ == '__main__': + sys.exit(main()) diff --git a/third_party/gpus/cuda/BUILD b/third_party/gpus/cuda/BUILD new file mode 100644 index 0000000000..40c048661c --- /dev/null +++ b/third_party/gpus/cuda/BUILD @@ -0,0 +1,158 @@ +licenses(["restricted"]) # MPL2, portions GPL v3, LGPL v3, BSD-like + +load("/tensorflow/tensorflow", "if_cuda") + +package(default_visibility = ["//visibility:public"]) + +config_setting( + name = "cuda_crosstool_condition", + values = {"crosstool_top": "//third_party/gpus/crosstool"}, + visibility = ["//visibility:public"], +) + +config_setting( + name = "using_gcudacc", + values = { + "crosstool_top": "//third_party/gpus/crosstool", + "copt": "--use_gcudacc", + }, + visibility = ["//visibility:public"], +) + +config_setting( + name = "using_nvcc", + values = { + "crosstool_top": "//third_party/gpus/crosstool", + "copt": "--use_nvcc", + }, +) + +cc_library( + name = "cuda_headers", + hdrs = glob([ + "**/*.h", + ]), + includes = [".", "include"], + visibility = ["//visibility:public"], +) + +cc_library( + name = "cudart_static", + srcs = [ + "lib64/libcudart_static.a", + ], + includes = ["include/"], + linkopts = [ + "-ldl", + "-lrt", + "-lpthread", + ], + visibility = ["//visibility:public"], +) + +cc_library( + name = "cudart", + srcs = [ + "lib64/libcudart.so.7.0", + ], + data = [ + "lib64/libcudart.so.7.0", + ], + includes = ["include/"], + visibility = ["//visibility:public"], + linkstatic = 1, +) + +cc_library( + name = "cublas", + srcs = [ + "lib64/libcublas.so.7.0", + ], + data = [ + "lib64/libcublas.so.7.0", + ], + includes = ["include/"], + visibility = ["//visibility:public"], + linkstatic = 1, +) + +cc_library( + name = "cudnn", + srcs = [ + "lib64/libcudnn.so.6.5", + ], + data = [ + "lib64/libcudnn.so.6.5", + ], + includes = ["include/"], + visibility = ["//visibility:public"], + linkstatic = 1, +) + +cc_library( + name = "cuda", + deps = [ + ":cuda_headers", + ":cudart", + ":cublas", + ":cudnn", + ], + visibility = ["//visibility:public"], +) + +# TODO(opensource): for now, we have to invoke the cuda_config.sh manually in the source tree. +# This rule checks if Cuda libraries in the source tree has been properly configured. +# The output list makes bazel runs this rule first if the Cuda files are missing. +# This gives us an opportunity to check and print a meaningful error message. +# But we will need to create the output file list to make bazel happy in a successfull run. +genrule( + name = "cuda_check", + srcs = [ + "cuda.config", + "cuda_config.sh", + ], + outs = [ + "include/cuda.h", + "include/cublas.h", + "include/cudnn.h", + "lib64/libcudart_static.a", + "lib64/libcublas.so.7.0", + "lib64/libcudnn.so.6.5", + "lib64/libcudart.so.7.0", + ], + cmd = if_cuda( + # Under cuda config, create all the symbolic links to the actual cuda files + "OUTPUTDIR=`readlink -f $(@D)/../../..`; cd third_party/gpus/cuda; OUTPUTDIR=$$OUTPUTDIR ./cuda_config.sh --check;", + + # Under non-cuda config, create all dummy files to make the build go through + ";".join([ + "mkdir -p $(@D)/include", + "mkdir -p $(@D)/lib64", + "touch $(@D)/include/cuda.h", + "touch $(@D)/include/cublas.h", + "touch $(@D)/include/cudnn.h", + "touch $(@D)/lib64/libcudart_static.a", + "touch $(@D)/lib64/libcublas.so.7.0", + "touch $(@D)/lib64/libcudnn.so.6.5", + "touch $(@D)/lib64/libcudart.so.7.0" + ]), + ), + local = 1, +) + +genrule( + name = "cuda_config_check", + outs = [ + "cuda.config", + ], + cmd = if_cuda( + # Under cuda config, create the symbolic link to the actual cuda.config + "ln -sf `readlink -f third_party/gpus/cuda/cuda.config` $(@D)/;", + + # Under non-cuda config, create the dummy file + ";".join([ + "touch $(@D)/cuda.config", + ]), + ), + local = 1, +) diff --git a/third_party/gpus/cuda/LICENSE b/third_party/gpus/cuda/LICENSE new file mode 100644 index 0000000000..d3da228420 --- /dev/null +++ b/third_party/gpus/cuda/LICENSE @@ -0,0 +1,203 @@ +Copyright 2015 The TensorFlow Authors. All rights reserved. + + Apache License + Version 2.0, January 2004 + http://www.apache.org/licenses/ + + TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION + + 1. Definitions. + + "License" shall mean the terms and conditions for use, reproduction, + and distribution as defined by Sections 1 through 9 of this document. + + "Licensor" shall mean the copyright owner or entity authorized by + the copyright owner that is granting the License. + + "Legal Entity" shall mean the union of the acting entity and all + other entities that control, are controlled by, or are under common + control with that entity. For the purposes of this definition, + "control" means (i) the power, direct or indirect, to cause the + direction or management of such entity, whether by contract or + otherwise, or (ii) ownership of fifty percent (50%) or more of the + outstanding shares, or (iii) beneficial ownership of such entity. + + "You" (or "Your") shall mean an individual or Legal Entity + exercising permissions granted by this License. + + "Source" form shall mean the preferred form for making modifications, + including but not limited to software source code, documentation + source, and configuration files. + + "Object" form shall mean any form resulting from mechanical + transformation or translation of a Source form, including but + not limited to compiled object code, generated documentation, + and conversions to other media types. + + "Work" shall mean the work of authorship, whether in Source or + Object form, made available under the License, as indicated by a + copyright notice that is included in or attached to the work + (an example is provided in the Appendix below). + + "Derivative Works" shall mean any work, whether in Source or Object + form, that is based on (or derived from) the Work and for which the + editorial revisions, annotations, elaborations, or other modifications + represent, as a whole, an original work of authorship. For the purposes + of this License, Derivative Works shall not include works that remain + separable from, or merely link (or bind by name) to the interfaces of, + the Work and Derivative Works thereof. + + "Contribution" shall mean any work of authorship, including + the original version of the Work and any modifications or additions + to that Work or Derivative Works thereof, that is intentionally + submitted to Licensor for inclusion in the Work by the copyright owner + or by an individual or Legal Entity authorized to submit on behalf of + the copyright owner. For the purposes of this definition, "submitted" + means any form of electronic, verbal, or written communication sent + to the Licensor or its representatives, including but not limited to + communication on electronic mailing lists, source code control systems, + and issue tracking systems that are managed by, or on behalf of, the + Licensor for the purpose of discussing and improving the Work, but + excluding communication that is conspicuously marked or otherwise + designated in writing by the copyright owner as "Not a Contribution." + + "Contributor" shall mean Licensor and any individual or Legal Entity + on behalf of whom a Contribution has been received by Licensor and + subsequently incorporated within the Work. + + 2. Grant of Copyright License. Subject to the terms and conditions of + this License, each Contributor hereby grants to You a perpetual, + worldwide, non-exclusive, no-charge, royalty-free, irrevocable + copyright license to reproduce, prepare Derivative Works of, + publicly display, publicly perform, sublicense, and distribute the + Work and such Derivative Works in Source or Object form. + + 3. Grant of Patent License. Subject to the terms and conditions of + this License, each Contributor hereby grants to You a perpetual, + worldwide, non-exclusive, no-charge, royalty-free, irrevocable + (except as stated in this section) patent license to make, have made, + use, offer to sell, sell, import, and otherwise transfer the Work, + where such license applies only to those patent claims licensable + by such Contributor that are necessarily infringed by their + Contribution(s) alone or by combination of their Contribution(s) + with the Work to which such Contribution(s) was submitted. If You + institute patent litigation against any entity (including a + cross-claim or counterclaim in a lawsuit) alleging that the Work + or a Contribution incorporated within the Work constitutes direct + or contributory patent infringement, then any patent licenses + granted to You under this License for that Work shall terminate + as of the date such litigation is filed. + + 4. Redistribution. You may reproduce and distribute copies of the + Work or Derivative Works thereof in any medium, with or without + modifications, and in Source or Object form, provided that You + meet the following conditions: + + (a) You must give any other recipients of the Work or + Derivative Works a copy of this License; and + + (b) You must cause any modified files to carry prominent notices + stating that You changed the files; and + + (c) You must retain, in the Source form of any Derivative Works + that You distribute, all copyright, patent, trademark, and + attribution notices from the Source form of the Work, + excluding those notices that do not pertain to any part of + the Derivative Works; and + + (d) If the Work includes a "NOTICE" text file as part of its + distribution, then any Derivative Works that You distribute must + include a readable copy of the attribution notices contained + within such NOTICE file, excluding those notices that do not + pertain to any part of the Derivative Works, in at least one + of the following places: within a NOTICE text file distributed + as part of the Derivative Works; within the Source form or + documentation, if provided along with the Derivative Works; or, + within a display generated by the Derivative Works, if and + wherever such third-party notices normally appear. The contents + of the NOTICE file are for informational purposes only and + do not modify the License. You may add Your own attribution + notices within Derivative Works that You distribute, alongside + or as an addendum to the NOTICE text from the Work, provided + that such additional attribution notices cannot be construed + as modifying the License. + + You may add Your own copyright statement to Your modifications and + may provide additional or different license terms and conditions + for use, reproduction, or distribution of Your modifications, or + for any such Derivative Works as a whole, provided Your use, + reproduction, and distribution of the Work otherwise complies with + the conditions stated in this License. + + 5. Submission of Contributions. Unless You explicitly state otherwise, + any Contribution intentionally submitted for inclusion in the Work + by You to the Licensor shall be under the terms and conditions of + this License, without any additional terms or conditions. + Notwithstanding the above, nothing herein shall supersede or modify + the terms of any separate license agreement you may have executed + with Licensor regarding such Contributions. + + 6. Trademarks. This License does not grant permission to use the trade + names, trademarks, service marks, or product names of the Licensor, + except as required for reasonable and customary use in describing the + origin of the Work and reproducing the content of the NOTICE file. + + 7. Disclaimer of Warranty. Unless required by applicable law or + agreed to in writing, Licensor provides the Work (and each + Contributor provides its Contributions) on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or + implied, including, without limitation, any warranties or conditions + of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A + PARTICULAR PURPOSE. You are solely responsible for determining the + appropriateness of using or redistributing the Work and assume any + risks associated with Your exercise of permissions under this License. + + 8. Limitation of Liability. In no event and under no legal theory, + whether in tort (including negligence), contract, or otherwise, + unless required by applicable law (such as deliberate and grossly + negligent acts) or agreed to in writing, shall any Contributor be + liable to You for damages, including any direct, indirect, special, + incidental, or consequential damages of any character arising as a + result of this License or out of the use or inability to use the + Work (including but not limited to damages for loss of goodwill, + work stoppage, computer failure or malfunction, or any and all + other commercial damages or losses), even if such Contributor + has been advised of the possibility of such damages. + + 9. Accepting Warranty or Additional Liability. While redistributing + the Work or Derivative Works thereof, You may choose to offer, + and charge a fee for, acceptance of support, warranty, indemnity, + or other liability obligations and/or rights consistent with this + License. However, in accepting such obligations, You may act only + on Your own behalf and on Your sole responsibility, not on behalf + of any other Contributor, and only if You agree to indemnify, + defend, and hold each Contributor harmless for any liability + incurred by, or claims asserted against, such Contributor by reason + of your accepting any such warranty or additional liability. + + END OF TERMS AND CONDITIONS + + APPENDIX: How to apply the Apache License to your work. + + To apply the Apache License to your work, attach the following + boilerplate notice, with the fields enclosed by brackets "[]" + replaced with your own identifying information. (Don't include + the brackets!) The text should be enclosed in the appropriate + comment syntax for the file format. We also recommend that a + file or class name and description of purpose be included on the + same "printed page" as the copyright notice for easier + identification within third-party archives. + + Copyright 2015, The TensorFlow Authors. + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. diff --git a/third_party/gpus/cuda/cuda_config.sh b/third_party/gpus/cuda/cuda_config.sh new file mode 100755 index 0000000000..034298590b --- /dev/null +++ b/third_party/gpus/cuda/cuda_config.sh @@ -0,0 +1,169 @@ +#!/bin/bash + +# A simple script to configure the Cuda tree needed for the TensorFlow GPU +# build. We need both Cuda toolkit 7.0 and Cudnn 6.5. +# Useage: +# * User edit cuda.config to point both Cuda toolkit and Cudnn libraries to their local path +# * run cuda_config.sh to generate symbolic links in the source tree to reflect +# * the file organizations needed by TensorFlow. + +print_usage() { +cat << EOF +Usage: $0 [--check] + Configure TensorFlow's canonical view of Cuda libraries using cuda.config. +Arguments: + --check: Only check that the proper Cuda dependencies has already been + properly configured in the source tree. It also creates symbolic links to + the files in the gen-tree to make bazel happy. +EOF +} + +CHECK_ONLY=0 +# Parse the arguments. Add more arguments as the "case" line when needed. +while [[ $# > 0 ]]; do + argument="$1" + shift + case $argument in + --check) + CHECK_ONLY=1 + ;; + *) + echo "Error: unknown arguments" + print_usage + exit -1 + ;; + esac +done + +source cuda.config || exit -1 + +OUTPUTDIR=${OUTPUTDIR:-../../..} +CUDA_TOOLKIT_PATH=${CUDA_TOOLKIT_PATH:-/usr/local/cuda} +CUDNN_INSTALL_PATH=${CUDNN_INSTALL_PATH:-/usr/local/cuda} + +# An error message when the Cuda toolkit is not found +function CudaError { + echo ERROR: $1 +cat << EOF +############################################################################## +############################################################################## +Cuda 7.0 toolkit is missing. +1. Download and install the CUDA 7.0 toolkit and CUDNN 6.5 library; +2. Run configure from the root of the source tree, before rerunning bazel; +Please refer to README.md for more details. +############################################################################## +############################################################################## +EOF + exit -1 +} + +# An error message when CUDNN is not found +function CudnnError { + echo ERROR: $1 +cat << EOF +############################################################################## +############################################################################## +Cudnn 6.5 is missing. +1. Download and install the CUDA 7.0 toolkit and CUDNN 6.5 library; +2. Run configure from the root of the source tree, before rerunning bazel; +Please refer to README.md for more details. +############################################################################## +############################################################################## +EOF + exit -1 +} + +# Check that Cuda libraries has already been properly configured in the source tree. +# We still need to create links to the gen-tree to make bazel happy. +function CheckAndLinkToSrcTree { + ERROR_FUNC=$1 + FILE=$2 + if test ! -e $FILE; then + $ERROR_FUNC "$PWD/$FILE cannot be found" + fi + + # Link the output file to the source tree, avoiding self links if they are + # the same. This could happen if invoked from the source tree by accident. + if [ ! `readlink -f $PWD` == `readlink -f $OUTPUTDIR/third_party/gpus/cuda` ]; then + mkdir -p `dirname $OUTPUTDIR/third_party/gpus/cuda/$FILE` + ln -sf $PWD/$FILE $OUTPUTDIR/third_party/gpus/cuda/$FILE + fi +} + +if [ "$CHECK_ONLY" == "1" ]; then + CheckAndLinkToSrcTree CudaError include/cuda.h + CheckAndLinkToSrcTree CudaError include/cublas.h + CheckAndLinkToSrcTree CudnnError include/cudnn.h + CheckAndLinkToSrcTree CudaError lib64/libcudart_static.a + CheckAndLinkToSrcTree CudaError lib64/libcublas.so.7.0 + CheckAndLinkToSrcTree CudnnError lib64/libcudnn.so.6.5 + CheckAndLinkToSrcTree CudaError lib64/libcudart.so.7.0 + exit 0 +fi + +# Actually configure the source tree for TensorFlow's canonical view of Cuda +# libraries. + +if test ! -e ${CUDA_TOOLKIT_PATH}/lib64/libcudart.so.7.0; then + CudaError "cannot find ${CUDA_TOOLKIT_PATH}/lib64/libcudart.so.7.0" +fi + +if test ! -d ${CUDNN_INSTALL_PATH}; then + CudnnError "cannot find dir: ${CUDNN_INSTALL_PATH}" +fi + +# Locate cudnn.h +if test -e ${CUDNN_INSTALL_PATH}/cudnn.h; then + CUDNN_HEADER_PATH=${CUDNN_INSTALL_PATH} +elif test -e ${CUDNN_INSTALL_PATH}/include/cudnn.h; then + CUDNN_HEADER_PATH=${CUDNN_INSTALL_PATH}/include +else + CudnnError "cannot find cudnn.h under: ${CUDNN_INSTALL_PATH}" +fi + +# Locate libcudnn.so.6.5 +if test -e ${CUDNN_INSTALL_PATH}/libcudnn.so.6.5; then + CUDNN_LIB_PATH=${CUDNN_INSTALL_PATH} +elif test -e ${CUDNN_INSTALL_PATH}/lib64/libcudnn.so.6.5; then + CUDNN_LIB_PATH=${CUDNN_INSTALL_PATH}/lib64 +else + CudnnError "cannot find libcudnn.so.6.5 under: ${CUDNN_INSTALL_PATH}" +fi + +# Helper function to build symbolic links for all files under a directory. +function LinkOneDir { + SRC_PREFIX=$1 + DST_PREFIX=$2 + SRC_DIR=$3 + DST_DIR=`echo $SRC_DIR | sed "s,^$SRC_PREFIX,$DST_PREFIX,"` + mkdir -p $DST_DIR + FILE_LIST=`find -L $SRC_DIR -maxdepth 1 -type f` + if test "$FILE_LIST" != ""; then + ln -sf $FILE_LIST $DST_DIR/ || exit -1 + fi +} +export -f LinkOneDir + +# Build links for all files under the directory, including subdirectoreis. +function LinkAllFiles { + SRC_DIR=$1 + DST_DIR=$2 + find -L $SRC_DIR -type d | xargs -I {} bash -c "LinkOneDir $SRC_DIR $DST_DIR {}" || exit -1 +} + +# Set up the symbolic links for cuda toolkit. We link at individual file level, +# not at the directory level. +# This is because the external library may have different file layout from our desired structure. +mkdir -p $OUTPUTDIR/third_party/gpus/cuda +echo "Setting up Cuda include" +LinkAllFiles ${CUDA_TOOLKIT_PATH}/include $OUTPUTDIR/third_party/gpus/cuda/include || exit -1 +echo "Setting up Cuda lib64" +LinkAllFiles ${CUDA_TOOLKIT_PATH}/lib64 $OUTPUTDIR/third_party/gpus/cuda/lib64 || exit -1 +echo "Setting up Cuda bin" +LinkAllFiles ${CUDA_TOOLKIT_PATH}/bin $OUTPUTDIR/third_party/gpus/cuda/bin || exit -1 +echo "Setting up Cuda nvvm" +LinkAllFiles ${CUDA_TOOLKIT_PATH}/nvvm $OUTPUTDIR/third_party/gpus/cuda/nvvm || exit -1 + +# Set up symbolic link for cudnn +ln -sf $CUDNN_HEADER_PATH/cudnn.h $OUTPUTDIR/third_party/gpus/cuda/include/cudnn.h || exit -1 +ln -sf $CUDNN_LIB_PATH/libcudnn.so.6.5 $OUTPUTDIR/third_party/gpus/cuda/lib64/libcudnn.so.6.5 || exit -1 |