123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259 |
- import itertools
- import os
- import os.path
- import sys
- import subprocess
- import optparse
- import process_command_files as pcf
- from process_whole_archive_option import ProcessWholeArchiveOption
def get_leaks_suppressions(cmd):
    """Split a command line into suppression files and everything else.

    Arguments ending in ``.supp`` go to the first list, all other arguments
    to the second one; relative order is preserved in both.

    ``cmd`` is consumed in a single pass, so any iterable (including a
    one-shot iterator) is accepted.

    Returns a ``(suppressions, remaining_cmd)`` pair of lists.
    """
    suppressions, remaining = [], []
    for item in cmd:
        bucket = suppressions if item.endswith(".supp") else remaining
        bucket.append(item)
    return suppressions, remaining
# Library flags that fix_cmd_for_musl() removes from the command line.
MUSL_LIBS = '-lc', '-lcrypt', '-ldl', '-lm', '-lpthread', '-lrt', '-lutil'

# Maps a static CUDA library flag to the flag that replaces it when
# fix_cmd_for_dynamic_cuda() rewrites the command line.  The keys are also
# the set of libraries prune_cuda_libraries() considers for pruning
# (except '-lcudart_static', which that function excludes explicitly).
# An empty value means no replacement flag is listed for that library.
CUDA_LIBRARIES = {
    '-lcublas_static': '-lcublas',
    '-lcublasLt_static': '-lcublasLt',
    '-lcudart_static': '-lcudart',
    '-lcudnn_static': '-lcudnn',
    '-lcufft_static_nocallback': '-lcufft',
    '-lcurand_static': '-lcurand',
    '-lcusolver_static': '-lcusolver',
    '-lcusparse_static': '-lcusparse',
    '-lmyelin_compiler_static': '-lmyelin',
    # NOTE(review): unlike the other entries, the replacement name does not
    # mirror the static library name -- confirm this mapping is intended.
    '-lmyelin_executor_static': '-lnvcaffe_parser',
    '-lmyelin_pattern_library_static': '',
    '-lmyelin_pattern_runtime_static': '',
    '-lnvinfer_static': '-lnvinfer',
    '-lnvinfer_plugin_static': '-lnvinfer_plugin',
    '-lnvonnxparser_static': '-lnvonnxparser',
    '-lnvparsers_static': '-lnvparsers',
}
def prune_cuda_libraries(cmd, prune_arches, nvprune_exe, build_root):
    """Replace static CUDA libraries in ``cmd`` with arch-pruned copies.

    Every flag listed in ``CUDA_LIBRARIES`` (except ``-lcudart_static``) is
    renamed to ``<flag>_pruned``.  For each ``-L<dir>`` that precedes such a
    flag and contains the matching ``lib*.a`` archive, ``nvprune_exe`` is run
    to write ``lib*_pruned.a`` into a fresh ``cuda_pruned_libs_<n>`` directory
    under ``build_root``; that directory is added as an extra ``-L`` right
    after the original one.

    Args:
        cmd: linker command as a list of arguments.
        prune_arches: ``:``-separated architectures, e.g. ``"sm_52:sm_70"``.
        nvprune_exe: path to the ``nvprune`` executable.
        build_root: directory under which the pruned-library dirs are created.

    Returns:
        A new list with the rewritten command.

    Raises:
        AssertionError: a CUDA library flag had no archive in any preceding
            ``-L`` directory.
        subprocess.CalledProcessError: ``nvprune_exe`` exited with an error.
        OSError: the output directory could not be created (e.g. it exists).
    """
    def compute_arch(arch):
        # 'sm_52' -> 'compute_52': keep everything after the first underscore
        _, ver = arch.split('_', 1)
        return 'compute_{}'.format(ver)

    # cudart does not contain device code, nothing to prune
    libs_to_prune = set(CUDA_LIBRARIES) - {'-lcudart_static'}

    arch_args = []
    for arch in prune_arches.split(':'):
        arch_args += ['-gencode', 'arch={},code={}'.format(compute_arch(arch), arch)]

    dir_indices = itertools.count()
    flags = []
    # archive file names still waiting for a -L directory that provides them
    cuda_deps = set()

    # Walk the command backwards so that each library flag is seen before
    # the -L directories that precede it on the command line.
    for flag in reversed(cmd):
        if flag in libs_to_prune:
            cuda_deps.add('lib' + flag[2:] + '.a')
            flag += '_pruned'
        elif cuda_deps and flag.startswith('-L') and os.path.isdir(flag[2:]):
            from_dirpath = flag[2:]
            # list the directory once; sort for a reproducible pruning order
            from_deps = sorted(cuda_deps.intersection(os.listdir(from_dirpath)))

            if from_deps:
                to_dirpath = os.path.abspath(
                    os.path.join(build_root, 'cuda_pruned_libs_{}'.format(next(dir_indices)))
                )
                os.makedirs(to_dirpath)

                for lib_name in from_deps:
                    from_path = os.path.join(from_dirpath, lib_name)
                    # 'libfoo.a' -> 'libfoo_pruned.a'
                    to_path = os.path.join(to_dirpath, lib_name[:-2] + '_pruned.a')
                    subprocess.check_call([nvprune_exe] + arch_args + ['--output-file', to_path, from_path])
                    cuda_deps.remove(lib_name)

                # do not remove current directory
                # because it can contain other libraries we want link to
                # instead we just add new directory with pruned libs
                flags.append('-L' + to_dirpath)

        flags.append(flag)

    # Explicit raise (rather than `assert`) so the check survives `python -O`;
    # the exception type is kept for compatibility.
    if cuda_deps:
        raise AssertionError('Unresolved CUDA deps: ' + ','.join(sorted(cuda_deps)))

    # Return a real list: a one-shot `reversed` iterator cannot be indexed,
    # concatenated or iterated twice by later processing steps.
    flags.reverse()
    return flags
def remove_excessive_flags(cmd):
    """Return ``cmd`` without arguments ending in ``.ios.interface`` or ``.pkg.fake``.

    The order of the remaining arguments is preserved; a new list is returned.
    """
    excessive_suffixes = ('.ios.interface', '.pkg.fake')
    return [arg for arg in cmd if not arg.endswith(excessive_suffixes)]
def fix_sanitize_flag(cmd, opts):
    """
    Drop ``-fsanitize=<kind>`` flags whose runtime is linked explicitly.

    If any ``--target...`` argument does not mention ``linux`` the command is
    returned untouched (the toolchain's own sanitizer libraries are used).
    Otherwise:

    * a ``-fsanitize=address|memory|leak|undefined|thread`` flag is removed
      when some argument starts with the matching
      ``contrib/libs/clang<ver>-rt/lib/<runtime>`` path;
    * every ``-fsanitize-coverage=...`` flag is preceded by
      ``-fno-sanitize-link-runtime``;
    * arguments that start with one of those runtime paths are pulled out of
      their position and re-inserted, wrapped in
      ``-Wl,--whole-archive`` / ``-Wl,--no-whole-archive``, right before each
      ``-Wl,--start-group``.

    ``opts.clang_ver`` must be set when the rewrite is performed.
    """
    if any(arg.startswith('--target') and 'linux' not in arg.lower() for arg in cmd):
        # use toolchained sanitize libraries
        return cmd

    assert opts.clang_ver
    rt_root = 'contrib/libs/clang' + opts.clang_ver + '-rt/lib/'
    runtime_by_flag = {
        '-fsanitize=address': rt_root + 'asan',
        '-fsanitize=memory': rt_root + 'msan',
        '-fsanitize=leak': rt_root + 'lsan',
        '-fsanitize=undefined': rt_root + 'ubsan',
        '-fsanitize=thread': rt_root + 'tsan',
    }
    runtime_prefixes = tuple(runtime_by_flag.values())

    explicit_runtimes = []
    remaining = []
    for arg in cmd:
        if arg.startswith('-fsanitize-coverage='):
            # do not link sanitizer libraries from clang
            remaining.append('-fno-sanitize-link-runtime')

        runtime = runtime_by_flag.get(arg)
        if runtime is not None and any(other.startswith(runtime) for other in cmd):
            # the matching runtime is linked explicitly: drop '-fsanitize='
            continue

        if arg.startswith(runtime_prefixes):
            explicit_runtimes.append(arg)
            continue

        remaining.append(arg)

    # Move sanitize libraries out of the repeatedly searched group of archives.
    # NOTE(review): when the command has no '-Wl,--start-group' the collected
    # runtime archives are not re-inserted anywhere.
    whole_archive_block = ['-Wl,--whole-archive'] + explicit_runtimes + ['-Wl,--no-whole-archive']
    result = []
    for arg in remaining:
        if arg == '-Wl,--start-group':
            result.extend(whole_archive_block)
        result.append(arg)

    return result
def fix_cmd_for_musl(cmd):
    """Return a copy of ``cmd`` without the library flags listed in ``MUSL_LIBS``."""
    return [arg for arg in cmd if arg not in MUSL_LIBS]
def fix_cmd_for_dynamic_cuda(cmd):
    """Swap static CUDA library flags for their dynamic counterparts.

    Each argument that is a key of ``CUDA_LIBRARIES`` is replaced by the
    mapped value.  When the mapped value is empty the argument is dropped
    instead of being replaced by an empty string, which would otherwise be
    passed on as an empty command-line argument.  All other arguments are
    kept as they are, in order.

    Returns a new list.
    """
    flags = []
    for flag in cmd:
        if flag not in CUDA_LIBRARIES:
            flags.append(flag)
            continue
        dynamic_flag = CUDA_LIBRARIES[flag]
        # empty mapping: nothing to link in its place, so skip it entirely
        if dynamic_flag:
            flags.append(dynamic_flag)
    return flags
def gen_default_suppressions(inputs, output, source_root):
    """Generate a C++ source file with default sanitizer suppressions.

    Each file in ``inputs`` (path relative to ``source_root``) is read line by
    line; blank lines and lines starting with ``#`` are skipped.  The part of
    the file's base name before the first ``.`` selects the group the lines
    belong to (``lsan.supp`` -> ``lsan``).  For every group one function

        extern "C" const char *__<group>_default_suppressions()

    is written to ``output``; it returns the group's unique lines, sorted and
    joined with ``\\n``.

    Args:
        inputs: iterable of suppression file paths relative to ``source_root``.
        output: path of the C++ file to write.
        source_root: directory the input paths are resolved against.
    """
    import collections

    def c_escape(text):
        # keep the suppression verbatim inside a C string literal
        return text.replace('\\', '\\\\').replace('"', '\\"')

    supp_map = collections.defaultdict(set)
    for filename in inputs:
        sanitizer = os.path.basename(filename).split('.', 1)[0]
        with open(os.path.join(source_root, filename)) as src:
            for line in src:
                line = line.strip()
                if not line or line.startswith('#'):
                    continue
                supp_map[sanitizer].add(line)

    # Text mode: the content is `str`, which cannot be written to a file
    # opened in binary mode on Python 3.
    with open(output, "w") as dst:
        # sorted() keeps the generated file independent of dict ordering
        for supp_type, supps in sorted(supp_map.items()):
            joined = '\\n'.join(c_escape(supp) for supp in sorted(supps))
            dst.write('extern "C" const char *__%s_default_suppressions() {\n' % supp_type)
            dst.write(' return "{}";\n'.format(joined))
            dst.write('}\n')
def fix_blas_resolving(cmd):
    """Drop cblas from the command when Intel MKL is linked as well.

    Intel MKL ships as a precompiled static library, so it cannot be rebuilt
    with sanitizer instrumentation; under sanitizers cblas is preferred as a
    drop-in replacement.  A link that pulls in both MKL and cblas fails with
    duplicate symbols, so when MKL is present we assume a non-sanitizer build
    and remove cblas.

    Returns ``cmd`` itself when no ``contrib/libs...mkl-lp64.a`` argument is
    present, otherwise a new list without arguments ending in
    ``libcontrib-libs-cblas.a``.
    """
    links_mkl = any(
        item.startswith('contrib/libs') and item.endswith('mkl-lp64.a')
        for item in cmd
    )
    if not links_mkl:
        return cmd
    return [item for item in cmd if not item.endswith('libcontrib-libs-cblas.a')]
def parse_args(argv=None):
    """Parse the wrapper's own options and return ``(opts, args)``.

    Option parsing stops at the first positional argument
    (``disable_interspersed_args``), so everything from there on -- the
    actual linker command -- is returned untouched in ``args``.

    Args:
        argv: list of arguments to parse; defaults to ``sys.argv[1:]``.

    Returns:
        ``(opts, args)`` as produced by ``optparse.OptionParser.parse_args``.
    """
    parser = optparse.OptionParser()
    parser.disable_interspersed_args()

    parser.add_option('--musl', action='store_true')
    parser.add_option('--custom-step')
    parser.add_option('--python')
    parser.add_option('--source-root')
    parser.add_option('--clang-ver')
    parser.add_option('--dynamic-cuda', action='store_true')
    parser.add_option(
        '--cuda-architectures',
        help='List of supported CUDA architectures, separated by ":" (e.g. "sm_52:compute_70:lto_90a")',
    )
    parser.add_option('--nvprune-exe')
    parser.add_option('--build-root')
    parser.add_option('--arch')
    parser.add_option('--linker-output')
    parser.add_option('--whole-archive-peers', action='append')
    parser.add_option('--whole-archive-libs', action='append')

    return parser.parse_args(argv)
# Entry point: rewrite the linker command passed after the wrapper options
# and run it, exiting with the linker's return code.
if __name__ == '__main__':
    opts, args = parse_args()
    args = pcf.skip_markers(args)

    cmd = fix_blas_resolving(args)
    cmd = remove_excessive_flags(cmd)
    if opts.musl:
        cmd = fix_cmd_for_musl(cmd)

    cmd = fix_sanitize_flag(cmd, opts)

    # The checks below are substring matches over the printed argument list.
    cmd_text = str(cmd)
    if 'ld.lld' in cmd_text and '-fPIE' not in cmd_text and '-fPIC' not in cmd_text:
        # no explicit PIE/PIC requested: link a non-PIE executable
        cmd.append('-Wl,-no-pie')

    if opts.dynamic_cuda:
        cmd = fix_cmd_for_dynamic_cuda(cmd)
    elif opts.cuda_architectures:
        cmd = prune_cuda_libraries(cmd, opts.cuda_architectures, opts.nvprune_exe, opts.build_root)
    cmd = ProcessWholeArchiveOption(opts.arch, opts.whole_archive_peers, opts.whole_archive_libs).construct_cmd(cmd)

    if opts.custom_step:
        assert opts.python
        # the custom step receives the original arguments (after marker
        # skipping), not the rewritten command
        subprocess.check_call([opts.python] + [opts.custom_step] + args)

    supp, cmd = get_leaks_suppressions(cmd)
    if supp:
        # compile the collected suppressions into the binary
        src_file = "default_suppressions.cpp"
        gen_default_suppressions(supp, src_file, opts.source_root)
        cmd += [src_file]

    if opts.linker_output:
        # close the redirect target deterministically once the linker is done
        with open(opts.linker_output, 'w') as stdout:
            rc = subprocess.call(cmd, shell=False, stderr=sys.stderr, stdout=stdout)
    else:
        rc = subprocess.call(cmd, shell=False, stderr=sys.stderr, stdout=sys.stdout)

    sys.exit(rc)
|