From 54b6afa675a248ca46897acf47f9bf8cf06f047d Mon Sep 17 00:00:00 2001 From: Beau Johnston Date: Sun, 10 Jun 2018 07:42:50 +1000 Subject: [PATCH] added cuda compiler --- mesonbuild/compilers/__init__.py | 2 + mesonbuild/compilers/compilers.py | 11 +- mesonbuild/compilers/cuda.py | 188 +++++++++++++++++++++++++++ mesonbuild/environment.py | 44 ++++++- test cases/cuda/1 simple/meson.build | 5 + test cases/cuda/1 simple/prog.cu | 13 ++ 6 files changed, 261 insertions(+), 2 deletions(-) create mode 100644 mesonbuild/compilers/cuda.py create mode 100644 test cases/cuda/1 simple/meson.build create mode 100644 test cases/cuda/1 simple/prog.cu diff --git a/mesonbuild/compilers/__init__.py b/mesonbuild/compilers/__init__.py index c568a9862..60cca93c2 100644 --- a/mesonbuild/compilers/__init__.py +++ b/mesonbuild/compilers/__init__.py @@ -72,6 +72,7 @@ __all__ = [ 'JavaCompiler', 'LLVMDCompiler', 'MonoCompiler', + 'NvidiaCudaCompiler', 'VisualStudioCsCompiler', 'NAGFortranCompiler', 'ObjCCompiler', @@ -153,6 +154,7 @@ from .d import ( GnuDCompiler, LLVMDCompiler, ) +from .cuda import CudaCompiler from .fortran import ( FortranCompiler, G95FortranCompiler, diff --git a/mesonbuild/compilers/compilers.py b/mesonbuild/compilers/compilers.py index 016e704ad..b2dc213c3 100644 --- a/mesonbuild/compilers/compilers.py +++ b/mesonbuild/compilers/compilers.py @@ -37,6 +37,7 @@ lib_suffixes = ('a', 'lib', 'dll', 'dylib', 'so') lang_suffixes = { 'c': ('c',), 'cpp': ('cpp', 'cc', 'cxx', 'c++', 'hh', 'hpp', 'ipp', 'hxx'), + 'cuda': ('cu',), # f90, f95, f03, f08 are for free-form fortran ('f90' recommended) # f, for, ftn, fpp are for fixed-form fortran ('f' or 'for' recommended) 'fortran': ('f90', 'f95', 'f03', 'f08', 'f', 'for', 'ftn', 'fpp'), @@ -58,7 +59,7 @@ clib_langs = ('objcpp', 'cpp', 'objc', 'c', 'fortran',) # List of languages that can be linked with C code directly by the linker # used in build.py:process_compilers() and build.py:get_dynamic_linker() # XXX: Add Rust to this? -clink_langs = ('d',) + clib_langs +clink_langs = ('d', 'cuda') + clib_langs clink_suffixes = () for _l in clink_langs + ('vala',): clink_suffixes += lang_suffixes[_l] @@ -69,6 +70,7 @@ soregex = re.compile(r'.*\.so(\.[0-9]+)?(\.[0-9]+)?(\.[0-9]+)?$') # Environment variables that each lang uses. cflags_mapping = {'c': 'CFLAGS', 'cpp': 'CXXFLAGS', + 'cuda': 'CUFLAGS', 'objc': 'OBJCFLAGS', 'objcpp': 'OBJCXXFLAGS', 'fortran': 'FFLAGS', @@ -143,6 +145,13 @@ armclang_buildtype_args = {'plain': [], 'custom': [], } +cuda_buildtype_args = {'plain': [], + 'debug': ['-O0', '-g'], + 'debugoptimized': ['-O1', '--debug'], + 'release': ['-O3', '-Otime'], + 'minsize': ['-O3', '-Ospace'], + } + arm_buildtype_args = {'plain': [], 'debug': ['-O0', '--debug'], 'debugoptimized': ['-O1', '--debug'], diff --git a/mesonbuild/compilers/cuda.py b/mesonbuild/compilers/cuda.py new file mode 100644 index 000000000..f398bad81 --- /dev/null +++ b/mesonbuild/compilers/cuda.py @@ -0,0 +1,188 @@ +# Copyright 2012-2017 The Meson development team + +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at + +# http://www.apache.org/licenses/LICENSE-2.0 + +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +import subprocess, os.path + +from .. import mlog +from ..mesonlib import EnvironmentException, Popen_safe +from .compilers import Compiler, cuda_buildtype_args + +class CudaCompiler(Compiler): + def __init__(self, exelist, version, is_cross, exe_wrapper=None): + # If a child ObjCPP class has already set it, don't set it ourselves + if not hasattr(self, 'language'): + self.language = 'cuda' + super().__init__(exelist, version) + self.is_cross = is_cross + self.exe_wrapper = exe_wrapper + self.id = 'nvcc' + default_warn_args = [] + self.warn_args = {'1': default_warn_args, + '2': default_warn_args + ['-Wextra'], + '3': default_warn_args + ['-Wextra', '-Wpedantic']} + + def needs_static_linker(self): + return False + + def get_display_language(self): + return 'Cuda' + + def get_no_stdinc_args(self): + return [''] + + def sanity_check(self, work_dir, environment): + source_name = os.path.join(work_dir, 'sanitycheckcuda.cu') + binary_name = os.path.join(work_dir, 'sanitycheckcuda') + extra_flags = self.get_cross_extra_flags(environment, link=False) + if self.is_cross: + extra_flags += self.get_compile_only_args() + + code = ''' + #include + int main(int argc,char** argv){ + return 0; + } + ''' + + with open(source_name, 'w') as ofile: + ofile.write(code) + pc = subprocess.Popen(self.exelist + extra_flags + [source_name, '-o', binary_name]) + pc.wait() + if pc.returncode != 0: + raise EnvironmentException('Cuda compiler %s can not compile programs.' % self.name_string()) + if self.is_cross: + # Can't check if the binaries run so we have to assume they do + return + pe = subprocess.Popen(binary_name) + pe.wait() + if pe.returncode != 0: + raise EnvironmentException('Executables created by ObjC compiler %s are not runnable.' % self.name_string()) + + def get_compiler_check_args(self): + return super().get_compiler_check_args() + [] + + def has_header_symbol(self, hname, symbol, prefix, env, extra_args=None, dependencies=None): + if super().has_header_symbol(hname, symbol, prefix, env, extra_args, dependencies): + return True + if extra_args is None: + extra_args = [] + fargs = {'prefix': prefix, 'header': hname, 'symbol': symbol} + t = '''{prefix} + #include <{header}> + using {symbol}; + int main () {{ return 0; }}''' + return self.compiles(t.format(**fargs), env, extra_args, dependencies) + + def sanity_check_impl(self, work_dir, environment, sname, code): + mlog.debug('Sanity testing ' + self.get_display_language() + ' compiler:', ' '.join(self.exelist)) + mlog.debug('Is cross compiler: %s.' % str(self.is_cross)) + + extra_flags = [] + source_name = os.path.join(work_dir, sname) + binname = sname.rsplit('.', 1)[0] + if self.is_cross: + binname += '_cross' + if self.exe_wrapper is None: + # Linking cross built apps is painful. You can't really + # tell if you should use -nostdlib or not and for example + # on OSX the compiler binary is the same but you need + # a ton of compiler flags to differentiate between + # arm and x86_64. So just compile. + extra_flags += self.get_cross_extra_flags(environment, link=False) + extra_flags += self.get_compile_only_args() + else: + extra_flags += self.get_cross_extra_flags(environment, link=True) + # Is a valid executable output for all toolchains and platforms + binname += '.exe' + # Write binary check source + binary_name = os.path.join(work_dir, binname) + with open(source_name, 'w') as ofile: + ofile.write(code) + # Compile sanity check + cmdlist = self.exelist + extra_flags + [source_name] + self.get_output_args(binary_name) + pc, stdo, stde = Popen_safe(cmdlist, cwd=work_dir) + mlog.debug('Sanity check compiler command line:', ' '.join(cmdlist)) + mlog.debug('Sanity check compile stdout:') + mlog.debug(stdo) + mlog.debug('-----\nSanity check compile stderr:') + mlog.debug(stde) + mlog.debug('-----') + if pc.returncode != 0: + raise EnvironmentException('Compiler {0} can not compile programs.'.format(self.name_string())) + # Run sanity check + if self.is_cross: + if self.exe_wrapper is None: + # Can't check if the binaries run so we have to assume they do + return + cmdlist = self.exe_wrapper + [binary_name] + else: + cmdlist = [binary_name] + mlog.debug('Running test binary command: ' + ' '.join(cmdlist)) + pe = subprocess.Popen(cmdlist) + pe.wait() + if pe.returncode != 0: + raise EnvironmentException('Executables created by {0} compiler {1} are not runnable.'.format(self.language, self.name_string())) + + def get_output_args(self, target): + return ['-o', target] + + def name_string(self): + return ' '.join(self.exelist) + + def get_dependency_gen_args(self, outtarget, outfile): + return [] + + def get_compile_only_args(self): + return ['-c'] + + def get_no_optimization_args(self): + return ['-O0'] + + def get_linker_exelist(self): + return self.exelist[:] + + def get_linker_output_args(self, outputname): + return ['-o', outputname] + + def get_warn_args(self, level): + return self.warn_args[level] + + def get_buildtype_args(self, buildtype): + return cuda_buildtype_args[buildtype] + + def get_include_args(self, path, is_system): + if path == '': + path = '.' + return ['-I' + path] + + def depfile_for_object(self, objfile): + return objfile + '.' + self.get_depfile_suffix() + + def get_depfile_suffix(self): + return 'd' + + def get_buildtype_linker_args(self, buildtype): + return [] + + def get_std_exe_link_args(self): + return [] + + def build_rpath_args(self, build_dir, from_dir, rpath_paths, build_rpath, install_rpath): + return [] + + def get_linker_search_args(self, dirname): + return ['/LIBPATH:' + dirname] + + def linker_to_compiler_args(self, args): + return ['/link'] + args diff --git a/mesonbuild/environment.py b/mesonbuild/environment.py index 0809ac5f7..87d221d87 100644 --- a/mesonbuild/environment.py +++ b/mesonbuild/environment.py @@ -59,6 +59,7 @@ from .compilers import ( IntelFortranCompiler, JavaCompiler, MonoCompiler, + CudaCompiler, VisualStudioCsCompiler, NAGFortranCompiler, Open64FortranCompiler, @@ -99,6 +100,17 @@ known_cpu_families = ( 'x86_64' ) +# Environment variables that each lang uses. +cflags_mapping = {'c': 'CFLAGS', + 'cpp': 'CXXFLAGS', + 'cu': 'CUFLAGS', + 'objc': 'OBJCFLAGS', + 'objcpp': 'OBJCXXFLAGS', + 'fortran': 'FFLAGS', + 'd': 'DFLAGS', + 'vala': 'VALAFLAGS'} + + def detect_gcovr(version='3.1', log=False): gcovr_exe = 'gcovr' try: @@ -410,6 +422,7 @@ class Environment: self.default_d = ['ldc2', 'ldc', 'gdc', 'dmd'] self.default_fortran = ['gfortran', 'g95', 'f95', 'f90', 'f77', 'ifort', 'pgfortran'] self.default_java = ['javac'] + self.default_cuda = ['nvcc'] self.default_rust = ['rustc'] self.default_swift = ['swiftc'] self.default_vala = ['valac'] @@ -417,6 +430,7 @@ class Environment: self.default_strip = ['strip'] self.vs_static_linker = ['lib'] self.clang_cl_static_linker = ['llvm-lib'] + self.cuda_static_linker = ['nvlink'] self.gcc_static_linker = ['gcc-ar'] self.clang_static_linker = ['llvm-ar'] self.default_pkgconfig = ['pkg-config'] @@ -737,6 +751,25 @@ class Environment: def detect_cpp_compiler(self, want_cross): return self._detect_c_or_cpp_compiler('cpp', want_cross) + def detect_cuda_compiler(self, want_cross): + popen_exceptions = {} + compilers, ccache, is_cross, exe_wrap = self._get_compilers('cuda', 'Cuda', want_cross) + for compiler in compilers: + if isinstance(compiler, str): + compiler = [compiler] + else: + raise EnvironmentException() + arg = '--version' + try: + p, out, err = Popen_safe(compiler + [arg]) + except OSError as e: + popen_exceptions[' '.join(compiler + [arg])] = e + continue + version = search_version(out) + cls = CudaCompiler + return cls(ccache + compiler, version, is_cross, exe_wrap) + raise EnvironmentException('Could not find suitable CUDA compiler: "' + ' '.join(compilers) + '"') + def detect_fortran_compiler(self, want_cross): popen_exceptions = {} compilers, ccache, is_cross, exe_wrap = self._get_compilers('fortran', want_cross) @@ -999,6 +1032,10 @@ class Environment: comp = self.detect_objc_compiler(False) if need_cross_compiler: cross_comp = self.detect_objc_compiler(True) + elif lang == 'cuda': + comp = self.environment.detect_cuda_compiler(False) + if need_cross_compiler: + cross_comp = self.environment.detect_cuda_compiler(True) elif lang == 'objcpp': comp = self.detect_objcpp_compiler(False) if need_cross_compiler: @@ -1057,7 +1094,12 @@ class Environment: if linker is not None: linkers = [linker] else: - if isinstance(compiler, compilers.VisualStudioCCompiler): + evar = 'AR' + if isinstance(compiler, compilers.CudaCompiler): + linkers = [self.cuda_static_linker, self.default_static_linker] + elif evar in os.environ: + linkers = [shlex.split(os.environ[evar])] + elif isinstance(compiler, compilers.VisualStudioCCompiler): linkers = [self.vs_static_linker, self.clang_cl_static_linker] elif isinstance(compiler, compilers.GnuCompiler): # Use gcc-ar if available; needed for LTO diff --git a/test cases/cuda/1 simple/meson.build b/test cases/cuda/1 simple/meson.build new file mode 100644 index 000000000..19af734af --- /dev/null +++ b/test cases/cuda/1 simple/meson.build @@ -0,0 +1,5 @@ +project('simple', 'cuda', version : '1.0.0') + +exe = executable('prog', 'prog.cu') +test('cudatest', exe) + diff --git a/test cases/cuda/1 simple/prog.cu b/test cases/cuda/1 simple/prog.cu new file mode 100644 index 000000000..ed21152af --- /dev/null +++ b/test cases/cuda/1 simple/prog.cu @@ -0,0 +1,13 @@ +#include +#include + +__global__ void kernel (void){ + +} + +int main( void ) { + kernel<<<1,1>>>(); + printf( "Hello, World!\n" ); + return 0; +} +