commit
379b42c5b1
15 changed files with 375 additions and 2 deletions
@ -0,0 +1,7 @@ |
|||||||
|
## Cuda support |
||||||
|
|
||||||
|
Compiling CUDA source code is now supported, though only with the
Ninja backend. So far this has been tested only on Linux.
||||||
|
|
||||||
|
Because NVIDIA's CUDA compiler does not produce `.d` dependency files,
dependency tracking does not work: changing a header that a CUDA source
includes will not by itself trigger a rebuild of that source.
@ -0,0 +1,202 @@ |
|||||||
|
# Copyright 2012-2017 The Meson development team |
||||||
|
|
||||||
|
# Licensed under the Apache License, Version 2.0 (the "License"); |
||||||
|
# you may not use this file except in compliance with the License. |
||||||
|
# You may obtain a copy of the License at |
||||||
|
|
||||||
|
# http://www.apache.org/licenses/LICENSE-2.0 |
||||||
|
|
||||||
|
# Unless required by applicable law or agreed to in writing, software |
||||||
|
# distributed under the License is distributed on an "AS IS" BASIS, |
||||||
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
||||||
|
# See the License for the specific language governing permissions and |
||||||
|
# limitations under the License. |
||||||
|
|
||||||
|
import subprocess, os.path |
||||||
|
|
||||||
|
from .. import mlog |
||||||
|
from ..mesonlib import EnvironmentException, Popen_safe |
||||||
|
from .compilers import Compiler, cuda_buildtype_args, cuda_optimization_args, cuda_debug_args |
||||||
|
|
||||||
|
class CudaCompiler(Compiler):
    """Compiler wrapper that drives NVIDIA's ``nvcc`` for the 'cuda' language.

    Most argument getters return plain lists of command line arguments that
    are spliced into the compile or link command. No dependency-generation
    arguments are produced (see ``get_dependency_gen_args``).
    """

    def __init__(self, exelist, version, is_cross, exe_wrapper=None):
        """Store the compiler command line and cross-compilation settings.

        :param exelist: list of strings forming the compiler invocation.
        :param version: compiler version, forwarded to the base class.
        :param is_cross: True when this compiler targets a foreign machine.
        :param exe_wrapper: optional command (list) used to run cross built
            binaries; ``None`` when no wrapper is available.
        """
        # A subclass may already have set its own language; do not override it.
        if not hasattr(self, 'language'):
            self.language = 'cuda'
        super().__init__(exelist, version)
        self.is_cross = is_cross
        self.exe_wrapper = exe_wrapper
        self.id = 'nvcc'
        default_warn_args = []
        # nvcc does not understand GCC-style warning switches itself; they
        # have to be forwarded to the host compiler with -Xcompiler.
        self.warn_args = {'1': default_warn_args,
                          '2': default_warn_args + ['-Xcompiler=-Wextra'],
                          '3': default_warn_args + ['-Xcompiler=-Wextra',
                                                    '-Xcompiler=-Wpedantic']}

    def needs_static_linker(self):
        """Return False: this compiler does not request a static linker."""
        return False

    def get_display_language(self):
        """Return the human readable language name."""
        return 'Cuda'

    def get_no_stdinc_args(self):
        """Return the arguments that disable standard includes (none)."""
        return []

    def sanity_check(self, work_dir, environment):
        """Compile (and, for native builds, run) a trivial Cuda program.

        :param work_dir: directory where the test source and binary are written.
        :param environment: passed through to ``get_cross_extra_flags``.
        :raises EnvironmentException: if compilation fails or the resulting
            native executable exits with a non-zero status.
        """
        source_name = os.path.join(work_dir, 'sanitycheckcuda.cu')
        binary_name = os.path.join(work_dir, 'sanitycheckcuda')
        # Copy the flags so that the list handed out by the helper is never
        # modified by the += below.
        extra_flags = list(self.get_cross_extra_flags(environment, link=False))
        if self.is_cross:
            extra_flags += self.get_compile_only_args()

        code = '''
__global__ void kernel (void) {

}

int main(int argc,char** argv){
    return 0;
}
'''

        with open(source_name, 'w') as ofile:
            ofile.write(code)
        pc = subprocess.Popen(self.exelist + extra_flags + [source_name, '-o', binary_name])
        pc.wait()
        if pc.returncode != 0:
            raise EnvironmentException('Cuda compiler %s can not compile programs.' % self.name_string())
        if self.is_cross:
            # Can't check if the binaries run so we have to assume they do
            return
        pe = subprocess.Popen(binary_name)
        pe.wait()
        if pe.returncode != 0:
            raise EnvironmentException('Executables created by Cuda compiler %s are not runnable.' % self.name_string())

    def get_compiler_check_args(self):
        """Return a copy of the base class check arguments; nothing is added."""
        return super().get_compiler_check_args() + []

    def has_header_symbol(self, hname, symbol, prefix, env, extra_args=None, dependencies=None):
        """Check whether ``symbol`` is made available by header ``hname``.

        The base class check is tried first. If it fails, a second program
        that names the symbol in a ``using`` declaration is compiled.

        :returns: True if either check succeeds.
        """
        if super().has_header_symbol(hname, symbol, prefix, env, extra_args, dependencies):
            return True
        if extra_args is None:
            extra_args = []
        fargs = {'prefix': prefix, 'header': hname, 'symbol': symbol}
        t = '''{prefix}
#include <{header}>
using {symbol};
int main () {{ return 0; }}'''
        return self.compiles(t.format(**fargs), env, extra_args, dependencies)

    def sanity_check_impl(self, work_dir, environment, sname, code):
        """Compile ``code`` as ``sname`` in ``work_dir`` and run the result.

        :param work_dir: directory used for the source and the output binary.
        :param environment: passed through to ``get_cross_extra_flags``.
        :param sname: file name of the test source; its stem names the binary.
        :param code: source text written to ``sname``.
        :raises EnvironmentException: if compilation fails or the produced
            executable exits with a non-zero status.
        """
        mlog.debug('Sanity testing ' + self.get_display_language() + ' compiler:', ' '.join(self.exelist))
        mlog.debug('Is cross compiler: %s.' % str(self.is_cross))

        extra_flags = []
        source_name = os.path.join(work_dir, sname)
        binname = sname.rsplit('.', 1)[0]
        if self.is_cross:
            binname += '_cross'
            if self.exe_wrapper is None:
                # Linking cross built apps is painful. You can't really
                # tell if you should use -nostdlib or not and for example
                # on OSX the compiler binary is the same but you need
                # a ton of compiler flags to differentiate between
                # arm and x86_64. So just compile.
                extra_flags += self.get_cross_extra_flags(environment, link=False)
                extra_flags += self.get_compile_only_args()
            else:
                extra_flags += self.get_cross_extra_flags(environment, link=True)
        # Is a valid executable output for all toolchains and platforms
        binname += '.exe'
        # Write binary check source
        binary_name = os.path.join(work_dir, binname)
        with open(source_name, 'w') as ofile:
            ofile.write(code)
        # Compile sanity check
        cmdlist = self.exelist + extra_flags + [source_name] + self.get_output_args(binary_name)
        pc, stdo, stde = Popen_safe(cmdlist, cwd=work_dir)
        mlog.debug('Sanity check compiler command line:', ' '.join(cmdlist))
        mlog.debug('Sanity check compile stdout:')
        mlog.debug(stdo)
        mlog.debug('-----\nSanity check compile stderr:')
        mlog.debug(stde)
        mlog.debug('-----')
        if pc.returncode != 0:
            raise EnvironmentException('Compiler {0} can not compile programs.'.format(self.name_string()))
        # Run sanity check
        if self.is_cross:
            if self.exe_wrapper is None:
                # Can't check if the binaries run so we have to assume they do
                return
            cmdlist = self.exe_wrapper + [binary_name]
        else:
            cmdlist = [binary_name]
        mlog.debug('Running test binary command: ' + ' '.join(cmdlist))
        pe = subprocess.Popen(cmdlist)
        pe.wait()
        if pe.returncode != 0:
            raise EnvironmentException('Executables created by {0} compiler {1} are not runnable.'.format(self.language, self.name_string()))

    def get_output_args(self, target):
        """Return the arguments that make the compiler write to ``target``."""
        return ['-o', target]

    def name_string(self):
        """Return the compiler command as a single space separated string."""
        return ' '.join(self.exelist)

    def get_dependency_gen_args(self, outtarget, outfile):
        """Return no arguments: dependency files are not generated."""
        return []

    def get_compile_only_args(self):
        """Return the arguments for compiling without linking."""
        return ['-c']

    def get_no_optimization_args(self):
        """Return the arguments that switch optimization off."""
        return ['-O0']

    def get_optimization_args(self, optimization_level):
        """Look up the arguments for ``optimization_level`` in ``cuda_optimization_args``."""
        return cuda_optimization_args[optimization_level]

    def get_debug_args(self, is_debug):
        """Look up the arguments for ``is_debug`` in ``cuda_debug_args``."""
        return cuda_debug_args[is_debug]

    def get_linker_exelist(self):
        """Return a copy of the compiler command; it is also used for linking."""
        return self.exelist[:]

    def get_linker_output_args(self, outputname):
        """Return the arguments that make the linker write to ``outputname``."""
        return ['-o', outputname]

    def get_warn_args(self, level):
        """Return the warning arguments for ``level`` ('1', '2' or '3')."""
        return self.warn_args[level]

    def get_buildtype_args(self, buildtype):
        """Look up the arguments for ``buildtype`` in ``cuda_buildtype_args``."""
        return cuda_buildtype_args[buildtype]

    def get_include_args(self, path, is_system):
        """Return the include argument for ``path``.

        An empty path is treated as the current directory. ``is_system`` is
        accepted for interface compatibility but not used.
        """
        if path == '':
            path = '.'
        return ['-I' + path]

    def depfile_for_object(self, objfile):
        """Return the dependency file name that belongs to ``objfile``."""
        return objfile + '.' + self.get_depfile_suffix()

    def get_depfile_suffix(self):
        """Return the file name suffix used for dependency files."""
        return 'd'

    def get_buildtype_linker_args(self, buildtype):
        """Return the build type specific linker arguments (none)."""
        return []

    def get_std_exe_link_args(self):
        """Return the standard arguments for linking an executable (none)."""
        return []

    def build_rpath_args(self, build_dir, from_dir, rpath_paths, build_rpath, install_rpath):
        """Return the rpath arguments (none are generated)."""
        return []

    def get_linker_search_args(self, dirname):
        """Return the argument that adds ``dirname`` to the library search path.

        nvcc takes library directories with ``-L``; the MSVC style
        ``/LIBPATH:`` form is not an nvcc option.
        """
        return ['-L' + dirname]

    def linker_to_compiler_args(self, args):
        """Return linker arguments in a form suitable for the compiler driver.

        The arguments are passed through unchanged (as a new list). The MSVC
        specific ``/link`` separator must not be added because nvcc would
        treat it as an input file.
        """
        return list(args)

    def get_pic_args(self):
        """Return the arguments for position independent code (none)."""
        return []

    def compute_parameters_with_absolute_paths(self, parameter_list, build_dir):
        """Return ``parameter_list`` with ``-I``/``-L`` paths made absolute.

        Paths attached to ``-I`` and ``-L`` are joined onto ``build_dir`` and
        normalised; an already absolute path is kept by ``os.path.join``.
        All other parameters are passed through untouched. The input list is
        not modified.
        """
        absolute = []
        for param in parameter_list:
            # Only rewrite arguments that actually carry a path after the flag.
            if len(param) > 2 and param[:2] in ('-I', '-L'):
                param = param[:2] + os.path.normpath(os.path.join(build_dir, param[2:]))
            absolute.append(param)
        return absolute
@ -0,0 +1,5 @@ |
|||||||
|
# Smallest possible Cuda project: a single .cu source built into one
# executable, which is then registered as a test.
project('simple', 'cuda', version : '1.0.0')

prog_exe = executable('prog', sources : 'prog.cu')
test('cudatest', prog_exe)
||||||
|
|
@ -0,0 +1,30 @@ |
|||||||
|
#include <iostream> |
||||||
|
|
||||||
|
// Prints the CUDA runtime version and, if at least one device is present,
// a summary of the properties of device 0.
//
// Returns 0 when no usable device is found (so the program still succeeds
// on machines without Cuda hardware) and 1 if the properties of device 0
// cannot be read.
int main(int argc, char **argv) {
    int cuda_devices = 0;
    std::cout << "CUDA version: " << CUDART_VERSION << "\n";
    const cudaError_t count_status = cudaGetDeviceCount(&cuda_devices);
    if(count_status != cudaSuccess) {
        // A failing query (for example no driver or no device) is reported
        // and then handled exactly like "zero devices".
        std::cout << "Could not query Cuda devices: " << cudaGetErrorString(count_status) << "\n";
        cuda_devices = 0;
    }
    if(cuda_devices == 0) {
        std::cout << "No Cuda hardware found. Exiting.\n";
        return 0;
    }
    std::cout << "This computer has " << cuda_devices << " Cuda device(s).\n";
    cudaDeviceProp props;
    const cudaError_t props_status = cudaGetDeviceProperties(&props, 0);
    if(props_status != cudaSuccess) {
        // props is uninitialised at this point; do not print it.
        std::cerr << "Could not read properties of device 0: " << cudaGetErrorString(props_status) << "\n";
        return 1;
    }
    std::cout << "Properties of device 0.\n\n";

    std::cout << " Name: " << props.name << "\n";
    std::cout << " Global memory: " << props.totalGlobalMem << "\n";
    std::cout << " Shared memory: " << props.sharedMemPerBlock << "\n";
    std::cout << " Constant memory: " << props.totalConstMem << "\n";
    std::cout << " Block registers: " << props.regsPerBlock << "\n";

    std::cout << " Warp size: " << props.warpSize << "\n";
    std::cout << " Threads per block: " << props.maxThreadsPerBlock << "\n";
    std::cout << " Max block dimensions: [ " << props.maxThreadsDim[0] << ", " << props.maxThreadsDim[1] << ", " << props.maxThreadsDim[2] << " ]" << "\n";
    std::cout << " Max grid dimensions: [ " << props.maxGridSize[0] << ", " << props.maxGridSize[1] << ", " << props.maxGridSize[2] << " ]" << "\n";
    std::cout << "\n";

    return 0;
}
||||||
|
|
@ -0,0 +1,13 @@ |
|||||||
|
#include <stdio.h> |
||||||
|
#include <iostream> |
||||||
|
|
||||||
|
// Empty kernel; it exists only so that a device launch can be compiled.
__global__ void kernel() {
}

// Launches the empty kernel with one block of one thread, prints a greeting
// and returns 0. The result of the launch is not checked.
int do_cuda_stuff() {
    const dim3 grid_dim(1);
    const dim3 block_dim(1);
    kernel<<<grid_dim, block_dim>>>();

    fputs("Hello, World!\n", stdout);
    return 0;
}
||||||
|
|
@ -0,0 +1,7 @@ |
|||||||
|
#include<iostream> |
||||||
|
|
||||||
|
int do_cuda_stuff(); |
||||||
|
|
||||||
|
int main(int argc, char **argv) { |
||||||
|
return do_cuda_stuff(); |
||||||
|
} |
@ -0,0 +1,7 @@ |
|||||||
|
# Mixes a C++ translation unit with a Cuda one in the same executable,
# then descends into the static library variant of the same test.
project('simple', 'cuda', 'cpp')

split_exe = executable('prog', sources : ['main.cpp', 'lib.cu'])
test('cudatest', split_exe)

subdir('static')
||||||
|
|
@ -0,0 +1,13 @@ |
|||||||
|
#include <stdio.h> |
||||||
|
#include <iostream> |
||||||
|
|
||||||
|
// Empty kernel; it exists only so that a device launch can be compiled.
__global__ void kernel() {
}

// Launches the empty kernel with one block of one thread, prints a greeting
// and returns 0. The result of the launch is not checked.
int do_cuda_stuff() {
    const dim3 grid_dim(1);
    const dim3 block_dim(1);
    kernel<<<grid_dim, block_dim>>>();

    fputs("Hello, World!\n", stdout);
    return 0;
}
||||||
|
|
@ -0,0 +1,13 @@ |
|||||||
|
#include <stdio.h> |
||||||
|
#include <iostream> |
||||||
|
|
||||||
|
// Empty kernel; it exists only so that a device launch can be compiled.
__global__ void kernel() {
}

// Launches the empty kernel with one block of one thread, prints a greeting
// and returns 0. The result of the launch is not checked.
int do_cuda_stuff() {
    const dim3 grid_dim(1);
    const dim3 block_dim(1);
    kernel<<<grid_dim, block_dim>>>();

    fputs("Hello, World!\n", stdout);
    return 0;
}
||||||
|
|
@ -0,0 +1,7 @@ |
|||||||
|
#include<iostream> |
||||||
|
|
||||||
|
int do_cuda_stuff(); |
||||||
|
|
||||||
|
int main(int argc, char **argv) { |
||||||
|
return do_cuda_stuff(); |
||||||
|
} |
@ -0,0 +1,4 @@ |
|||||||
|
# Build the Cuda source into a static library and link a plain C++
# executable against it.
cuda_lib = static_library('clib', 'lib.cu')
static_exe = executable('staexe', 'main_static.cpp', link_with : cuda_lib)
test('static Cuda test', static_exe)
Loading…
Reference in new issue