commit
379b42c5b1
15 changed files with 375 additions and 2 deletions
@ -0,0 +1,7 @@ |
||||
## Cuda support |
||||
|
||||
Compiling CUDA source code is now supported, though only with the
Ninja backend. So far this has been tested only on Linux.
||||
|
||||
Because NVIDIA's CUDA compiler does not produce `.d` dependency files,
dependency tracking does not work.
@ -0,0 +1,202 @@ |
||||
# Copyright 2012-2017 The Meson development team |
||||
|
||||
# Licensed under the Apache License, Version 2.0 (the "License"); |
||||
# you may not use this file except in compliance with the License. |
||||
# You may obtain a copy of the License at |
||||
|
||||
# http://www.apache.org/licenses/LICENSE-2.0 |
||||
|
||||
# Unless required by applicable law or agreed to in writing, software |
||||
# distributed under the License is distributed on an "AS IS" BASIS, |
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
||||
# See the License for the specific language governing permissions and |
||||
# limitations under the License. |
||||
|
||||
import subprocess, os.path |
||||
|
||||
from .. import mlog |
||||
from ..mesonlib import EnvironmentException, Popen_safe |
||||
from .compilers import Compiler, cuda_buildtype_args, cuda_optimization_args, cuda_debug_args |
||||
|
||||
class CudaCompiler(Compiler):
    """Compiler wrapper that drives NVIDIA's ``nvcc`` for CUDA sources.

    The same executable list is used for compiling and for linking (see
    ``get_linker_exelist``), so no separate static or dynamic linker is
    configured here.
    """

    def __init__(self, exelist, version, is_cross, exe_wrapper=None):
        """Store the compiler command line and cross-compilation settings.

        :param exelist: command (list of strings) that invokes the compiler.
        :param version: compiler version, forwarded to the base class.
        :param is_cross: whether this compiler is used for cross builds.
        :param exe_wrapper: optional command prefix (a list) used to run
            cross-built binaries; ``None`` when no wrapper is available.
        """
        # A subclass may already have set a more specific language name.
        if not hasattr(self, 'language'):
            self.language = 'cuda'
        super().__init__(exelist, version)
        self.is_cross = is_cross
        self.exe_wrapper = exe_wrapper
        self.id = 'nvcc'
        default_warn_args = []
        # -Wextra and -Wpedantic are host-compiler options, not nvcc options,
        # so they have to be forwarded to the host compiler with -Xcompiler.
        self.warn_args = {'1': default_warn_args,
                          '2': default_warn_args + ['-Xcompiler=-Wextra'],
                          '3': default_warn_args + ['-Xcompiler=-Wextra',
                                                    '-Xcompiler=-Wpedantic']}

    def needs_static_linker(self):
        """Return False: this compiler does not request a static linker."""
        return False

    def get_display_language(self):
        """Return the human-readable language name used in messages."""
        return 'Cuda'

    def get_no_stdinc_args(self):
        """Return the (empty) argument list for disabling standard includes."""
        return []

    def sanity_check(self, work_dir, environment):
        """Compile, and for native builds run, a trivial CUDA program.

        :param work_dir: directory in which the source and binary are written.
        :param environment: passed through to ``get_cross_extra_flags``.
        :raises EnvironmentException: if compilation fails, or if the
            resulting native executable exits with a non-zero status.
        """
        source_name = os.path.join(work_dir, 'sanitycheckcuda.cu')
        binary_name = os.path.join(work_dir, 'sanitycheckcuda')
        # Copy the list so that extending it below can never modify a list
        # owned by whoever produced the cross flags.
        extra_flags = list(self.get_cross_extra_flags(environment, link=False))
        if self.is_cross:
            extra_flags += self.get_compile_only_args()

        code = '''
        __global__ void kernel (void) {

        }

        int main(int argc,char** argv){
            return 0;
        }
        '''

        with open(source_name, 'w') as ofile:
            ofile.write(code)
        pc = subprocess.Popen(self.exelist + extra_flags + [source_name, '-o', binary_name])
        pc.wait()
        if pc.returncode != 0:
            raise EnvironmentException('Cuda compiler %s can not compile programs.' % self.name_string())
        if self.is_cross:
            # Can't check if the binaries run so we have to assume they do
            return
        pe = subprocess.Popen(binary_name)
        pe.wait()
        if pe.returncode != 0:
            raise EnvironmentException('Executables created by Cuda compiler %s are not runnable.' % self.name_string())

    def get_compiler_check_args(self):
        """Return a new list holding the base class's compiler-check arguments."""
        return super().get_compiler_check_args() + []

    def has_header_symbol(self, hname, symbol, prefix, env, extra_args=None, dependencies=None):
        """Check whether ``symbol`` is made available by header ``hname``.

        The base-class check is tried first.  If it fails, a second program
        containing ``using <symbol>;`` is compiled, and the result of that
        compilation is returned.
        """
        if super().has_header_symbol(hname, symbol, prefix, env, extra_args, dependencies):
            return True
        if extra_args is None:
            extra_args = []
        fargs = {'prefix': prefix, 'header': hname, 'symbol': symbol}
        t = '''{prefix}
        #include <{header}>
        using {symbol};
        int main () {{ return 0; }}'''
        return self.compiles(t.format(**fargs), env, extra_args, dependencies)

    def sanity_check_impl(self, work_dir, environment, sname, code):
        """Compile ``code`` as ``sname`` in ``work_dir`` and try to run it.

        When cross compiling without an exe wrapper the source is only
        compiled (not linked or run).  With a wrapper, the binary is run
        through the wrapper; for native builds it is run directly.

        :raises EnvironmentException: if compilation fails or the test
            binary exits with a non-zero status.
        """
        mlog.debug('Sanity testing ' + self.get_display_language() + ' compiler:', ' '.join(self.exelist))
        mlog.debug('Is cross compiler: %s.' % str(self.is_cross))

        extra_flags = []
        source_name = os.path.join(work_dir, sname)
        binname = sname.rsplit('.', 1)[0]
        if self.is_cross:
            binname += '_cross'
            if self.exe_wrapper is None:
                # Linking cross built apps is painful. You can't really
                # tell if you should use -nostdlib or not and for example
                # on OSX the compiler binary is the same but you need
                # a ton of compiler flags to differentiate between
                # arm and x86_64. So just compile.
                extra_flags += self.get_cross_extra_flags(environment, link=False)
                extra_flags += self.get_compile_only_args()
            else:
                extra_flags += self.get_cross_extra_flags(environment, link=True)
        # Is a valid executable output for all toolchains and platforms
        binname += '.exe'
        # Write binary check source
        binary_name = os.path.join(work_dir, binname)
        with open(source_name, 'w') as ofile:
            ofile.write(code)
        # Compile sanity check
        cmdlist = self.exelist + extra_flags + [source_name] + self.get_output_args(binary_name)
        pc, stdo, stde = Popen_safe(cmdlist, cwd=work_dir)
        mlog.debug('Sanity check compiler command line:', ' '.join(cmdlist))
        mlog.debug('Sanity check compile stdout:')
        mlog.debug(stdo)
        mlog.debug('-----\nSanity check compile stderr:')
        mlog.debug(stde)
        mlog.debug('-----')
        if pc.returncode != 0:
            raise EnvironmentException('Compiler {0} can not compile programs.'.format(self.name_string()))
        # Run sanity check
        if self.is_cross:
            if self.exe_wrapper is None:
                # Can't check if the binaries run so we have to assume they do
                return
            cmdlist = self.exe_wrapper + [binary_name]
        else:
            cmdlist = [binary_name]
        mlog.debug('Running test binary command: ' + ' '.join(cmdlist))
        pe = subprocess.Popen(cmdlist)
        pe.wait()
        if pe.returncode != 0:
            raise EnvironmentException('Executables created by {0} compiler {1} are not runnable.'.format(self.language, self.name_string()))

    def get_output_args(self, target):
        """Return the arguments that name ``target`` as the compiler output."""
        return ['-o', target]

    def name_string(self):
        """Return the compiler command as a single space-joined string."""
        return ' '.join(self.exelist)

    def get_dependency_gen_args(self, outtarget, outfile):
        """Return no arguments: dependency-file generation is not requested."""
        return []

    def get_compile_only_args(self):
        """Return the flag that stops after compilation (no linking)."""
        return ['-c']

    def get_no_optimization_args(self):
        """Return the flag that disables optimization."""
        return ['-O0']

    def get_optimization_args(self, optimization_level):
        """Look up ``optimization_level`` in ``cuda_optimization_args``."""
        return cuda_optimization_args[optimization_level]

    def get_debug_args(self, is_debug):
        """Look up ``is_debug`` in ``cuda_debug_args``."""
        return cuda_debug_args[is_debug]

    def get_linker_exelist(self):
        """Return a copy of the compiler command; it doubles as the linker."""
        return self.exelist[:]

    def get_linker_output_args(self, outputname):
        """Return the arguments that name ``outputname`` as the link output."""
        return ['-o', outputname]

    def get_warn_args(self, level):
        """Return the warning arguments registered for ``level`` in ``__init__``."""
        return self.warn_args[level]

    def get_buildtype_args(self, buildtype):
        """Look up ``buildtype`` in ``cuda_buildtype_args``."""
        return cuda_buildtype_args[buildtype]

    def get_include_args(self, path, is_system):
        """Return the ``-I`` argument for ``path``.

        An empty path is treated as the current directory.  ``is_system``
        is accepted but not used.
        """
        if path == '':
            path = '.'
        return ['-I' + path]

    def depfile_for_object(self, objfile):
        """Return the dependency-file name that belongs to ``objfile``."""
        return objfile + '.' + self.get_depfile_suffix()

    def get_depfile_suffix(self):
        """Return the file suffix used for dependency files."""
        return 'd'

    def get_buildtype_linker_args(self, buildtype):
        """Return no extra linker arguments for any build type."""
        return []

    def get_std_exe_link_args(self):
        """Return no extra arguments for linking executables."""
        return []

    def build_rpath_args(self, build_dir, from_dir, rpath_paths, build_rpath, install_rpath):
        """Return no rpath arguments; all parameters are ignored."""
        return []

    def get_linker_search_args(self, dirname):
        """Return the argument that adds ``dirname`` to the library search path.

        nvcc uses the Unix-style ``-L`` option; the MSVC ``/LIBPATH:`` form
        would be interpreted as an input file name.
        """
        return ['-L' + dirname]

    def linker_to_compiler_args(self, args):
        """Return ``args`` as a new list, without any translation.

        The compiler command is also the link command (see
        ``get_linker_exelist``), so linker arguments can be passed as they
        are; no MSVC-style ``/link`` separator is needed.
        """
        return list(args)

    def get_pic_args(self):
        """Return no position-independent-code arguments."""
        return []

    def compute_parameters_with_absolute_paths(self, parameter_list, build_dir):
        """Return an empty list, ignoring both arguments.

        NOTE(review): this discards every entry of ``parameter_list``; it
        looks like a placeholder -- confirm against the callers before
        relying on the result.
        """
        return []
@ -0,0 +1,5 @@ |
||||
# Minimal CUDA-only project: build one executable from a single .cu
# source file and register it as a test.
project('simple', 'cuda', version : '1.0.0')

prog_exe = executable('prog', 'prog.cu')
test('cudatest', prog_exe)
||||
|
@ -0,0 +1,30 @@ |
||||
#include <iostream> |
||||
|
||||
int main(int argc, char **argv) { |
||||
int cuda_devices = 0; |
||||
std::cout << "CUDA version: " << CUDART_VERSION << "\n"; |
||||
cudaGetDeviceCount(&cuda_devices); |
||||
if(cuda_devices == 0) { |
||||
std::cout << "No Cuda hardware found. Exiting.\n"; |
||||
return 0; |
||||
} |
||||
std::cout << "This computer has " << cuda_devices << " Cuda device(s).\n"; |
||||
cudaDeviceProp props; |
||||
cudaGetDeviceProperties(&props, 0); |
||||
std::cout << "Properties of device 0.\n\n"; |
||||
|
||||
std::cout << " Name: " << props.name << "\n"; |
||||
std::cout << " Global memory: " << props.totalGlobalMem << "\n"; |
||||
std::cout << " Shared memory: " << props.sharedMemPerBlock << "\n"; |
||||
std::cout << " Constant memory: " << props.totalConstMem << "\n"; |
||||
std::cout << " Block registers: " << props.regsPerBlock << "\n"; |
||||
|
||||
std::cout << " Warp size: " << props.warpSize << "\n"; |
||||
std::cout << " Threads per block: " << props.maxThreadsPerBlock << "\n"; |
||||
std::cout << " Max block dimensions: [ " << props.maxThreadsDim[0] << ", " << props.maxThreadsDim[1] << ", " << props.maxThreadsDim[2] << " ]" << "\n"; |
||||
std::cout << " Max grid dimensions: [ " << props.maxGridSize[0] << ", " << props.maxGridSize[1] << ", " << props.maxGridSize[2] << " ]" << "\n"; |
||||
std::cout << "\n"; |
||||
|
||||
return 0; |
||||
} |
||||
|
@ -0,0 +1,13 @@ |
||||
#include <stdio.h> |
||||
#include <iostream> |
||||
|
||||
// Empty device kernel: takes no arguments and performs no work.
__global__ void kernel() {
}
||||
|
||||
int do_cuda_stuff() { |
||||
kernel<<<1,1>>>(); |
||||
|
||||
printf("Hello, World!\n"); |
||||
return 0; |
||||
} |
||||
|
@ -0,0 +1,7 @@ |
||||
#include<iostream> |
||||
|
||||
int do_cuda_stuff(); |
||||
|
||||
int main(int argc, char **argv) { |
||||
return do_cuda_stuff(); |
||||
} |
@ -0,0 +1,7 @@ |
||||
# Project mixing a C++ translation unit with a CUDA one in a single
# executable; the 'static' subdirectory is processed afterwards.
project('simple', 'cuda', 'cpp')

mixed_exe = executable('prog', 'main.cpp', 'lib.cu')
test('cudatest', mixed_exe)

subdir('static')
||||
|
@ -0,0 +1,13 @@ |
||||
#include <stdio.h> |
||||
#include <iostream> |
||||
|
||||
// Empty device kernel: takes no arguments and performs no work.
__global__ void kernel() {
}
||||
|
||||
int do_cuda_stuff() { |
||||
kernel<<<1,1>>>(); |
||||
|
||||
printf("Hello, World!\n"); |
||||
return 0; |
||||
} |
||||
|
@ -0,0 +1,13 @@ |
||||
#include <stdio.h> |
||||
#include <iostream> |
||||
|
||||
// Empty device kernel: takes no arguments and performs no work.
__global__ void kernel() {
}
||||
|
||||
int do_cuda_stuff() { |
||||
kernel<<<1,1>>>(); |
||||
|
||||
printf("Hello, World!\n"); |
||||
return 0; |
||||
} |
||||
|
@ -0,0 +1,7 @@ |
||||
#include<iostream> |
||||
|
||||
int do_cuda_stuff(); |
||||
|
||||
int main(int argc, char **argv) { |
||||
return do_cuda_stuff(); |
||||
} |
@ -0,0 +1,4 @@ |
||||
# Build the CUDA source as a static library, link a C++ executable
# against it, and register that executable as a test.
cuda_lib = static_library('clib', 'lib.cu')
static_exe = executable('staexe', 'main_static.cpp',
  link_with : cuda_lib)
test('static Cuda test', static_exe)
Loading…
Reference in new issue