mirror of https://github.com/opencv/opencv.git
Open Source Computer Vision Library
https://opencv.org/
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
12305 lines
271 KiB
12305 lines
271 KiB
/******************************************************************************* |
|
* Copyright (c) 2008-2013 The Khronos Group Inc. |
|
* |
|
* Permission is hereby granted, free of charge, to any person obtaining a |
|
* copy of this software and/or associated documentation files (the |
|
* "Materials"), to deal in the Materials without restriction, including |
|
* without limitation the rights to use, copy, modify, merge, publish, |
|
* distribute, sublicense, and/or sell copies of the Materials, and to |
|
* permit persons to whom the Materials are furnished to do so, subject to |
|
* the following conditions: |
|
* |
|
* The above copyright notice and this permission notice shall be included |
|
* in all copies or substantial portions of the Materials. |
|
* |
|
* THE MATERIALS ARE PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, |
|
* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF |
|
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. |
|
* IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY |
|
* CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, |
|
* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE |
|
* MATERIALS OR THE USE OR OTHER DEALINGS IN THE MATERIALS. |
|
******************************************************************************/ |
|
|
|
/*! \file |
|
* |
|
* \brief C++ bindings for OpenCL 1.0 (rev 48), OpenCL 1.1 (rev 33) and |
|
* OpenCL 1.2 (rev 15) |
|
* \author Benedict R. Gaster, Laurent Morichetti and Lee Howes |
|
* |
|
* Additions and fixes from: |
|
* Brian Cole, March 3rd 2010 and April 2012 |
|
* Matt Gruenke, April 2012. |
|
* Bruce Merry, February 2013. |
|
* |
|
* \version 1.2.5 |
|
* \date June 2013 |
|
* |
|
* Optional extension support |
|
* |
|
* cl |
|
* cl_ext_device_fission |
|
* #define USE_CL_DEVICE_FISSION |
|
*/ |
|
|
|
/*! \mainpage |
|
* \section intro Introduction |
|
* For many large applications C++ is the language of choice and so it seems |
|
* reasonable to define C++ bindings for OpenCL. |
|
* |
|
* |
|
* The interface is contained with a single C++ header file \em cl.hpp and all |
|
* definitions are contained within the namespace \em cl. There is no additional |
|
* requirement to include \em cl.h and to use either the C++ or original C |
|
* bindings it is enough to simply include \em cl.hpp. |
|
* |
|
* The bindings themselves are lightweight and correspond closely to the |
|
* underlying C API. Using the C++ bindings introduces no additional execution |
|
* overhead. |
|
* |
|
* For detail documentation on the bindings see: |
|
* |
|
* The OpenCL C++ Wrapper API 1.2 (revision 09) |
|
* http://www.khronos.org/registry/cl/specs/opencl-cplusplus-1.2.pdf |
|
* |
|
* \section example Example |
|
* |
|
* The following example shows a general use case for the C++ |
|
* bindings, including support for the optional exception feature and |
|
* also the supplied vector and string classes, see following sections for |
|
* decriptions of these features. |
|
* |
|
* \code |
|
* #define __CL_ENABLE_EXCEPTIONS |
|
* |
|
* #if defined(__APPLE__) || defined(__MACOSX) |
|
* #include <OpenCL/cl.hpp> |
|
* #else |
|
* #include <CL/cl.hpp> |
|
* #endif |
|
* #include <cstdio> |
|
* #include <cstdlib> |
|
* #include <iostream> |
|
* |
|
* const char * helloStr = "__kernel void " |
|
* "hello(void) " |
|
* "{ " |
|
* " " |
|
* "} "; |
|
* |
|
* int |
|
* main(void) |
|
* { |
|
* cl_int err = CL_SUCCESS; |
|
* try { |
|
* |
|
* std::vector<cl::Platform> platforms; |
|
* cl::Platform::get(&platforms); |
|
* if (platforms.size() == 0) { |
|
* std::cout << "Platform size 0\n"; |
|
* return -1; |
|
* } |
|
* |
|
* cl_context_properties properties[] = |
|
* { CL_CONTEXT_PLATFORM, (cl_context_properties)(platforms[0])(), 0}; |
|
* cl::Context context(CL_DEVICE_TYPE_CPU, properties); |
|
* |
|
* std::vector<cl::Device> devices = context.getInfo<CL_CONTEXT_DEVICES>(); |
|
* |
|
* cl::Program::Sources source(1, |
|
* std::make_pair(helloStr,strlen(helloStr))); |
|
* cl::Program program_ = cl::Program(context, source); |
|
* program_.build(devices); |
|
* |
|
* cl::Kernel kernel(program_, "hello", &err); |
|
* |
|
* cl::Event event; |
|
* cl::CommandQueue queue(context, devices[0], 0, &err); |
|
* queue.enqueueNDRangeKernel( |
|
* kernel, |
|
* cl::NullRange, |
|
* cl::NDRange(4,4), |
|
* cl::NullRange, |
|
* NULL, |
|
* &event); |
|
* |
|
* event.wait(); |
|
* } |
|
* catch (cl::Error err) { |
|
* std::cerr |
|
* << "ERROR: " |
|
* << err.what() |
|
* << "(" |
|
* << err.err() |
|
* << ")" |
|
* << std::endl; |
|
* } |
|
* |
|
* return EXIT_SUCCESS; |
|
* } |
|
* |
|
* \endcode |
|
* |
|
*/ |
|
#ifndef CL_HPP_ |
|
#define CL_HPP_ |
|
|
|
#ifdef _WIN32 |
|
|
|
#include <windows.h> |
|
#include <malloc.h> |
|
#include <iterator> |
|
#include <intrin.h> |
|
|
|
#if defined(__CL_ENABLE_EXCEPTIONS) |
|
#include <exception> |
|
#endif // #if defined(__CL_ENABLE_EXCEPTIONS) |
|
|
|
#pragma push_macro("max") |
|
#undef max |
|
#if defined(USE_DX_INTEROP) |
|
#include <CL/cl_d3d10.h> |
|
#include <CL/cl_dx9_media_sharing.h> |
|
#endif |
|
#endif // _WIN32 |
|
|
|
// |
|
#if defined(USE_CL_DEVICE_FISSION) |
|
#include <CL/cl_ext.h> |
|
#endif |
|
|
|
#if defined(__APPLE__) || defined(__MACOSX) |
|
#include <OpenGL/OpenGL.h> |
|
#include <OpenCL/opencl.h> |
|
#include <libkern/OSAtomic.h> |
|
#else |
|
#include <GL/gl.h> |
|
#include <CL/opencl.h> |
|
#endif // !__APPLE__ |
|
|
|
// To avoid accidentally taking ownership of core OpenCL types |
|
// such as cl_kernel constructors are made explicit |
|
// under OpenCL 1.2 |
|
#if defined(CL_VERSION_1_2) && !defined(CL_USE_DEPRECATED_OPENCL_1_1_APIS) |
|
#define __CL_EXPLICIT_CONSTRUCTORS explicit |
|
#else // #if defined(CL_USE_DEPRECATED_OPENCL_1_1_APIS) |
|
#define __CL_EXPLICIT_CONSTRUCTORS |
|
#endif // #if defined(CL_USE_DEPRECATED_OPENCL_1_1_APIS) |
|
|
|
// Define deprecated prefixes and suffixes to ensure compilation |
|
// in case they are not pre-defined |
|
#if !defined(CL_EXT_PREFIX__VERSION_1_1_DEPRECATED) |
|
#define CL_EXT_PREFIX__VERSION_1_1_DEPRECATED |
|
#endif // #if !defined(CL_EXT_PREFIX__VERSION_1_1_DEPRECATED) |
|
#if !defined(CL_EXT_SUFFIX__VERSION_1_1_DEPRECATED) |
|
#define CL_EXT_SUFFIX__VERSION_1_1_DEPRECATED |
|
#endif // #if !defined(CL_EXT_PREFIX__VERSION_1_1_DEPRECATED) |
|
|
|
#if !defined(CL_CALLBACK) |
|
#define CL_CALLBACK |
|
#endif //CL_CALLBACK |
|
|
|
#include <utility> |
|
#include <limits> |
|
|
|
#if !defined(__NO_STD_VECTOR) |
|
#include <vector> |
|
#endif |
|
|
|
#if !defined(__NO_STD_STRING) |
|
#include <string> |
|
#endif |
|
|
|
#if defined(linux) || defined(__APPLE__) || defined(__MACOSX) |
|
#include <alloca.h> |
|
|
|
#include <emmintrin.h> |
|
#include <xmmintrin.h> |
|
#endif // linux |
|
|
|
#include <cstring> |
|
|
|
|
|
/*! \namespace cl |
|
* |
|
* \brief The OpenCL C++ bindings are defined within this namespace. |
|
* |
|
*/ |
|
namespace cl { |
|
|
|
class Memory; |
|
|
|
/** |
|
* Deprecated APIs for 1.2 |
|
*/ |
|
#if defined(CL_USE_DEPRECATED_OPENCL_1_1_APIS) || (defined(CL_VERSION_1_1) && !defined(CL_VERSION_1_2)) |
|
#define __INIT_CL_EXT_FCN_PTR(name) \ |
|
if(!pfn_##name) { \ |
|
pfn_##name = (PFN_##name) \ |
|
clGetExtensionFunctionAddress(#name); \ |
|
if(!pfn_##name) { \ |
|
} \ |
|
} |
|
#endif // #if defined(CL_VERSION_1_1) |
|
|
|
#if defined(CL_VERSION_1_2) |
|
#define __INIT_CL_EXT_FCN_PTR_PLATFORM(platform, name) \ |
|
if(!pfn_##name) { \ |
|
pfn_##name = (PFN_##name) \ |
|
clGetExtensionFunctionAddressForPlatform(platform, #name); \ |
|
if(!pfn_##name) { \ |
|
} \ |
|
} |
|
#endif // #if defined(CL_VERSION_1_1) |
|
|
|
class Program; |
|
class Device; |
|
class Context; |
|
class CommandQueue; |
|
class Memory; |
|
class Buffer; |
|
|
|
#if defined(__CL_ENABLE_EXCEPTIONS) |
|
/*! \brief Exception class |
|
* |
|
* This may be thrown by API functions when __CL_ENABLE_EXCEPTIONS is defined. |
|
*/ |
|
class Error : public std::exception |
|
{ |
|
private: |
|
cl_int err_; |
|
const char * errStr_; |
|
public: |
|
/*! \brief Create a new CL error exception for a given error code |
|
* and corresponding message. |
|
* |
|
* \param err error code value. |
|
* |
|
* \param errStr a descriptive string that must remain in scope until |
|
* handling of the exception has concluded. If set, it |
|
* will be returned by what(). |
|
*/ |
|
Error(cl_int err, const char * errStr = NULL) : err_(err), errStr_(errStr) |
|
{} |
|
|
|
~Error() throw() {} |
|
|
|
/*! \brief Get error string associated with exception |
|
* |
|
* \return A memory pointer to the error message string. |
|
*/ |
|
virtual const char * what() const throw () |
|
{ |
|
if (errStr_ == NULL) { |
|
return "empty"; |
|
} |
|
else { |
|
return errStr_; |
|
} |
|
} |
|
|
|
/*! \brief Get error code associated with exception |
|
* |
|
* \return The error code. |
|
*/ |
|
cl_int err(void) const { return err_; } |
|
}; |
|
|
|
#define __ERR_STR(x) #x |
|
#else |
|
#define __ERR_STR(x) NULL |
|
#endif // __CL_ENABLE_EXCEPTIONS |
|
|
|
|
|
namespace detail |
|
{ |
|
#if defined(__CL_ENABLE_EXCEPTIONS) |
|
static inline cl_int errHandler ( |
|
cl_int err, |
|
const char * errStr = NULL) |
|
{ |
|
if (err != CL_SUCCESS) { |
|
throw Error(err, errStr); |
|
} |
|
return err; |
|
} |
|
#else |
|
static inline cl_int errHandler (cl_int err, const char * errStr = NULL) |
|
{ |
|
(void) errStr; // suppress unused variable warning |
|
return err; |
|
} |
|
#endif // __CL_ENABLE_EXCEPTIONS |
|
} |
|
|
|
|
|
|
|
//! \cond DOXYGEN_DETAIL |
|
#if !defined(__CL_USER_OVERRIDE_ERROR_STRINGS) |
|
#define __GET_DEVICE_INFO_ERR __ERR_STR(clGetDeviceInfo) |
|
#define __GET_PLATFORM_INFO_ERR __ERR_STR(clGetPlatformInfo) |
|
#define __GET_DEVICE_IDS_ERR __ERR_STR(clGetDeviceIDs) |
|
#define __GET_PLATFORM_IDS_ERR __ERR_STR(clGetPlatformIDs) |
|
#define __GET_CONTEXT_INFO_ERR __ERR_STR(clGetContextInfo) |
|
#define __GET_EVENT_INFO_ERR __ERR_STR(clGetEventInfo) |
|
#define __GET_EVENT_PROFILE_INFO_ERR __ERR_STR(clGetEventProfileInfo) |
|
#define __GET_MEM_OBJECT_INFO_ERR __ERR_STR(clGetMemObjectInfo) |
|
#define __GET_IMAGE_INFO_ERR __ERR_STR(clGetImageInfo) |
|
#define __GET_SAMPLER_INFO_ERR __ERR_STR(clGetSamplerInfo) |
|
#define __GET_KERNEL_INFO_ERR __ERR_STR(clGetKernelInfo) |
|
#if defined(CL_VERSION_1_2) |
|
#define __GET_KERNEL_ARG_INFO_ERR __ERR_STR(clGetKernelArgInfo) |
|
#endif // #if defined(CL_VERSION_1_2) |
|
#define __GET_KERNEL_WORK_GROUP_INFO_ERR __ERR_STR(clGetKernelWorkGroupInfo) |
|
#define __GET_PROGRAM_INFO_ERR __ERR_STR(clGetProgramInfo) |
|
#define __GET_PROGRAM_BUILD_INFO_ERR __ERR_STR(clGetProgramBuildInfo) |
|
#define __GET_COMMAND_QUEUE_INFO_ERR __ERR_STR(clGetCommandQueueInfo) |
|
|
|
#define __CREATE_CONTEXT_ERR __ERR_STR(clCreateContext) |
|
#define __CREATE_CONTEXT_FROM_TYPE_ERR __ERR_STR(clCreateContextFromType) |
|
#define __GET_SUPPORTED_IMAGE_FORMATS_ERR __ERR_STR(clGetSupportedImageFormats) |
|
|
|
#define __CREATE_BUFFER_ERR __ERR_STR(clCreateBuffer) |
|
#define __COPY_ERR __ERR_STR(cl::copy) |
|
#define __CREATE_SUBBUFFER_ERR __ERR_STR(clCreateSubBuffer) |
|
#define __CREATE_GL_BUFFER_ERR __ERR_STR(clCreateFromGLBuffer) |
|
#define __CREATE_GL_RENDER_BUFFER_ERR __ERR_STR(clCreateFromGLBuffer) |
|
#define __GET_GL_OBJECT_INFO_ERR __ERR_STR(clGetGLObjectInfo) |
|
#if defined(CL_VERSION_1_2) |
|
#define __CREATE_IMAGE_ERR __ERR_STR(clCreateImage) |
|
#define __CREATE_GL_TEXTURE_ERR __ERR_STR(clCreateFromGLTexture) |
|
#define __IMAGE_DIMENSION_ERR __ERR_STR(Incorrect image dimensions) |
|
#endif // #if defined(CL_VERSION_1_2) |
|
#define __CREATE_SAMPLER_ERR __ERR_STR(clCreateSampler) |
|
#define __SET_MEM_OBJECT_DESTRUCTOR_CALLBACK_ERR __ERR_STR(clSetMemObjectDestructorCallback) |
|
|
|
#define __CREATE_USER_EVENT_ERR __ERR_STR(clCreateUserEvent) |
|
#define __SET_USER_EVENT_STATUS_ERR __ERR_STR(clSetUserEventStatus) |
|
#define __SET_EVENT_CALLBACK_ERR __ERR_STR(clSetEventCallback) |
|
#define __WAIT_FOR_EVENTS_ERR __ERR_STR(clWaitForEvents) |
|
|
|
#define __CREATE_KERNEL_ERR __ERR_STR(clCreateKernel) |
|
#define __SET_KERNEL_ARGS_ERR __ERR_STR(clSetKernelArg) |
|
#define __CREATE_PROGRAM_WITH_SOURCE_ERR __ERR_STR(clCreateProgramWithSource) |
|
#define __CREATE_PROGRAM_WITH_BINARY_ERR __ERR_STR(clCreateProgramWithBinary) |
|
#if defined(CL_VERSION_1_2) |
|
#define __CREATE_PROGRAM_WITH_BUILT_IN_KERNELS_ERR __ERR_STR(clCreateProgramWithBuiltInKernels) |
|
#endif // #if defined(CL_VERSION_1_2) |
|
#define __BUILD_PROGRAM_ERR __ERR_STR(clBuildProgram) |
|
#if defined(CL_VERSION_1_2) |
|
#define __COMPILE_PROGRAM_ERR __ERR_STR(clCompileProgram) |
|
|
|
#endif // #if defined(CL_VERSION_1_2) |
|
#define __CREATE_KERNELS_IN_PROGRAM_ERR __ERR_STR(clCreateKernelsInProgram) |
|
|
|
#define __CREATE_COMMAND_QUEUE_ERR __ERR_STR(clCreateCommandQueue) |
|
#define __SET_COMMAND_QUEUE_PROPERTY_ERR __ERR_STR(clSetCommandQueueProperty) |
|
#define __ENQUEUE_READ_BUFFER_ERR __ERR_STR(clEnqueueReadBuffer) |
|
#define __ENQUEUE_READ_BUFFER_RECT_ERR __ERR_STR(clEnqueueReadBufferRect) |
|
#define __ENQUEUE_WRITE_BUFFER_ERR __ERR_STR(clEnqueueWriteBuffer) |
|
#define __ENQUEUE_WRITE_BUFFER_RECT_ERR __ERR_STR(clEnqueueWriteBufferRect) |
|
#define __ENQEUE_COPY_BUFFER_ERR __ERR_STR(clEnqueueCopyBuffer) |
|
#define __ENQEUE_COPY_BUFFER_RECT_ERR __ERR_STR(clEnqueueCopyBufferRect) |
|
#define __ENQUEUE_FILL_BUFFER_ERR __ERR_STR(clEnqueueFillBuffer) |
|
#define __ENQUEUE_READ_IMAGE_ERR __ERR_STR(clEnqueueReadImage) |
|
#define __ENQUEUE_WRITE_IMAGE_ERR __ERR_STR(clEnqueueWriteImage) |
|
#define __ENQUEUE_COPY_IMAGE_ERR __ERR_STR(clEnqueueCopyImage) |
|
#define __ENQUEUE_FILL_IMAGE_ERR __ERR_STR(clEnqueueFillImage) |
|
#define __ENQUEUE_COPY_IMAGE_TO_BUFFER_ERR __ERR_STR(clEnqueueCopyImageToBuffer) |
|
#define __ENQUEUE_COPY_BUFFER_TO_IMAGE_ERR __ERR_STR(clEnqueueCopyBufferToImage) |
|
#define __ENQUEUE_MAP_BUFFER_ERR __ERR_STR(clEnqueueMapBuffer) |
|
#define __ENQUEUE_MAP_IMAGE_ERR __ERR_STR(clEnqueueMapImage) |
|
#define __ENQUEUE_UNMAP_MEM_OBJECT_ERR __ERR_STR(clEnqueueUnMapMemObject) |
|
#define __ENQUEUE_NDRANGE_KERNEL_ERR __ERR_STR(clEnqueueNDRangeKernel) |
|
#define __ENQUEUE_TASK_ERR __ERR_STR(clEnqueueTask) |
|
#define __ENQUEUE_NATIVE_KERNEL __ERR_STR(clEnqueueNativeKernel) |
|
#if defined(CL_VERSION_1_2) |
|
#define __ENQUEUE_MIGRATE_MEM_OBJECTS_ERR __ERR_STR(clEnqueueMigrateMemObjects) |
|
#endif // #if defined(CL_VERSION_1_2) |
|
|
|
#define __ENQUEUE_ACQUIRE_GL_ERR __ERR_STR(clEnqueueAcquireGLObjects) |
|
#define __ENQUEUE_RELEASE_GL_ERR __ERR_STR(clEnqueueReleaseGLObjects) |
|
|
|
|
|
#define __RETAIN_ERR __ERR_STR(Retain Object) |
|
#define __RELEASE_ERR __ERR_STR(Release Object) |
|
#define __FLUSH_ERR __ERR_STR(clFlush) |
|
#define __FINISH_ERR __ERR_STR(clFinish) |
|
#define __VECTOR_CAPACITY_ERR __ERR_STR(Vector capacity error) |
|
|
|
/** |
|
* CL 1.2 version that uses device fission. |
|
*/ |
|
#if defined(CL_VERSION_1_2) |
|
#define __CREATE_SUB_DEVICES __ERR_STR(clCreateSubDevices) |
|
#else |
|
#define __CREATE_SUB_DEVICES __ERR_STR(clCreateSubDevicesEXT) |
|
#endif // #if defined(CL_VERSION_1_2) |
|
|
|
/** |
|
* Deprecated APIs for 1.2 |
|
*/ |
|
#if defined(CL_USE_DEPRECATED_OPENCL_1_1_APIS) || (defined(CL_VERSION_1_1) && !defined(CL_VERSION_1_2)) |
|
#define __ENQUEUE_MARKER_ERR __ERR_STR(clEnqueueMarker) |
|
#define __ENQUEUE_WAIT_FOR_EVENTS_ERR __ERR_STR(clEnqueueWaitForEvents) |
|
#define __ENQUEUE_BARRIER_ERR __ERR_STR(clEnqueueBarrier) |
|
#define __UNLOAD_COMPILER_ERR __ERR_STR(clUnloadCompiler) |
|
#define __CREATE_GL_TEXTURE_2D_ERR __ERR_STR(clCreateFromGLTexture2D) |
|
#define __CREATE_GL_TEXTURE_3D_ERR __ERR_STR(clCreateFromGLTexture3D) |
|
#define __CREATE_IMAGE2D_ERR __ERR_STR(clCreateImage2D) |
|
#define __CREATE_IMAGE3D_ERR __ERR_STR(clCreateImage3D) |
|
#endif // #if defined(CL_VERSION_1_1) |
|
|
|
#endif // __CL_USER_OVERRIDE_ERROR_STRINGS |
|
//! \endcond |
|
|
|
/** |
|
* CL 1.2 marker and barrier commands |
|
*/ |
|
#if defined(CL_VERSION_1_2) |
|
#define __ENQUEUE_MARKER_WAIT_LIST_ERR __ERR_STR(clEnqueueMarkerWithWaitList) |
|
#define __ENQUEUE_BARRIER_WAIT_LIST_ERR __ERR_STR(clEnqueueBarrierWithWaitList) |
|
#endif // #if defined(CL_VERSION_1_2) |
|
|
|
#if !defined(__USE_DEV_STRING) && !defined(__NO_STD_STRING) |
|
typedef std::string STRING_CLASS; |
|
#elif !defined(__USE_DEV_STRING) |
|
|
|
/*! \class string |
|
* \brief Simple string class, that provides a limited subset of std::string |
|
* functionality but avoids many of the issues that come with that class. |
|
|
|
* \note Deprecated. Please use std::string as default or |
|
* re-define the string class to match the std::string |
|
* interface by defining STRING_CLASS |
|
*/ |
|
class CL_EXT_PREFIX__VERSION_1_1_DEPRECATED string CL_EXT_SUFFIX__VERSION_1_1_DEPRECATED |
|
{ |
|
private: |
|
::size_t size_; |
|
char * str_; |
|
public: |
|
//! \brief Constructs an empty string, allocating no memory. |
|
string(void) : size_(0), str_(NULL) |
|
{ |
|
} |
|
|
|
/*! \brief Constructs a string populated from an arbitrary value of |
|
* specified size. |
|
* |
|
* An extra '\0' is added, in case none was contained in str. |
|
* |
|
* \param str the initial value of the string instance. Note that '\0' |
|
* characters receive no special treatment. If NULL, |
|
* the string is left empty, with a size of 0. |
|
* |
|
* \param size the number of characters to copy from str. |
|
*/ |
|
string(const char * str, ::size_t size) : |
|
size_(size), |
|
str_(NULL) |
|
{ |
|
if( size > 0 ) { |
|
str_ = new char[size_+1]; |
|
if (str_ != NULL) { |
|
memcpy(str_, str, size_ * sizeof(char)); |
|
str_[size_] = '\0'; |
|
} |
|
else { |
|
size_ = 0; |
|
} |
|
} |
|
} |
|
|
|
/*! \brief Constructs a string populated from a null-terminated value. |
|
* |
|
* \param str the null-terminated initial value of the string instance. |
|
* If NULL, the string is left empty, with a size of 0. |
|
*/ |
|
string(const char * str) : |
|
size_(0), |
|
str_(NULL) |
|
{ |
|
if( str ) { |
|
size_= ::strlen(str); |
|
} |
|
if( size_ > 0 ) { |
|
str_ = new char[size_ + 1]; |
|
if (str_ != NULL) { |
|
memcpy(str_, str, (size_ + 1) * sizeof(char)); |
|
} |
|
} |
|
} |
|
|
|
void resize( ::size_t n ) |
|
{ |
|
if( size_ == n ) { |
|
return; |
|
} |
|
if (n == 0) { |
|
if( str_ ) { |
|
delete [] str_; |
|
} |
|
str_ = NULL; |
|
size_ = 0; |
|
} |
|
else { |
|
char *newString = new char[n + 1]; |
|
int copySize = n; |
|
if( size_ < n ) { |
|
copySize = size_; |
|
} |
|
size_ = n; |
|
|
|
if(str_) { |
|
memcpy(newString, str_, (copySize + 1) * sizeof(char)); |
|
} |
|
if( copySize < size_ ) { |
|
memset(newString + copySize, 0, size_ - copySize); |
|
} |
|
newString[size_] = '\0'; |
|
|
|
delete [] str_; |
|
str_ = newString; |
|
} |
|
} |
|
|
|
const char& operator[] ( ::size_t pos ) const |
|
{ |
|
return str_[pos]; |
|
} |
|
|
|
char& operator[] ( ::size_t pos ) |
|
{ |
|
return str_[pos]; |
|
} |
|
|
|
/*! \brief Copies the value of another string to this one. |
|
* |
|
* \param rhs the string to copy. |
|
* |
|
* \returns a reference to the modified instance. |
|
*/ |
|
string& operator=(const string& rhs) |
|
{ |
|
if (this == &rhs) { |
|
return *this; |
|
} |
|
|
|
if( str_ != NULL ) { |
|
delete [] str_; |
|
str_ = NULL; |
|
size_ = 0; |
|
} |
|
|
|
if (rhs.size_ == 0 || rhs.str_ == NULL) { |
|
str_ = NULL; |
|
size_ = 0; |
|
} |
|
else { |
|
str_ = new char[rhs.size_ + 1]; |
|
size_ = rhs.size_; |
|
|
|
if (str_ != NULL) { |
|
memcpy(str_, rhs.str_, (size_ + 1) * sizeof(char)); |
|
} |
|
else { |
|
size_ = 0; |
|
} |
|
} |
|
|
|
return *this; |
|
} |
|
|
|
/*! \brief Constructs a string by copying the value of another instance. |
|
* |
|
* \param rhs the string to copy. |
|
*/ |
|
string(const string& rhs) : |
|
size_(0), |
|
str_(NULL) |
|
{ |
|
*this = rhs; |
|
} |
|
|
|
//! \brief Destructor - frees memory used to hold the current value. |
|
~string() |
|
{ |
|
delete[] str_; |
|
str_ = NULL; |
|
} |
|
|
|
//! \brief Queries the length of the string, excluding any added '\0's. |
|
::size_t size(void) const { return size_; } |
|
|
|
//! \brief Queries the length of the string, excluding any added '\0's. |
|
::size_t length(void) const { return size(); } |
|
|
|
/*! \brief Returns a pointer to the private copy held by this instance, |
|
* or "" if empty/unset. |
|
*/ |
|
const char * c_str(void) const { return (str_) ? str_ : "";} |
|
}; |
|
typedef cl::string STRING_CLASS; |
|
#endif // #elif !defined(__USE_DEV_STRING) |
|
|
|
#if !defined(__USE_DEV_VECTOR) && !defined(__NO_STD_VECTOR) |
|
#define VECTOR_CLASS std::vector |
|
#elif !defined(__USE_DEV_VECTOR) |
|
#define VECTOR_CLASS cl::vector |
|
|
|
#if !defined(__MAX_DEFAULT_VECTOR_SIZE) |
|
#define __MAX_DEFAULT_VECTOR_SIZE 10 |
|
#endif |
|
|
|
/*! \class vector |
|
* \brief Fixed sized vector implementation that mirroring |
|
* |
|
* \note Deprecated. Please use std::vector as default or |
|
* re-define the vector class to match the std::vector |
|
* interface by defining VECTOR_CLASS |
|
|
|
* \note Not recommended for use with custom objects as |
|
* current implementation will construct N elements |
|
* |
|
* std::vector functionality. |
|
* \brief Fixed sized vector compatible with std::vector. |
|
* |
|
* \note |
|
* This differs from std::vector<> not just in memory allocation, |
|
* but also in terms of when members are constructed, destroyed, |
|
* and assigned instead of being copy constructed. |
|
* |
|
* \param T type of element contained in the vector. |
|
* |
|
* \param N maximum size of the vector. |
|
*/ |
|
template <typename T, unsigned int N = __MAX_DEFAULT_VECTOR_SIZE> |
|
class CL_EXT_PREFIX__VERSION_1_1_DEPRECATED vector CL_EXT_SUFFIX__VERSION_1_1_DEPRECATED |
|
{ |
|
private: |
|
T data_[N]; |
|
unsigned int size_; |
|
|
|
public: |
|
//! \brief Constructs an empty vector with no memory allocated. |
|
vector() : |
|
size_(static_cast<unsigned int>(0)) |
|
{} |
|
|
|
//! \brief Deallocates the vector's memory and destroys all of its elements. |
|
~vector() |
|
{ |
|
clear(); |
|
} |
|
|
|
//! \brief Returns the number of elements currently contained. |
|
unsigned int size(void) const |
|
{ |
|
return size_; |
|
} |
|
|
|
/*! \brief Empties the vector of all elements. |
|
* \note |
|
* This does not deallocate memory but will invoke destructors |
|
* on contained elements. |
|
*/ |
|
void clear() |
|
{ |
|
while(!empty()) { |
|
pop_back(); |
|
} |
|
} |
|
|
|
/*! \brief Appends an element after the last valid element. |
|
* Calling this on a vector that has reached capacity will throw an |
|
* exception if exceptions are enabled. |
|
*/ |
|
void push_back (const T& x) |
|
{ |
|
if (size() < N) { |
|
new (&data_[size_]) T(x); |
|
size_++; |
|
} else { |
|
detail::errHandler(CL_MEM_OBJECT_ALLOCATION_FAILURE, __VECTOR_CAPACITY_ERR); |
|
} |
|
} |
|
|
|
/*! \brief Removes the last valid element from the vector. |
|
* Calling this on an empty vector will throw an exception |
|
* if exceptions are enabled. |
|
*/ |
|
void pop_back(void) |
|
{ |
|
if (size_ != 0) { |
|
--size_; |
|
data_[size_].~T(); |
|
} else { |
|
detail::errHandler(CL_MEM_OBJECT_ALLOCATION_FAILURE, __VECTOR_CAPACITY_ERR); |
|
} |
|
} |
|
|
|
/*! \brief Constructs with a value copied from another. |
|
* |
|
* \param vec the vector to copy. |
|
*/ |
|
vector(const vector<T, N>& vec) : |
|
size_(vec.size_) |
|
{ |
|
if (size_ != 0) { |
|
assign(vec.begin(), vec.end()); |
|
} |
|
} |
|
|
|
/*! \brief Constructs with a specified number of initial elements. |
|
* |
|
* \param size number of initial elements. |
|
* |
|
* \param val value of initial elements. |
|
*/ |
|
vector(unsigned int size, const T& val = T()) : |
|
size_(0) |
|
{ |
|
for (unsigned int i = 0; i < size; i++) { |
|
push_back(val); |
|
} |
|
} |
|
|
|
/*! \brief Overwrites the current content with that copied from another |
|
* instance. |
|
* |
|
* \param rhs vector to copy. |
|
* |
|
* \returns a reference to this. |
|
*/ |
|
vector<T, N>& operator=(const vector<T, N>& rhs) |
|
{ |
|
if (this == &rhs) { |
|
return *this; |
|
} |
|
|
|
if (rhs.size_ != 0) { |
|
assign(rhs.begin(), rhs.end()); |
|
} else { |
|
clear(); |
|
} |
|
|
|
return *this; |
|
} |
|
|
|
/*! \brief Tests equality against another instance. |
|
* |
|
* \param vec the vector against which to compare. |
|
*/ |
|
bool operator==(vector<T,N> &vec) |
|
{ |
|
if (size() != vec.size()) { |
|
return false; |
|
} |
|
|
|
for( unsigned int i = 0; i < size(); ++i ) { |
|
if( operator[](i) != vec[i] ) { |
|
return false; |
|
} |
|
} |
|
return true; |
|
} |
|
|
|
//! \brief Conversion operator to T*. |
|
operator T* () { return data_; } |
|
|
|
//! \brief Conversion operator to const T*. |
|
operator const T* () const { return data_; } |
|
|
|
//! \brief Tests whether this instance has any elements. |
|
bool empty (void) const |
|
{ |
|
return size_==0; |
|
} |
|
|
|
//! \brief Returns the maximum number of elements this instance can hold. |
|
unsigned int max_size (void) const |
|
{ |
|
return N; |
|
} |
|
|
|
//! \brief Returns the maximum number of elements this instance can hold. |
|
unsigned int capacity () const |
|
{ |
|
return N; |
|
} |
|
|
|
/*! \brief Returns a reference to a given element. |
|
* |
|
* \param index which element to access. * |
|
* \note |
|
* The caller is responsible for ensuring index is >= 0 and < size(). |
|
*/ |
|
T& operator[](int index) |
|
{ |
|
return data_[index]; |
|
} |
|
|
|
/*! \brief Returns a const reference to a given element. |
|
* |
|
* \param index which element to access. |
|
* |
|
* \note |
|
* The caller is responsible for ensuring index is >= 0 and < size(). |
|
*/ |
|
const T& operator[](int index) const |
|
{ |
|
return data_[index]; |
|
} |
|
|
|
/*! \brief Assigns elements of the vector based on a source iterator range. |
|
* |
|
* \param start Beginning iterator of source range |
|
* \param end Enditerator of source range |
|
* |
|
* \note |
|
* Will throw an exception if exceptions are enabled and size exceeded. |
|
*/ |
|
template<class I> |
|
void assign(I start, I end) |
|
{ |
|
clear(); |
|
while(start != end) { |
|
push_back(*start); |
|
start++; |
|
} |
|
} |
|
|
|
/*! \class iterator |
|
* \brief Const iterator class for vectors |
|
*/ |
|
class iterator |
|
{ |
|
private: |
|
const vector<T,N> *vec_; |
|
int index_; |
|
|
|
/** |
|
* Internal iterator constructor to capture reference |
|
* to the vector it iterates over rather than taking |
|
* the vector by copy. |
|
*/ |
|
iterator (const vector<T,N> &vec, int index) : |
|
vec_(&vec) |
|
{ |
|
if( !vec.empty() ) { |
|
index_ = index; |
|
} else { |
|
index_ = -1; |
|
} |
|
} |
|
|
|
public: |
|
iterator(void) : |
|
index_(-1), |
|
vec_(NULL) |
|
{ |
|
} |
|
|
|
iterator(const iterator& rhs) : |
|
vec_(rhs.vec_), |
|
index_(rhs.index_) |
|
{ |
|
} |
|
|
|
~iterator(void) {} |
|
|
|
static iterator begin(const cl::vector<T,N> &vec) |
|
{ |
|
iterator i(vec, 0); |
|
|
|
return i; |
|
} |
|
|
|
static iterator end(const cl::vector<T,N> &vec) |
|
{ |
|
iterator i(vec, vec.size()); |
|
|
|
return i; |
|
} |
|
|
|
bool operator==(iterator i) |
|
{ |
|
return ((vec_ == i.vec_) && |
|
(index_ == i.index_)); |
|
} |
|
|
|
bool operator!=(iterator i) |
|
{ |
|
return (!(*this==i)); |
|
} |
|
|
|
iterator& operator++() |
|
{ |
|
++index_; |
|
return *this; |
|
} |
|
|
|
iterator operator++(int) |
|
{ |
|
iterator retVal(*this); |
|
++index_; |
|
return retVal; |
|
} |
|
|
|
iterator& operator--() |
|
{ |
|
--index_; |
|
return *this; |
|
} |
|
|
|
iterator operator--(int) |
|
{ |
|
iterator retVal(*this); |
|
--index_; |
|
return retVal; |
|
} |
|
|
|
const T& operator *() const |
|
{ |
|
return (*vec_)[index_]; |
|
} |
|
}; |
|
|
|
iterator begin(void) |
|
{ |
|
return iterator::begin(*this); |
|
} |
|
|
|
iterator begin(void) const |
|
{ |
|
return iterator::begin(*this); |
|
} |
|
|
|
iterator end(void) |
|
{ |
|
return iterator::end(*this); |
|
} |
|
|
|
iterator end(void) const |
|
{ |
|
return iterator::end(*this); |
|
} |
|
|
|
T& front(void) |
|
{ |
|
return data_[0]; |
|
} |
|
|
|
T& back(void) |
|
{ |
|
return data_[size_]; |
|
} |
|
|
|
const T& front(void) const |
|
{ |
|
return data_[0]; |
|
} |
|
|
|
const T& back(void) const |
|
{ |
|
return data_[size_-1]; |
|
} |
|
}; |
|
#endif // #if !defined(__USE_DEV_VECTOR) && !defined(__NO_STD_VECTOR) |
|
|
|
|
|
|
|
|
|
|
|
namespace detail { |
|
#define __DEFAULT_NOT_INITIALIZED 1 |
|
#define __DEFAULT_BEING_INITIALIZED 2 |
|
#define __DEFAULT_INITIALIZED 4 |
|
|
|
/* |
|
* Compare and exchange primitives are needed for handling of defaults |
|
*/ |
|
inline int compare_exchange(volatile int * dest, int exchange, int comparand) |
|
{ |
|
#ifdef _WIN32 |
|
return (int)(InterlockedCompareExchange( |
|
(volatile long*)dest, |
|
(long)exchange, |
|
(long)comparand)); |
|
#elif defined(__APPLE__) || defined(__MACOSX) |
|
return OSAtomicOr32Orig((uint32_t)exchange, (volatile uint32_t*)dest); |
|
#else // !_WIN32 || defined(__APPLE__) || defined(__MACOSX) |
|
return (__sync_val_compare_and_swap( |
|
dest, |
|
comparand, |
|
exchange)); |
|
#endif // !_WIN32 |
|
} |
|
|
|
inline void fence() { _mm_mfence(); } |
|
}; // namespace detail |
|
|
|
|
|
/*! \brief class used to interface between C++ and |
|
* OpenCL C calls that require arrays of size_t values, whose |
|
* size is known statically. |
|
*/ |
|
template <int N> |
|
class size_t |
|
{ |
|
private: |
|
::size_t data_[N]; |
|
|
|
public: |
|
//! \brief Initialize size_t to all 0s |
|
size_t() |
|
{ |
|
for( int i = 0; i < N; ++i ) { |
|
data_[i] = 0; |
|
} |
|
} |
|
|
|
::size_t& operator[](int index) |
|
{ |
|
return data_[index]; |
|
} |
|
|
|
const ::size_t& operator[](int index) const |
|
{ |
|
return data_[index]; |
|
} |
|
|
|
//! \brief Conversion operator to T*. |
|
operator ::size_t* () { return data_; } |
|
|
|
//! \brief Conversion operator to const T*. |
|
operator const ::size_t* () const { return data_; } |
|
}; |
|
|
|
namespace detail { |
|
|
|
// Generic getInfoHelper. The final parameter is used to guide overload |
|
// resolution: the actual parameter passed is an int, which makes this |
|
// a worse conversion sequence than a specialization that declares the |
|
// parameter as an int. |
|
template<typename Functor, typename T> |
|
inline cl_int getInfoHelper(Functor f, cl_uint name, T* param, long) |
|
{ |
|
return f(name, sizeof(T), param, NULL); |
|
} |
|
|
|
// Specialized getInfoHelper for VECTOR_CLASS params |
|
template <typename Func, typename T> |
|
inline cl_int getInfoHelper(Func f, cl_uint name, VECTOR_CLASS<T>* param, long) |
|
{ |
|
::size_t required; |
|
cl_int err = f(name, 0, NULL, &required); |
|
if (err != CL_SUCCESS) { |
|
return err; |
|
} |
|
|
|
T* value = (T*) alloca(required); |
|
err = f(name, required, value, NULL); |
|
if (err != CL_SUCCESS) { |
|
return err; |
|
} |
|
|
|
param->assign(&value[0], &value[required/sizeof(T)]); |
|
return CL_SUCCESS; |
|
} |
|
|
|
/* Specialization for reference-counted types. This depends on the |
|
* existence of Wrapper<T>::cl_type, and none of the other types having the |
|
* cl_type member. Note that simplify specifying the parameter as Wrapper<T> |
|
* does not work, because when using a derived type (e.g. Context) the generic |
|
* template will provide a better match. |
|
*/ |
|
template <typename Func, typename T> |
|
inline cl_int getInfoHelper(Func f, cl_uint name, VECTOR_CLASS<T>* param, int, typename T::cl_type = 0) |
|
{ |
|
::size_t required; |
|
cl_int err = f(name, 0, NULL, &required); |
|
if (err != CL_SUCCESS) { |
|
return err; |
|
} |
|
|
|
typename T::cl_type * value = (typename T::cl_type *) alloca(required); |
|
err = f(name, required, value, NULL); |
|
if (err != CL_SUCCESS) { |
|
return err; |
|
} |
|
|
|
::size_t elements = required / sizeof(typename T::cl_type); |
|
param->assign(&value[0], &value[elements]); |
|
for (::size_t i = 0; i < elements; i++) |
|
{ |
|
if (value[i] != NULL) |
|
{ |
|
err = (*param)[i].retain(); |
|
if (err != CL_SUCCESS) { |
|
return err; |
|
} |
|
} |
|
} |
|
return CL_SUCCESS; |
|
} |
|
|
|
// Specialized for getInfo<CL_PROGRAM_BINARIES> |
|
template <typename Func> |
|
inline cl_int getInfoHelper(Func f, cl_uint name, VECTOR_CLASS<char *>* param, int) |
|
{ |
|
cl_int err = f(name, param->size() * sizeof(char *), &(*param)[0], NULL); |
|
|
|
if (err != CL_SUCCESS) { |
|
return err; |
|
} |
|
|
|
return CL_SUCCESS; |
|
} |
|
|
|
// Specialized GetInfoHelper for STRING_CLASS params |
|
template <typename Func> |
|
inline cl_int getInfoHelper(Func f, cl_uint name, STRING_CLASS* param, long) |
|
{ |
|
::size_t required; |
|
cl_int err = f(name, 0, NULL, &required); |
|
if (err != CL_SUCCESS) { |
|
return err; |
|
} |
|
|
|
char* value = (char*) alloca(required); |
|
err = f(name, required, value, NULL); |
|
if (err != CL_SUCCESS) { |
|
return err; |
|
} |
|
|
|
*param = value; |
|
return CL_SUCCESS; |
|
} |
|
|
|
// Specialized GetInfoHelper for cl::size_t params |
|
template <typename Func, ::size_t N> |
|
inline cl_int getInfoHelper(Func f, cl_uint name, size_t<N>* param, long) |
|
{ |
|
::size_t required; |
|
cl_int err = f(name, 0, NULL, &required); |
|
if (err != CL_SUCCESS) { |
|
return err; |
|
} |
|
|
|
::size_t* value = (::size_t*) alloca(required); |
|
err = f(name, required, value, NULL); |
|
if (err != CL_SUCCESS) { |
|
return err; |
|
} |
|
|
|
for(int i = 0; i < N; ++i) { |
|
(*param)[i] = value[i]; |
|
} |
|
|
|
return CL_SUCCESS; |
|
} |
|
|
|
template<typename T> struct ReferenceHandler; |
|
|
|
/* Specialization for reference-counted types. This depends on the |
|
* existence of Wrapper<T>::cl_type, and none of the other types having the |
|
* cl_type member. Note that simplify specifying the parameter as Wrapper<T> |
|
* does not work, because when using a derived type (e.g. Context) the generic |
|
* template will provide a better match. |
|
*/ |
|
template<typename Func, typename T> |
|
inline cl_int getInfoHelper(Func f, cl_uint name, T* param, int, typename T::cl_type = 0) |
|
{ |
|
typename T::cl_type value; |
|
cl_int err = f(name, sizeof(value), &value, NULL); |
|
if (err != CL_SUCCESS) { |
|
return err; |
|
} |
|
*param = value; |
|
if (value != NULL) |
|
{ |
|
err = param->retain(); |
|
if (err != CL_SUCCESS) { |
|
return err; |
|
} |
|
} |
|
return CL_SUCCESS; |
|
} |
|
|
|
#define __PARAM_NAME_INFO_1_0(F) \ |
|
F(cl_platform_info, CL_PLATFORM_PROFILE, STRING_CLASS) \ |
|
F(cl_platform_info, CL_PLATFORM_VERSION, STRING_CLASS) \ |
|
F(cl_platform_info, CL_PLATFORM_NAME, STRING_CLASS) \ |
|
F(cl_platform_info, CL_PLATFORM_VENDOR, STRING_CLASS) \ |
|
F(cl_platform_info, CL_PLATFORM_EXTENSIONS, STRING_CLASS) \ |
|
\ |
|
F(cl_device_info, CL_DEVICE_TYPE, cl_device_type) \ |
|
F(cl_device_info, CL_DEVICE_VENDOR_ID, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_MAX_COMPUTE_UNITS, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_MAX_WORK_ITEM_DIMENSIONS, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_MAX_WORK_GROUP_SIZE, ::size_t) \ |
|
F(cl_device_info, CL_DEVICE_MAX_WORK_ITEM_SIZES, VECTOR_CLASS< ::size_t>) \ |
|
F(cl_device_info, CL_DEVICE_PREFERRED_VECTOR_WIDTH_CHAR, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_PREFERRED_VECTOR_WIDTH_SHORT, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_PREFERRED_VECTOR_WIDTH_INT, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_PREFERRED_VECTOR_WIDTH_LONG, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_PREFERRED_VECTOR_WIDTH_FLOAT, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_PREFERRED_VECTOR_WIDTH_DOUBLE, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_MAX_CLOCK_FREQUENCY, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_ADDRESS_BITS, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_MAX_READ_IMAGE_ARGS, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_MAX_WRITE_IMAGE_ARGS, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_MAX_MEM_ALLOC_SIZE, cl_ulong) \ |
|
F(cl_device_info, CL_DEVICE_IMAGE2D_MAX_WIDTH, ::size_t) \ |
|
F(cl_device_info, CL_DEVICE_IMAGE2D_MAX_HEIGHT, ::size_t) \ |
|
F(cl_device_info, CL_DEVICE_IMAGE3D_MAX_WIDTH, ::size_t) \ |
|
F(cl_device_info, CL_DEVICE_IMAGE3D_MAX_HEIGHT, ::size_t) \ |
|
F(cl_device_info, CL_DEVICE_IMAGE3D_MAX_DEPTH, ::size_t) \ |
|
F(cl_device_info, CL_DEVICE_IMAGE_SUPPORT, cl_bool) \ |
|
F(cl_device_info, CL_DEVICE_MAX_PARAMETER_SIZE, ::size_t) \ |
|
F(cl_device_info, CL_DEVICE_MAX_SAMPLERS, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_MEM_BASE_ADDR_ALIGN, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_MIN_DATA_TYPE_ALIGN_SIZE, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_SINGLE_FP_CONFIG, cl_device_fp_config) \ |
|
F(cl_device_info, CL_DEVICE_GLOBAL_MEM_CACHE_TYPE, cl_device_mem_cache_type) \ |
|
F(cl_device_info, CL_DEVICE_GLOBAL_MEM_CACHELINE_SIZE, cl_uint)\ |
|
F(cl_device_info, CL_DEVICE_GLOBAL_MEM_CACHE_SIZE, cl_ulong) \ |
|
F(cl_device_info, CL_DEVICE_GLOBAL_MEM_SIZE, cl_ulong) \ |
|
F(cl_device_info, CL_DEVICE_MAX_CONSTANT_BUFFER_SIZE, cl_ulong) \ |
|
F(cl_device_info, CL_DEVICE_MAX_CONSTANT_ARGS, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_LOCAL_MEM_TYPE, cl_device_local_mem_type) \ |
|
F(cl_device_info, CL_DEVICE_LOCAL_MEM_SIZE, cl_ulong) \ |
|
F(cl_device_info, CL_DEVICE_ERROR_CORRECTION_SUPPORT, cl_bool) \ |
|
F(cl_device_info, CL_DEVICE_PROFILING_TIMER_RESOLUTION, ::size_t) \ |
|
F(cl_device_info, CL_DEVICE_ENDIAN_LITTLE, cl_bool) \ |
|
F(cl_device_info, CL_DEVICE_AVAILABLE, cl_bool) \ |
|
F(cl_device_info, CL_DEVICE_COMPILER_AVAILABLE, cl_bool) \ |
|
F(cl_device_info, CL_DEVICE_EXECUTION_CAPABILITIES, cl_device_exec_capabilities) \ |
|
F(cl_device_info, CL_DEVICE_QUEUE_PROPERTIES, cl_command_queue_properties) \ |
|
F(cl_device_info, CL_DEVICE_PLATFORM, cl_platform_id) \ |
|
F(cl_device_info, CL_DEVICE_NAME, STRING_CLASS) \ |
|
F(cl_device_info, CL_DEVICE_VENDOR, STRING_CLASS) \ |
|
F(cl_device_info, CL_DRIVER_VERSION, STRING_CLASS) \ |
|
F(cl_device_info, CL_DEVICE_PROFILE, STRING_CLASS) \ |
|
F(cl_device_info, CL_DEVICE_VERSION, STRING_CLASS) \ |
|
F(cl_device_info, CL_DEVICE_EXTENSIONS, STRING_CLASS) \ |
|
\ |
|
F(cl_context_info, CL_CONTEXT_REFERENCE_COUNT, cl_uint) \ |
|
F(cl_context_info, CL_CONTEXT_DEVICES, VECTOR_CLASS<Device>) \ |
|
F(cl_context_info, CL_CONTEXT_PROPERTIES, VECTOR_CLASS<cl_context_properties>) \ |
|
\ |
|
F(cl_event_info, CL_EVENT_COMMAND_QUEUE, cl::CommandQueue) \ |
|
F(cl_event_info, CL_EVENT_COMMAND_TYPE, cl_command_type) \ |
|
F(cl_event_info, CL_EVENT_REFERENCE_COUNT, cl_uint) \ |
|
F(cl_event_info, CL_EVENT_COMMAND_EXECUTION_STATUS, cl_uint) \ |
|
\ |
|
F(cl_profiling_info, CL_PROFILING_COMMAND_QUEUED, cl_ulong) \ |
|
F(cl_profiling_info, CL_PROFILING_COMMAND_SUBMIT, cl_ulong) \ |
|
F(cl_profiling_info, CL_PROFILING_COMMAND_START, cl_ulong) \ |
|
F(cl_profiling_info, CL_PROFILING_COMMAND_END, cl_ulong) \ |
|
\ |
|
F(cl_mem_info, CL_MEM_TYPE, cl_mem_object_type) \ |
|
F(cl_mem_info, CL_MEM_FLAGS, cl_mem_flags) \ |
|
F(cl_mem_info, CL_MEM_SIZE, ::size_t) \ |
|
F(cl_mem_info, CL_MEM_HOST_PTR, void*) \ |
|
F(cl_mem_info, CL_MEM_MAP_COUNT, cl_uint) \ |
|
F(cl_mem_info, CL_MEM_REFERENCE_COUNT, cl_uint) \ |
|
F(cl_mem_info, CL_MEM_CONTEXT, cl::Context) \ |
|
\ |
|
F(cl_image_info, CL_IMAGE_FORMAT, cl_image_format) \ |
|
F(cl_image_info, CL_IMAGE_ELEMENT_SIZE, ::size_t) \ |
|
F(cl_image_info, CL_IMAGE_ROW_PITCH, ::size_t) \ |
|
F(cl_image_info, CL_IMAGE_SLICE_PITCH, ::size_t) \ |
|
F(cl_image_info, CL_IMAGE_WIDTH, ::size_t) \ |
|
F(cl_image_info, CL_IMAGE_HEIGHT, ::size_t) \ |
|
F(cl_image_info, CL_IMAGE_DEPTH, ::size_t) \ |
|
\ |
|
F(cl_sampler_info, CL_SAMPLER_REFERENCE_COUNT, cl_uint) \ |
|
F(cl_sampler_info, CL_SAMPLER_CONTEXT, cl::Context) \ |
|
F(cl_sampler_info, CL_SAMPLER_NORMALIZED_COORDS, cl_addressing_mode) \ |
|
F(cl_sampler_info, CL_SAMPLER_ADDRESSING_MODE, cl_filter_mode) \ |
|
F(cl_sampler_info, CL_SAMPLER_FILTER_MODE, cl_bool) \ |
|
\ |
|
F(cl_program_info, CL_PROGRAM_REFERENCE_COUNT, cl_uint) \ |
|
F(cl_program_info, CL_PROGRAM_CONTEXT, cl::Context) \ |
|
F(cl_program_info, CL_PROGRAM_NUM_DEVICES, cl_uint) \ |
|
F(cl_program_info, CL_PROGRAM_DEVICES, VECTOR_CLASS<Device>) \ |
|
F(cl_program_info, CL_PROGRAM_SOURCE, STRING_CLASS) \ |
|
F(cl_program_info, CL_PROGRAM_BINARY_SIZES, VECTOR_CLASS< ::size_t>) \ |
|
F(cl_program_info, CL_PROGRAM_BINARIES, VECTOR_CLASS<char *>) \ |
|
\ |
|
F(cl_program_build_info, CL_PROGRAM_BUILD_STATUS, cl_build_status) \ |
|
F(cl_program_build_info, CL_PROGRAM_BUILD_OPTIONS, STRING_CLASS) \ |
|
F(cl_program_build_info, CL_PROGRAM_BUILD_LOG, STRING_CLASS) \ |
|
\ |
|
F(cl_kernel_info, CL_KERNEL_FUNCTION_NAME, STRING_CLASS) \ |
|
F(cl_kernel_info, CL_KERNEL_NUM_ARGS, cl_uint) \ |
|
F(cl_kernel_info, CL_KERNEL_REFERENCE_COUNT, cl_uint) \ |
|
F(cl_kernel_info, CL_KERNEL_CONTEXT, cl::Context) \ |
|
F(cl_kernel_info, CL_KERNEL_PROGRAM, cl::Program) \ |
|
\ |
|
F(cl_kernel_work_group_info, CL_KERNEL_WORK_GROUP_SIZE, ::size_t) \ |
|
F(cl_kernel_work_group_info, CL_KERNEL_COMPILE_WORK_GROUP_SIZE, cl::size_t<3>) \ |
|
F(cl_kernel_work_group_info, CL_KERNEL_LOCAL_MEM_SIZE, cl_ulong) \ |
|
\ |
|
F(cl_command_queue_info, CL_QUEUE_CONTEXT, cl::Context) \ |
|
F(cl_command_queue_info, CL_QUEUE_DEVICE, cl::Device) \ |
|
F(cl_command_queue_info, CL_QUEUE_REFERENCE_COUNT, cl_uint) \ |
|
F(cl_command_queue_info, CL_QUEUE_PROPERTIES, cl_command_queue_properties) |
|
|
|
#if defined(CL_VERSION_1_1) |
|
#define __PARAM_NAME_INFO_1_1(F) \ |
|
F(cl_context_info, CL_CONTEXT_NUM_DEVICES, cl_uint)\ |
|
F(cl_device_info, CL_DEVICE_PREFERRED_VECTOR_WIDTH_HALF, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_NATIVE_VECTOR_WIDTH_CHAR, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_NATIVE_VECTOR_WIDTH_SHORT, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_NATIVE_VECTOR_WIDTH_INT, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_NATIVE_VECTOR_WIDTH_LONG, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_NATIVE_VECTOR_WIDTH_FLOAT, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_NATIVE_VECTOR_WIDTH_DOUBLE, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_NATIVE_VECTOR_WIDTH_HALF, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_DOUBLE_FP_CONFIG, cl_device_fp_config) \ |
|
F(cl_device_info, CL_DEVICE_HALF_FP_CONFIG, cl_device_fp_config) \ |
|
F(cl_device_info, CL_DEVICE_HOST_UNIFIED_MEMORY, cl_bool) \ |
|
F(cl_device_info, CL_DEVICE_OPENCL_C_VERSION, STRING_CLASS) \ |
|
\ |
|
F(cl_mem_info, CL_MEM_ASSOCIATED_MEMOBJECT, cl::Memory) \ |
|
F(cl_mem_info, CL_MEM_OFFSET, ::size_t) \ |
|
\ |
|
F(cl_kernel_work_group_info, CL_KERNEL_PREFERRED_WORK_GROUP_SIZE_MULTIPLE, ::size_t) \ |
|
F(cl_kernel_work_group_info, CL_KERNEL_PRIVATE_MEM_SIZE, cl_ulong) \ |
|
\ |
|
F(cl_event_info, CL_EVENT_CONTEXT, cl::Context) |
|
#endif // CL_VERSION_1_1 |
|
|
|
|
|
#if defined(CL_VERSION_1_2) |
|
#define __PARAM_NAME_INFO_1_2(F) \ |
|
F(cl_image_info, CL_IMAGE_BUFFER, cl::Buffer) \ |
|
\ |
|
F(cl_program_info, CL_PROGRAM_NUM_KERNELS, ::size_t) \ |
|
F(cl_program_info, CL_PROGRAM_KERNEL_NAMES, STRING_CLASS) \ |
|
\ |
|
F(cl_program_build_info, CL_PROGRAM_BINARY_TYPE, cl_program_binary_type) \ |
|
\ |
|
F(cl_kernel_info, CL_KERNEL_ATTRIBUTES, STRING_CLASS) \ |
|
\ |
|
F(cl_kernel_arg_info, CL_KERNEL_ARG_ADDRESS_QUALIFIER, cl_kernel_arg_address_qualifier) \ |
|
F(cl_kernel_arg_info, CL_KERNEL_ARG_ACCESS_QUALIFIER, cl_kernel_arg_access_qualifier) \ |
|
F(cl_kernel_arg_info, CL_KERNEL_ARG_TYPE_NAME, STRING_CLASS) \ |
|
F(cl_kernel_arg_info, CL_KERNEL_ARG_NAME, STRING_CLASS) \ |
|
\ |
|
F(cl_device_info, CL_DEVICE_PARENT_DEVICE, cl_device_id) \ |
|
F(cl_device_info, CL_DEVICE_PARTITION_PROPERTIES, VECTOR_CLASS<cl_device_partition_property>) \ |
|
F(cl_device_info, CL_DEVICE_PARTITION_TYPE, VECTOR_CLASS<cl_device_partition_property>) \ |
|
F(cl_device_info, CL_DEVICE_REFERENCE_COUNT, cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_PREFERRED_INTEROP_USER_SYNC, ::size_t) \ |
|
F(cl_device_info, CL_DEVICE_PARTITION_AFFINITY_DOMAIN, cl_device_affinity_domain) \ |
|
F(cl_device_info, CL_DEVICE_BUILT_IN_KERNELS, STRING_CLASS) |
|
#endif // #if defined(CL_VERSION_1_2) |
|
|
|
#if defined(USE_CL_DEVICE_FISSION) |
|
#define __PARAM_NAME_DEVICE_FISSION(F) \ |
|
F(cl_device_info, CL_DEVICE_PARENT_DEVICE_EXT, cl_device_id) \ |
|
F(cl_device_info, CL_DEVICE_PARTITION_TYPES_EXT, VECTOR_CLASS<cl_device_partition_property_ext>) \ |
|
F(cl_device_info, CL_DEVICE_AFFINITY_DOMAINS_EXT, VECTOR_CLASS<cl_device_partition_property_ext>) \ |
|
F(cl_device_info, CL_DEVICE_REFERENCE_COUNT_EXT , cl_uint) \ |
|
F(cl_device_info, CL_DEVICE_PARTITION_STYLE_EXT, VECTOR_CLASS<cl_device_partition_property_ext>) |
|
#endif // USE_CL_DEVICE_FISSION |
|
|
|
template <typename enum_type, cl_int Name> |
|
struct param_traits {}; |
|
|
|
#define __CL_DECLARE_PARAM_TRAITS(token, param_name, T) \ |
|
struct token; \ |
|
template<> \ |
|
struct param_traits<detail:: token,param_name> \ |
|
{ \ |
|
enum { value = param_name }; \ |
|
typedef T param_type; \ |
|
}; |
|
|
|
__PARAM_NAME_INFO_1_0(__CL_DECLARE_PARAM_TRAITS) |
|
#if defined(CL_VERSION_1_1) |
|
__PARAM_NAME_INFO_1_1(__CL_DECLARE_PARAM_TRAITS) |
|
#endif // CL_VERSION_1_1 |
|
#if defined(CL_VERSION_1_2) |
|
__PARAM_NAME_INFO_1_2(__CL_DECLARE_PARAM_TRAITS) |
|
#endif // CL_VERSION_1_1 |
|
|
|
#if defined(USE_CL_DEVICE_FISSION) |
|
__PARAM_NAME_DEVICE_FISSION(__CL_DECLARE_PARAM_TRAITS); |
|
#endif // USE_CL_DEVICE_FISSION |
|
|
|
#ifdef CL_PLATFORM_ICD_SUFFIX_KHR |
|
__CL_DECLARE_PARAM_TRAITS(cl_platform_info, CL_PLATFORM_ICD_SUFFIX_KHR, STRING_CLASS) |
|
#endif |
|
|
|
#ifdef CL_DEVICE_PROFILING_TIMER_OFFSET_AMD |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_PROFILING_TIMER_OFFSET_AMD, cl_ulong) |
|
#endif |
|
|
|
#ifdef CL_DEVICE_GLOBAL_FREE_MEMORY_AMD |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_GLOBAL_FREE_MEMORY_AMD, VECTOR_CLASS< ::size_t>) |
|
#endif |
|
#ifdef CL_DEVICE_SIMD_PER_COMPUTE_UNIT_AMD |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_SIMD_PER_COMPUTE_UNIT_AMD, cl_uint) |
|
#endif |
|
#ifdef CL_DEVICE_SIMD_WIDTH_AMD |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_SIMD_WIDTH_AMD, cl_uint) |
|
#endif |
|
#ifdef CL_DEVICE_SIMD_INSTRUCTION_WIDTH_AMD |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_SIMD_INSTRUCTION_WIDTH_AMD, cl_uint) |
|
#endif |
|
#ifdef CL_DEVICE_WAVEFRONT_WIDTH_AMD |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_WAVEFRONT_WIDTH_AMD, cl_uint) |
|
#endif |
|
#ifdef CL_DEVICE_GLOBAL_MEM_CHANNELS_AMD |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_GLOBAL_MEM_CHANNELS_AMD, cl_uint) |
|
#endif |
|
#ifdef CL_DEVICE_GLOBAL_MEM_CHANNEL_BANKS_AMD |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_GLOBAL_MEM_CHANNEL_BANKS_AMD, cl_uint) |
|
#endif |
|
#ifdef CL_DEVICE_GLOBAL_MEM_CHANNEL_BANK_WIDTH_AMD |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_GLOBAL_MEM_CHANNEL_BANK_WIDTH_AMD, cl_uint) |
|
#endif |
|
#ifdef CL_DEVICE_LOCAL_MEM_SIZE_PER_COMPUTE_UNIT_AMD |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_LOCAL_MEM_SIZE_PER_COMPUTE_UNIT_AMD, cl_uint) |
|
#endif |
|
#ifdef CL_DEVICE_LOCAL_MEM_BANKS_AMD |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_LOCAL_MEM_BANKS_AMD, cl_uint) |
|
#endif |
|
|
|
#ifdef CL_DEVICE_COMPUTE_CAPABILITY_MAJOR_NV |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_COMPUTE_CAPABILITY_MAJOR_NV, cl_uint) |
|
#endif |
|
#ifdef CL_DEVICE_COMPUTE_CAPABILITY_MINOR_NV |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_COMPUTE_CAPABILITY_MINOR_NV, cl_uint) |
|
#endif |
|
#ifdef CL_DEVICE_REGISTERS_PER_BLOCK_NV |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_REGISTERS_PER_BLOCK_NV, cl_uint) |
|
#endif |
|
#ifdef CL_DEVICE_WARP_SIZE_NV |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_WARP_SIZE_NV, cl_uint) |
|
#endif |
|
#ifdef CL_DEVICE_GPU_OVERLAP_NV |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_GPU_OVERLAP_NV, cl_bool) |
|
#endif |
|
#ifdef CL_DEVICE_KERNEL_EXEC_TIMEOUT_NV |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_KERNEL_EXEC_TIMEOUT_NV, cl_bool) |
|
#endif |
|
#ifdef CL_DEVICE_INTEGRATED_MEMORY_NV |
|
__CL_DECLARE_PARAM_TRAITS(cl_device_info, CL_DEVICE_INTEGRATED_MEMORY_NV, cl_bool) |
|
#endif |
|
|
|
// Convenience functions |
|
|
|
template <typename Func, typename T> |
|
inline cl_int |
|
getInfo(Func f, cl_uint name, T* param) |
|
{ |
|
return getInfoHelper(f, name, param, 0); |
|
} |
|
|
|
template <typename Func, typename Arg0> |
|
struct GetInfoFunctor0 |
|
{ |
|
Func f_; const Arg0& arg0_; |
|
cl_int operator ()( |
|
cl_uint param, ::size_t size, void* value, ::size_t* size_ret) |
|
{ return f_(arg0_, param, size, value, size_ret); } |
|
}; |
|
|
|
template <typename Func, typename Arg0, typename Arg1> |
|
struct GetInfoFunctor1 |
|
{ |
|
Func f_; const Arg0& arg0_; const Arg1& arg1_; |
|
cl_int operator ()( |
|
cl_uint param, ::size_t size, void* value, ::size_t* size_ret) |
|
{ return f_(arg0_, arg1_, param, size, value, size_ret); } |
|
}; |
|
|
|
template <typename Func, typename Arg0, typename T> |
|
inline cl_int |
|
getInfo(Func f, const Arg0& arg0, cl_uint name, T* param) |
|
{ |
|
GetInfoFunctor0<Func, Arg0> f0 = { f, arg0 }; |
|
return getInfoHelper(f0, name, param, 0); |
|
} |
|
|
|
template <typename Func, typename Arg0, typename Arg1, typename T> |
|
inline cl_int |
|
getInfo(Func f, const Arg0& arg0, const Arg1& arg1, cl_uint name, T* param) |
|
{ |
|
GetInfoFunctor1<Func, Arg0, Arg1> f0 = { f, arg0, arg1 }; |
|
return getInfoHelper(f0, name, param, 0); |
|
} |
|
|
|
template<typename T> |
|
struct ReferenceHandler |
|
{ }; |
|
|
|
#if defined(CL_VERSION_1_2) |
|
/** |
|
* OpenCL 1.2 devices do have retain/release. |
|
*/ |
|
template <> |
|
struct ReferenceHandler<cl_device_id> |
|
{ |
|
/** |
|
* Retain the device. |
|
* \param device A valid device created using createSubDevices |
|
* \return |
|
* CL_SUCCESS if the function executed successfully. |
|
* CL_INVALID_DEVICE if device was not a valid subdevice |
|
* CL_OUT_OF_RESOURCES |
|
* CL_OUT_OF_HOST_MEMORY |
|
*/ |
|
static cl_int retain(cl_device_id device) |
|
{ return ::clRetainDevice(device); } |
|
/** |
|
* Retain the device. |
|
* \param device A valid device created using createSubDevices |
|
* \return |
|
* CL_SUCCESS if the function executed successfully. |
|
* CL_INVALID_DEVICE if device was not a valid subdevice |
|
* CL_OUT_OF_RESOURCES |
|
* CL_OUT_OF_HOST_MEMORY |
|
*/ |
|
static cl_int release(cl_device_id device) |
|
{ return ::clReleaseDevice(device); } |
|
}; |
|
#else // #if defined(CL_VERSION_1_2) |
|
/** |
|
* OpenCL 1.1 devices do not have retain/release. |
|
*/ |
|
template <> |
|
struct ReferenceHandler<cl_device_id> |
|
{ |
|
// cl_device_id does not have retain(). |
|
static cl_int retain(cl_device_id) |
|
{ return CL_SUCCESS; } |
|
// cl_device_id does not have release(). |
|
static cl_int release(cl_device_id) |
|
{ return CL_SUCCESS; } |
|
}; |
|
#endif // #if defined(CL_VERSION_1_2) |
|
|
|
template <> |
|
struct ReferenceHandler<cl_platform_id> |
|
{ |
|
// cl_platform_id does not have retain(). |
|
static cl_int retain(cl_platform_id) |
|
{ return CL_SUCCESS; } |
|
// cl_platform_id does not have release(). |
|
static cl_int release(cl_platform_id) |
|
{ return CL_SUCCESS; } |
|
}; |
|
|
|
template <> |
|
struct ReferenceHandler<cl_context> |
|
{ |
|
static cl_int retain(cl_context context) |
|
{ return ::clRetainContext(context); } |
|
static cl_int release(cl_context context) |
|
{ return ::clReleaseContext(context); } |
|
}; |
|
|
|
template <> |
|
struct ReferenceHandler<cl_command_queue> |
|
{ |
|
static cl_int retain(cl_command_queue queue) |
|
{ return ::clRetainCommandQueue(queue); } |
|
static cl_int release(cl_command_queue queue) |
|
{ return ::clReleaseCommandQueue(queue); } |
|
}; |
|
|
|
template <> |
|
struct ReferenceHandler<cl_mem> |
|
{ |
|
static cl_int retain(cl_mem memory) |
|
{ return ::clRetainMemObject(memory); } |
|
static cl_int release(cl_mem memory) |
|
{ return ::clReleaseMemObject(memory); } |
|
}; |
|
|
|
template <> |
|
struct ReferenceHandler<cl_sampler> |
|
{ |
|
static cl_int retain(cl_sampler sampler) |
|
{ return ::clRetainSampler(sampler); } |
|
static cl_int release(cl_sampler sampler) |
|
{ return ::clReleaseSampler(sampler); } |
|
}; |
|
|
|
template <> |
|
struct ReferenceHandler<cl_program> |
|
{ |
|
static cl_int retain(cl_program program) |
|
{ return ::clRetainProgram(program); } |
|
static cl_int release(cl_program program) |
|
{ return ::clReleaseProgram(program); } |
|
}; |
|
|
|
template <> |
|
struct ReferenceHandler<cl_kernel> |
|
{ |
|
static cl_int retain(cl_kernel kernel) |
|
{ return ::clRetainKernel(kernel); } |
|
static cl_int release(cl_kernel kernel) |
|
{ return ::clReleaseKernel(kernel); } |
|
}; |
|
|
|
template <> |
|
struct ReferenceHandler<cl_event> |
|
{ |
|
static cl_int retain(cl_event event) |
|
{ return ::clRetainEvent(event); } |
|
static cl_int release(cl_event event) |
|
{ return ::clReleaseEvent(event); } |
|
}; |
|
|
|
|
|
// Extracts version number with major in the upper 16 bits, minor in the lower 16 |
|
static cl_uint getVersion(const char *versionInfo) |
|
{ |
|
int highVersion = 0; |
|
int lowVersion = 0; |
|
int index = 7; |
|
while(versionInfo[index] != '.' ) { |
|
highVersion *= 10; |
|
highVersion += versionInfo[index]-'0'; |
|
++index; |
|
} |
|
++index; |
|
while(versionInfo[index] != ' ' ) { |
|
lowVersion *= 10; |
|
lowVersion += versionInfo[index]-'0'; |
|
++index; |
|
} |
|
return (highVersion << 16) | lowVersion; |
|
} |
|
|
|
static cl_uint getPlatformVersion(cl_platform_id platform) |
|
{ |
|
::size_t size = 0; |
|
clGetPlatformInfo(platform, CL_PLATFORM_VERSION, 0, NULL, &size); |
|
char *versionInfo = (char *) alloca(size); |
|
clGetPlatformInfo(platform, CL_PLATFORM_VERSION, size, &versionInfo[0], &size); |
|
return getVersion(versionInfo); |
|
} |
|
|
|
static cl_uint getDevicePlatformVersion(cl_device_id device) |
|
{ |
|
cl_platform_id platform; |
|
clGetDeviceInfo(device, CL_DEVICE_PLATFORM, sizeof(platform), &platform, NULL); |
|
return getPlatformVersion(platform); |
|
} |
|
|
|
#if defined(CL_VERSION_1_2) && defined(CL_USE_DEPRECATED_OPENCL_1_1_APIS) |
|
static cl_uint getContextPlatformVersion(cl_context context) |
|
{ |
|
// The platform cannot be queried directly, so we first have to grab a |
|
// device and obtain its context |
|
::size_t size = 0; |
|
clGetContextInfo(context, CL_CONTEXT_DEVICES, 0, NULL, &size); |
|
if (size == 0) |
|
return 0; |
|
cl_device_id *devices = (cl_device_id *) alloca(size); |
|
clGetContextInfo(context, CL_CONTEXT_DEVICES, size, devices, NULL); |
|
return getDevicePlatformVersion(devices[0]); |
|
} |
|
#endif // #if defined(CL_VERSION_1_2) && defined(CL_USE_DEPRECATED_OPENCL_1_1_APIS) |
|
|
|
template <typename T> |
|
class Wrapper |
|
{ |
|
public: |
|
typedef T cl_type; |
|
|
|
protected: |
|
cl_type object_; |
|
|
|
public: |
|
Wrapper() : object_(NULL) { } |
|
|
|
Wrapper(const cl_type &obj) : object_(obj) { } |
|
|
|
~Wrapper() |
|
{ |
|
if (object_ != NULL) { release(); } |
|
} |
|
|
|
Wrapper(const Wrapper<cl_type>& rhs) |
|
{ |
|
object_ = rhs.object_; |
|
if (object_ != NULL) { detail::errHandler(retain(), __RETAIN_ERR); } |
|
} |
|
|
|
Wrapper<cl_type>& operator = (const Wrapper<cl_type>& rhs) |
|
{ |
|
if (object_ != NULL) { detail::errHandler(release(), __RELEASE_ERR); } |
|
object_ = rhs.object_; |
|
if (object_ != NULL) { detail::errHandler(retain(), __RETAIN_ERR); } |
|
return *this; |
|
} |
|
|
|
Wrapper<cl_type>& operator = (const cl_type &rhs) |
|
{ |
|
if (object_ != NULL) { detail::errHandler(release(), __RELEASE_ERR); } |
|
object_ = rhs; |
|
return *this; |
|
} |
|
|
|
cl_type operator ()() const { return object_; } |
|
|
|
cl_type& operator ()() { return object_; } |
|
|
|
protected: |
|
template<typename Func, typename U> |
|
friend inline cl_int getInfoHelper(Func, cl_uint, U*, int, typename U::cl_type); |
|
|
|
cl_int retain() const |
|
{ |
|
return ReferenceHandler<cl_type>::retain(object_); |
|
} |
|
|
|
cl_int release() const |
|
{ |
|
return ReferenceHandler<cl_type>::release(object_); |
|
} |
|
}; |
|
|
|
template <> |
|
class Wrapper<cl_device_id> |
|
{ |
|
public: |
|
typedef cl_device_id cl_type; |
|
|
|
protected: |
|
cl_type object_; |
|
bool referenceCountable_; |
|
|
|
static bool isReferenceCountable(cl_device_id device) |
|
{ |
|
bool retVal = false; |
|
if (device != NULL) { |
|
int version = getDevicePlatformVersion(device); |
|
if(version > ((1 << 16) + 1)) { |
|
retVal = true; |
|
} |
|
} |
|
return retVal; |
|
} |
|
|
|
public: |
|
Wrapper() : object_(NULL), referenceCountable_(false) |
|
{ |
|
} |
|
|
|
Wrapper(const cl_type &obj) : object_(obj), referenceCountable_(false) |
|
{ |
|
referenceCountable_ = isReferenceCountable(obj); |
|
} |
|
|
|
~Wrapper() |
|
{ |
|
if (object_ != NULL) { release(); } |
|
} |
|
|
|
Wrapper(const Wrapper<cl_type>& rhs) |
|
{ |
|
object_ = rhs.object_; |
|
referenceCountable_ = isReferenceCountable(object_); |
|
if (object_ != NULL) { detail::errHandler(retain(), __RETAIN_ERR); } |
|
} |
|
|
|
Wrapper<cl_type>& operator = (const Wrapper<cl_type>& rhs) |
|
{ |
|
if (object_ != NULL) { detail::errHandler(release(), __RELEASE_ERR); } |
|
object_ = rhs.object_; |
|
referenceCountable_ = rhs.referenceCountable_; |
|
if (object_ != NULL) { detail::errHandler(retain(), __RETAIN_ERR); } |
|
return *this; |
|
} |
|
|
|
Wrapper<cl_type>& operator = (const cl_type &rhs) |
|
{ |
|
if (object_ != NULL) { detail::errHandler(release(), __RELEASE_ERR); } |
|
object_ = rhs; |
|
referenceCountable_ = isReferenceCountable(object_); |
|
return *this; |
|
} |
|
|
|
cl_type operator ()() const { return object_; } |
|
|
|
cl_type& operator ()() { return object_; } |
|
|
|
protected: |
|
template<typename Func, typename U> |
|
friend inline cl_int getInfoHelper(Func, cl_uint, U*, int, typename U::cl_type); |
|
|
|
template<typename Func, typename U> |
|
friend inline cl_int getInfoHelper(Func, cl_uint, VECTOR_CLASS<U>*, int, typename U::cl_type); |
|
|
|
cl_int retain() const |
|
{ |
|
if( referenceCountable_ ) { |
|
return ReferenceHandler<cl_type>::retain(object_); |
|
} |
|
else { |
|
return CL_SUCCESS; |
|
} |
|
} |
|
|
|
cl_int release() const |
|
{ |
|
if( referenceCountable_ ) { |
|
return ReferenceHandler<cl_type>::release(object_); |
|
} |
|
else { |
|
return CL_SUCCESS; |
|
} |
|
} |
|
}; |
|
|
|
} // namespace detail |
|
//! \endcond |
|
|
|
/*! \stuct ImageFormat |
|
* \brief Adds constructors and member functions for cl_image_format. |
|
* |
|
* \see cl_image_format |
|
*/ |
|
struct ImageFormat : public cl_image_format |
|
{ |
|
//! \brief Default constructor - performs no initialization. |
|
ImageFormat(){} |
|
|
|
//! \brief Initializing constructor. |
|
ImageFormat(cl_channel_order order, cl_channel_type type) |
|
{ |
|
image_channel_order = order; |
|
image_channel_data_type = type; |
|
} |
|
|
|
//! \brief Assignment operator. |
|
ImageFormat& operator = (const ImageFormat& rhs) |
|
{ |
|
if (this != &rhs) { |
|
this->image_channel_data_type = rhs.image_channel_data_type; |
|
this->image_channel_order = rhs.image_channel_order; |
|
} |
|
return *this; |
|
} |
|
}; |
|
|
|
/*! \brief Class interface for cl_device_id. |
|
* |
|
* \note Copies of these objects are inexpensive, since they don't 'own' |
|
* any underlying resources or data structures. |
|
* |
|
* \see cl_device_id |
|
*/ |
|
class Device : public detail::Wrapper<cl_device_id> |
|
{ |
|
public: |
|
//! \brief Default constructor - initializes to NULL. |
|
Device() : detail::Wrapper<cl_type>() { } |
|
|
|
/*! \brief Copy constructor. |
|
* |
|
* This simply copies the device ID value, which is an inexpensive operation. |
|
*/ |
|
Device(const Device& device) : detail::Wrapper<cl_type>(device) { } |
|
|
|
/*! \brief Constructor from cl_device_id. |
|
* |
|
* This simply copies the device ID value, which is an inexpensive operation. |
|
*/ |
|
Device(const cl_device_id &device) : detail::Wrapper<cl_type>(device) { } |
|
|
|
/*! \brief Returns the first device on the default context. |
|
* |
|
* \see Context::getDefault() |
|
*/ |
|
static Device getDefault(cl_int * err = NULL); |
|
|
|
/*! \brief Assignment operator from Device. |
|
* |
|
* This simply copies the device ID value, which is an inexpensive operation. |
|
*/ |
|
Device& operator = (const Device& rhs) |
|
{ |
|
if (this != &rhs) { |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment operator from cl_device_id. |
|
* |
|
* This simply copies the device ID value, which is an inexpensive operation. |
|
*/ |
|
Device& operator = (const cl_device_id& rhs) |
|
{ |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
return *this; |
|
} |
|
|
|
//! \brief Wrapper for clGetDeviceInfo(). |
|
template <typename T> |
|
cl_int getInfo(cl_device_info name, T* param) const |
|
{ |
|
return detail::errHandler( |
|
detail::getInfo(&::clGetDeviceInfo, object_, name, param), |
|
__GET_DEVICE_INFO_ERR); |
|
} |
|
|
|
//! \brief Wrapper for clGetDeviceInfo() that returns by value. |
|
template <cl_int name> typename |
|
detail::param_traits<detail::cl_device_info, name>::param_type |
|
getInfo(cl_int* err = NULL) const |
|
{ |
|
typename detail::param_traits< |
|
detail::cl_device_info, name>::param_type param; |
|
cl_int result = getInfo(name, ¶m); |
|
if (err != NULL) { |
|
*err = result; |
|
} |
|
return param; |
|
} |
|
|
|
/** |
|
* CL 1.2 version |
|
*/ |
|
#if defined(CL_VERSION_1_2) |
|
//! \brief Wrapper for clCreateSubDevicesEXT(). |
|
cl_int createSubDevices( |
|
const cl_device_partition_property * properties, |
|
VECTOR_CLASS<Device>* devices) |
|
{ |
|
cl_uint n = 0; |
|
cl_int err = clCreateSubDevices(object_, properties, 0, NULL, &n); |
|
if (err != CL_SUCCESS) { |
|
return detail::errHandler(err, __CREATE_SUB_DEVICES); |
|
} |
|
|
|
cl_device_id* ids = (cl_device_id*) alloca(n * sizeof(cl_device_id)); |
|
err = clCreateSubDevices(object_, properties, n, ids, NULL); |
|
if (err != CL_SUCCESS) { |
|
return detail::errHandler(err, __CREATE_SUB_DEVICES); |
|
} |
|
|
|
devices->assign(&ids[0], &ids[n]); |
|
return CL_SUCCESS; |
|
} |
|
#endif // #if defined(CL_VERSION_1_2) |
|
|
|
/** |
|
* CL 1.1 version that uses device fission. |
|
*/ |
|
#if defined(CL_VERSION_1_1) |
|
#if defined(USE_CL_DEVICE_FISSION) |
|
cl_int createSubDevices( |
|
const cl_device_partition_property_ext * properties, |
|
VECTOR_CLASS<Device>* devices) |
|
{ |
|
typedef CL_API_ENTRY cl_int |
|
( CL_API_CALL * PFN_clCreateSubDevicesEXT)( |
|
cl_device_id /*in_device*/, |
|
const cl_device_partition_property_ext * /* properties */, |
|
cl_uint /*num_entries*/, |
|
cl_device_id * /*out_devices*/, |
|
cl_uint * /*num_devices*/ ) CL_EXT_SUFFIX__VERSION_1_1; |
|
|
|
static PFN_clCreateSubDevicesEXT pfn_clCreateSubDevicesEXT = NULL; |
|
__INIT_CL_EXT_FCN_PTR(clCreateSubDevicesEXT); |
|
|
|
cl_uint n = 0; |
|
cl_int err = pfn_clCreateSubDevicesEXT(object_, properties, 0, NULL, &n); |
|
if (err != CL_SUCCESS) { |
|
return detail::errHandler(err, __CREATE_SUB_DEVICES); |
|
} |
|
|
|
cl_device_id* ids = (cl_device_id*) alloca(n * sizeof(cl_device_id)); |
|
err = pfn_clCreateSubDevicesEXT(object_, properties, n, ids, NULL); |
|
if (err != CL_SUCCESS) { |
|
return detail::errHandler(err, __CREATE_SUB_DEVICES); |
|
} |
|
|
|
devices->assign(&ids[0], &ids[n]); |
|
return CL_SUCCESS; |
|
} |
|
#endif // #if defined(USE_CL_DEVICE_FISSION) |
|
#endif // #if defined(CL_VERSION_1_1) |
|
}; |
|
|
|
/*! \brief Class interface for cl_platform_id. |
|
* |
|
* \note Copies of these objects are inexpensive, since they don't 'own' |
|
* any underlying resources or data structures. |
|
* |
|
* \see cl_platform_id |
|
*/ |
|
class Platform : public detail::Wrapper<cl_platform_id> |
|
{ |
|
public: |
|
//! \brief Default constructor - initializes to NULL. |
|
Platform() : detail::Wrapper<cl_type>() { } |
|
|
|
/*! \brief Copy constructor. |
|
* |
|
* This simply copies the platform ID value, which is an inexpensive operation. |
|
*/ |
|
Platform(const Platform& platform) : detail::Wrapper<cl_type>(platform) { } |
|
|
|
/*! \brief Constructor from cl_platform_id. |
|
* |
|
* This simply copies the platform ID value, which is an inexpensive operation. |
|
*/ |
|
Platform(const cl_platform_id &platform) : detail::Wrapper<cl_type>(platform) { } |
|
|
|
/*! \brief Assignment operator from Platform. |
|
* |
|
* This simply copies the platform ID value, which is an inexpensive operation. |
|
*/ |
|
Platform& operator = (const Platform& rhs) |
|
{ |
|
if (this != &rhs) { |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment operator from cl_platform_id. |
|
* |
|
* This simply copies the platform ID value, which is an inexpensive operation. |
|
*/ |
|
Platform& operator = (const cl_platform_id& rhs) |
|
{ |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
return *this; |
|
} |
|
|
|
//! \brief Wrapper for clGetPlatformInfo(). |
|
cl_int getInfo(cl_platform_info name, STRING_CLASS* param) const |
|
{ |
|
return detail::errHandler( |
|
detail::getInfo(&::clGetPlatformInfo, object_, name, param), |
|
__GET_PLATFORM_INFO_ERR); |
|
} |
|
|
|
//! \brief Wrapper for clGetPlatformInfo() that returns by value. |
|
template <cl_int name> typename |
|
detail::param_traits<detail::cl_platform_info, name>::param_type |
|
getInfo(cl_int* err = NULL) const |
|
{ |
|
typename detail::param_traits< |
|
detail::cl_platform_info, name>::param_type param; |
|
cl_int result = getInfo(name, ¶m); |
|
if (err != NULL) { |
|
*err = result; |
|
} |
|
return param; |
|
} |
|
|
|
/*! \brief Gets a list of devices for this platform. |
|
* |
|
* Wraps clGetDeviceIDs(). |
|
*/ |
|
cl_int getDevices( |
|
cl_device_type type, |
|
VECTOR_CLASS<Device>* devices) const |
|
{ |
|
cl_uint n = 0; |
|
if( devices == NULL ) { |
|
return detail::errHandler(CL_INVALID_ARG_VALUE, __GET_DEVICE_IDS_ERR); |
|
} |
|
cl_int err = ::clGetDeviceIDs(object_, type, 0, NULL, &n); |
|
if (err != CL_SUCCESS) { |
|
return detail::errHandler(err, __GET_DEVICE_IDS_ERR); |
|
} |
|
|
|
cl_device_id* ids = (cl_device_id*) alloca(n * sizeof(cl_device_id)); |
|
err = ::clGetDeviceIDs(object_, type, n, ids, NULL); |
|
if (err != CL_SUCCESS) { |
|
return detail::errHandler(err, __GET_DEVICE_IDS_ERR); |
|
} |
|
|
|
devices->assign(&ids[0], &ids[n]); |
|
return CL_SUCCESS; |
|
} |
|
|
|
#if defined(USE_DX_INTEROP) |
|
/*! \brief Get the list of available D3D10 devices. |
|
* |
|
* \param d3d_device_source. |
|
* |
|
* \param d3d_object. |
|
* |
|
* \param d3d_device_set. |
|
* |
|
* \param devices returns a vector of OpenCL D3D10 devices found. The cl::Device |
|
* values returned in devices can be used to identify a specific OpenCL |
|
* device. If \a devices argument is NULL, this argument is ignored. |
|
* |
|
* \return One of the following values: |
|
* - CL_SUCCESS if the function is executed successfully. |
|
* |
|
* The application can query specific capabilities of the OpenCL device(s) |
|
* returned by cl::getDevices. This can be used by the application to |
|
* determine which device(s) to use. |
|
* |
|
* \note In the case that exceptions are enabled and a return value |
|
* other than CL_SUCCESS is generated, then cl::Error exception is |
|
* generated. |
|
*/ |
|
cl_int getDevices( |
|
cl_d3d10_device_source_khr d3d_device_source, |
|
void * d3d_object, |
|
cl_d3d10_device_set_khr d3d_device_set, |
|
VECTOR_CLASS<Device>* devices) const |
|
{ |
|
typedef CL_API_ENTRY cl_int (CL_API_CALL *PFN_clGetDeviceIDsFromD3D10KHR)( |
|
cl_platform_id platform, |
|
cl_d3d10_device_source_khr d3d_device_source, |
|
void * d3d_object, |
|
cl_d3d10_device_set_khr d3d_device_set, |
|
cl_uint num_entries, |
|
cl_device_id * devices, |
|
cl_uint* num_devices); |
|
|
|
if( devices == NULL ) { |
|
return detail::errHandler(CL_INVALID_ARG_VALUE, __GET_DEVICE_IDS_ERR); |
|
} |
|
|
|
static PFN_clGetDeviceIDsFromD3D10KHR pfn_clGetDeviceIDsFromD3D10KHR = NULL; |
|
__INIT_CL_EXT_FCN_PTR_PLATFORM(object_, clGetDeviceIDsFromD3D10KHR); |
|
|
|
cl_uint n = 0; |
|
cl_int err = pfn_clGetDeviceIDsFromD3D10KHR( |
|
object_, |
|
d3d_device_source, |
|
d3d_object, |
|
d3d_device_set, |
|
0, |
|
NULL, |
|
&n); |
|
if (err != CL_SUCCESS) { |
|
return detail::errHandler(err, __GET_DEVICE_IDS_ERR); |
|
} |
|
|
|
cl_device_id* ids = (cl_device_id*) alloca(n * sizeof(cl_device_id)); |
|
err = pfn_clGetDeviceIDsFromD3D10KHR( |
|
object_, |
|
d3d_device_source, |
|
d3d_object, |
|
d3d_device_set, |
|
n, |
|
ids, |
|
NULL); |
|
if (err != CL_SUCCESS) { |
|
return detail::errHandler(err, __GET_DEVICE_IDS_ERR); |
|
} |
|
|
|
devices->assign(&ids[0], &ids[n]); |
|
return CL_SUCCESS; |
|
} |
|
#endif |
|
|
|
/*! \brief Gets a list of available platforms. |
|
* |
|
* Wraps clGetPlatformIDs(). |
|
*/ |
|
static cl_int get( |
|
VECTOR_CLASS<Platform>* platforms) |
|
{ |
|
cl_uint n = 0; |
|
|
|
if( platforms == NULL ) { |
|
return detail::errHandler(CL_INVALID_ARG_VALUE, __GET_PLATFORM_IDS_ERR); |
|
} |
|
|
|
cl_int err = ::clGetPlatformIDs(0, NULL, &n); |
|
if (err != CL_SUCCESS) { |
|
return detail::errHandler(err, __GET_PLATFORM_IDS_ERR); |
|
} |
|
|
|
cl_platform_id* ids = (cl_platform_id*) alloca( |
|
n * sizeof(cl_platform_id)); |
|
err = ::clGetPlatformIDs(n, ids, NULL); |
|
if (err != CL_SUCCESS) { |
|
return detail::errHandler(err, __GET_PLATFORM_IDS_ERR); |
|
} |
|
|
|
platforms->assign(&ids[0], &ids[n]); |
|
return CL_SUCCESS; |
|
} |
|
|
|
/*! \brief Gets the first available platform. |
|
* |
|
* Wraps clGetPlatformIDs(), returning the first result. |
|
*/ |
|
static cl_int get( |
|
Platform * platform) |
|
{ |
|
cl_uint n = 0; |
|
|
|
if( platform == NULL ) { |
|
return detail::errHandler(CL_INVALID_ARG_VALUE, __GET_PLATFORM_IDS_ERR); |
|
} |
|
|
|
cl_int err = ::clGetPlatformIDs(0, NULL, &n); |
|
if (err != CL_SUCCESS) { |
|
return detail::errHandler(err, __GET_PLATFORM_IDS_ERR); |
|
} |
|
|
|
cl_platform_id* ids = (cl_platform_id*) alloca( |
|
n * sizeof(cl_platform_id)); |
|
err = ::clGetPlatformIDs(n, ids, NULL); |
|
if (err != CL_SUCCESS) { |
|
return detail::errHandler(err, __GET_PLATFORM_IDS_ERR); |
|
} |
|
|
|
*platform = ids[0]; |
|
return CL_SUCCESS; |
|
} |
|
|
|
/*! \brief Gets the first available platform, returning it by value. |
|
* |
|
* Wraps clGetPlatformIDs(), returning the first result. |
|
*/ |
|
static Platform get( |
|
cl_int * errResult = NULL) |
|
{ |
|
Platform platform; |
|
cl_uint n = 0; |
|
cl_int err = ::clGetPlatformIDs(0, NULL, &n); |
|
if (err != CL_SUCCESS) { |
|
detail::errHandler(err, __GET_PLATFORM_IDS_ERR); |
|
if (errResult != NULL) { |
|
*errResult = err; |
|
} |
|
} |
|
|
|
cl_platform_id* ids = (cl_platform_id*) alloca( |
|
n * sizeof(cl_platform_id)); |
|
err = ::clGetPlatformIDs(n, ids, NULL); |
|
|
|
if (err != CL_SUCCESS) { |
|
detail::errHandler(err, __GET_PLATFORM_IDS_ERR); |
|
} |
|
|
|
if (errResult != NULL) { |
|
*errResult = err; |
|
} |
|
|
|
return ids[0]; |
|
} |
|
|
|
static Platform getDefault( |
|
cl_int *errResult = NULL ) |
|
{ |
|
return get(errResult); |
|
} |
|
|
|
|
|
#if defined(CL_VERSION_1_2) |
|
//! \brief Wrapper for clUnloadCompiler(). |
|
cl_int |
|
unloadCompiler() |
|
{ |
|
return ::clUnloadPlatformCompiler(object_); |
|
} |
|
#endif // #if defined(CL_VERSION_1_2) |
|
}; // class Platform |
|
|
|
/** |
|
* Deprecated APIs for 1.2 |
|
*/ |
|
#if defined(CL_USE_DEPRECATED_OPENCL_1_1_APIS) || (defined(CL_VERSION_1_1) && !defined(CL_VERSION_1_2)) |
|
/** |
|
* Unload the OpenCL compiler. |
|
* \note Deprecated for OpenCL 1.2. Use Platform::unloadCompiler instead. |
|
*/ |
|
inline CL_EXT_PREFIX__VERSION_1_1_DEPRECATED cl_int |
|
UnloadCompiler() CL_EXT_SUFFIX__VERSION_1_1_DEPRECATED; |
|
inline cl_int |
|
UnloadCompiler() |
|
{ |
|
return ::clUnloadCompiler(); |
|
} |
|
#endif // #if defined(CL_VERSION_1_1) |
|
|
|
/*! \brief Class interface for cl_context. |
|
* |
|
* \note Copies of these objects are shallow, meaning that the copy will refer |
|
* to the same underlying cl_context as the original. For details, see |
|
* clRetainContext() and clReleaseContext(). |
|
* |
|
* \see cl_context |
|
*/ |
|
class Context |
|
: public detail::Wrapper<cl_context> |
|
{ |
|
private: |
|
static volatile int default_initialized_; |
|
static Context default_; |
|
static volatile cl_int default_error_; |
|
public: |
|
/*! \brief Destructor. |
|
* |
|
* This calls clReleaseContext() on the value held by this instance. |
|
*/ |
|
~Context() { } |
|
|
|
/*! \brief Constructs a context including a list of specified devices. |
|
* |
|
* Wraps clCreateContext(). |
|
*/ |
|
Context( |
|
const VECTOR_CLASS<Device>& devices, |
|
cl_context_properties* properties = NULL, |
|
void (CL_CALLBACK * notifyFptr)( |
|
const char *, |
|
const void *, |
|
::size_t, |
|
void *) = NULL, |
|
void* data = NULL, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
|
|
::size_t numDevices = devices.size(); |
|
cl_device_id* deviceIDs = (cl_device_id*) alloca(numDevices * sizeof(cl_device_id)); |
|
for( ::size_t deviceIndex = 0; deviceIndex < numDevices; ++deviceIndex ) { |
|
deviceIDs[deviceIndex] = (devices[deviceIndex])(); |
|
} |
|
|
|
object_ = ::clCreateContext( |
|
properties, (cl_uint) numDevices, |
|
deviceIDs, |
|
notifyFptr, data, &error); |
|
|
|
detail::errHandler(error, __CREATE_CONTEXT_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
Context( |
|
const Device& device, |
|
cl_context_properties* properties = NULL, |
|
void (CL_CALLBACK * notifyFptr)( |
|
const char *, |
|
const void *, |
|
::size_t, |
|
void *) = NULL, |
|
void* data = NULL, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
|
|
cl_device_id deviceID = device(); |
|
|
|
object_ = ::clCreateContext( |
|
properties, 1, |
|
&deviceID, |
|
notifyFptr, data, &error); |
|
|
|
detail::errHandler(error, __CREATE_CONTEXT_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
/*! \brief Constructs a context including all devices of a specified type. |
|
* |
|
* Wraps clCreateContextFromType(). |
|
*/ |
|
Context( |
|
cl_device_type type, |
|
cl_context_properties* properties = NULL, |
|
void (CL_CALLBACK * notifyFptr)( |
|
const char *, |
|
const void *, |
|
::size_t, |
|
void *) = NULL, |
|
void* data = NULL, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
|
|
#if !defined(__APPLE__) || !defined(__MACOS) |
|
cl_context_properties prop[4] = {CL_CONTEXT_PLATFORM, 0, 0, 0 }; |
|
if (properties == NULL) { |
|
prop[1] = (cl_context_properties)Platform::get(&error)(); |
|
if (error != CL_SUCCESS) { |
|
detail::errHandler(error, __CREATE_CONTEXT_FROM_TYPE_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
return; |
|
} |
|
} |
|
|
|
properties = &prop[0]; |
|
} |
|
#endif |
|
object_ = ::clCreateContextFromType( |
|
properties, type, notifyFptr, data, &error); |
|
|
|
detail::errHandler(error, __CREATE_CONTEXT_FROM_TYPE_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
/*! \brief Returns a singleton context including all devices of CL_DEVICE_TYPE_DEFAULT. |
|
* |
|
* \note All calls to this function return the same cl_context as the first. |
|
*/ |
|
static Context getDefault(cl_int * err = NULL) |
|
{ |
|
int state = detail::compare_exchange( |
|
&default_initialized_, |
|
__DEFAULT_BEING_INITIALIZED, __DEFAULT_NOT_INITIALIZED); |
|
|
|
if (state & __DEFAULT_INITIALIZED) { |
|
if (err != NULL) { |
|
*err = default_error_; |
|
} |
|
return default_; |
|
} |
|
|
|
if (state & __DEFAULT_BEING_INITIALIZED) { |
|
// Assume writes will propagate eventually... |
|
while(default_initialized_ != __DEFAULT_INITIALIZED) { |
|
detail::fence(); |
|
} |
|
|
|
if (err != NULL) { |
|
*err = default_error_; |
|
} |
|
return default_; |
|
} |
|
|
|
cl_int error; |
|
default_ = Context( |
|
CL_DEVICE_TYPE_DEFAULT, |
|
NULL, |
|
NULL, |
|
NULL, |
|
&error); |
|
|
|
detail::fence(); |
|
|
|
default_error_ = error; |
|
// Assume writes will propagate eventually... |
|
default_initialized_ = __DEFAULT_INITIALIZED; |
|
|
|
detail::fence(); |
|
|
|
if (err != NULL) { |
|
*err = default_error_; |
|
} |
|
return default_; |
|
|
|
} |
|
|
|
//! \brief Default constructor - initializes to NULL. |
|
Context() : detail::Wrapper<cl_type>() { } |
|
|
|
/*! \brief Copy constructor. |
|
* |
|
* This calls clRetainContext() on the parameter's cl_context. |
|
*/ |
|
Context(const Context& context) : detail::Wrapper<cl_type>(context) { } |
|
|
|
/*! \brief Constructor from cl_context - takes ownership. |
|
* |
|
* This effectively transfers ownership of a refcount on the cl_context |
|
* into the new Context object. |
|
*/ |
|
__CL_EXPLICIT_CONSTRUCTORS Context(const cl_context& context) : detail::Wrapper<cl_type>(context) { } |
|
|
|
/*! \brief Assignment operator from Context. |
|
* |
|
* This calls clRetainContext() on the parameter and clReleaseContext() on |
|
* the previous value held by this instance. |
|
*/ |
|
Context& operator = (const Context& rhs) |
|
{ |
|
if (this != &rhs) { |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment operator from cl_context - takes ownership. |
|
* |
|
* This effectively transfers ownership of a refcount on the rhs and calls |
|
* clReleaseContext() on the value previously held by this instance. |
|
*/ |
|
Context& operator = (const cl_context& rhs) |
|
{ |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
return *this; |
|
} |
|
|
|
//! \brief Wrapper for clGetContextInfo(). |
|
template <typename T> |
|
cl_int getInfo(cl_context_info name, T* param) const |
|
{ |
|
return detail::errHandler( |
|
detail::getInfo(&::clGetContextInfo, object_, name, param), |
|
__GET_CONTEXT_INFO_ERR); |
|
} |
|
|
|
//! \brief Wrapper for clGetContextInfo() that returns by value. |
|
template <cl_int name> typename |
|
detail::param_traits<detail::cl_context_info, name>::param_type |
|
getInfo(cl_int* err = NULL) const |
|
{ |
|
typename detail::param_traits< |
|
detail::cl_context_info, name>::param_type param; |
|
cl_int result = getInfo(name, ¶m); |
|
if (err != NULL) { |
|
*err = result; |
|
} |
|
return param; |
|
} |
|
|
|
/*! \brief Gets a list of supported image formats. |
|
* |
|
* Wraps clGetSupportedImageFormats(). |
|
*/ |
|
cl_int getSupportedImageFormats( |
|
cl_mem_flags flags, |
|
cl_mem_object_type type, |
|
VECTOR_CLASS<ImageFormat>* formats) const |
|
{ |
|
cl_uint numEntries; |
|
cl_int err = ::clGetSupportedImageFormats( |
|
object_, |
|
flags, |
|
type, |
|
0, |
|
NULL, |
|
&numEntries); |
|
if (err != CL_SUCCESS) { |
|
return detail::errHandler(err, __GET_SUPPORTED_IMAGE_FORMATS_ERR); |
|
} |
|
|
|
ImageFormat* value = (ImageFormat*) |
|
alloca(numEntries * sizeof(ImageFormat)); |
|
err = ::clGetSupportedImageFormats( |
|
object_, |
|
flags, |
|
type, |
|
numEntries, |
|
(cl_image_format*) value, |
|
NULL); |
|
if (err != CL_SUCCESS) { |
|
return detail::errHandler(err, __GET_SUPPORTED_IMAGE_FORMATS_ERR); |
|
} |
|
|
|
formats->assign(&value[0], &value[numEntries]); |
|
return CL_SUCCESS; |
|
} |
|
}; |
|
|
|
inline Device Device::getDefault(cl_int * err) |
|
{ |
|
cl_int error; |
|
Device device; |
|
|
|
Context context = Context::getDefault(&error); |
|
detail::errHandler(error, __CREATE_COMMAND_QUEUE_ERR); |
|
|
|
if (error != CL_SUCCESS) { |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
else { |
|
device = context.getInfo<CL_CONTEXT_DEVICES>()[0]; |
|
if (err != NULL) { |
|
*err = CL_SUCCESS; |
|
} |
|
} |
|
|
|
return device; |
|
} |
|
|
|
|
|
#ifdef _WIN32 |
|
__declspec(selectany) volatile int Context::default_initialized_ = __DEFAULT_NOT_INITIALIZED; |
|
__declspec(selectany) Context Context::default_; |
|
__declspec(selectany) volatile cl_int Context::default_error_ = CL_SUCCESS; |
|
#else |
|
__attribute__((weak)) volatile int Context::default_initialized_ = __DEFAULT_NOT_INITIALIZED; |
|
__attribute__((weak)) Context Context::default_; |
|
__attribute__((weak)) volatile cl_int Context::default_error_ = CL_SUCCESS; |
|
#endif |
|
|
|
/*! \brief Class interface for cl_event. |
|
* |
|
* \note Copies of these objects are shallow, meaning that the copy will refer |
|
* to the same underlying cl_event as the original. For details, see |
|
* clRetainEvent() and clReleaseEvent(). |
|
* |
|
* \see cl_event |
|
*/ |
|
class Event : public detail::Wrapper<cl_event> |
|
{ |
|
public: |
|
/*! \brief Destructor. |
|
* |
|
* This calls clReleaseEvent() on the value held by this instance. |
|
*/ |
|
~Event() { } |
|
|
|
//! \brief Default constructor - initializes to NULL. |
|
Event() : detail::Wrapper<cl_type>() { } |
|
|
|
/*! \brief Copy constructor. |
|
* |
|
* This calls clRetainEvent() on the parameter's cl_event. |
|
*/ |
|
Event(const Event& event) : detail::Wrapper<cl_type>(event) { } |
|
|
|
/*! \brief Constructor from cl_event - takes ownership. |
|
* |
|
* This effectively transfers ownership of a refcount on the cl_event |
|
* into the new Event object. |
|
*/ |
|
Event(const cl_event& event) : detail::Wrapper<cl_type>(event) { } |
|
|
|
/*! \brief Assignment operator from cl_event - takes ownership. |
|
* |
|
* This effectively transfers ownership of a refcount on the rhs and calls |
|
* clReleaseEvent() on the value previously held by this instance. |
|
*/ |
|
Event& operator = (const Event& rhs) |
|
{ |
|
if (this != &rhs) { |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment operator from cl_event. |
|
* |
|
* This calls clRetainEvent() on the parameter and clReleaseEvent() on |
|
* the previous value held by this instance. |
|
*/ |
|
Event& operator = (const cl_event& rhs) |
|
{ |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
return *this; |
|
} |
|
|
|
//! \brief Wrapper for clGetEventInfo(). |
|
template <typename T> |
|
cl_int getInfo(cl_event_info name, T* param) const |
|
{ |
|
return detail::errHandler( |
|
detail::getInfo(&::clGetEventInfo, object_, name, param), |
|
__GET_EVENT_INFO_ERR); |
|
} |
|
|
|
//! \brief Wrapper for clGetEventInfo() that returns by value. |
|
template <cl_int name> typename |
|
detail::param_traits<detail::cl_event_info, name>::param_type |
|
getInfo(cl_int* err = NULL) const |
|
{ |
|
typename detail::param_traits< |
|
detail::cl_event_info, name>::param_type param; |
|
cl_int result = getInfo(name, ¶m); |
|
if (err != NULL) { |
|
*err = result; |
|
} |
|
return param; |
|
} |
|
|
|
//! \brief Wrapper for clGetEventProfilingInfo(). |
|
template <typename T> |
|
cl_int getProfilingInfo(cl_profiling_info name, T* param) const |
|
{ |
|
return detail::errHandler(detail::getInfo( |
|
&::clGetEventProfilingInfo, object_, name, param), |
|
__GET_EVENT_PROFILE_INFO_ERR); |
|
} |
|
|
|
//! \brief Wrapper for clGetEventProfilingInfo() that returns by value. |
|
template <cl_int name> typename |
|
detail::param_traits<detail::cl_profiling_info, name>::param_type |
|
getProfilingInfo(cl_int* err = NULL) const |
|
{ |
|
typename detail::param_traits< |
|
detail::cl_profiling_info, name>::param_type param; |
|
cl_int result = getProfilingInfo(name, ¶m); |
|
if (err != NULL) { |
|
*err = result; |
|
} |
|
return param; |
|
} |
|
|
|
/*! \brief Blocks the calling thread until this event completes. |
|
* |
|
* Wraps clWaitForEvents(). |
|
*/ |
|
cl_int wait() const |
|
{ |
|
return detail::errHandler( |
|
::clWaitForEvents(1, &object_), |
|
__WAIT_FOR_EVENTS_ERR); |
|
} |
|
|
|
#if defined(CL_VERSION_1_1) |
|
/*! \brief Registers a user callback function for a specific command execution status. |
|
* |
|
* Wraps clSetEventCallback(). |
|
*/ |
|
cl_int setCallback( |
|
cl_int type, |
|
void (CL_CALLBACK * pfn_notify)(cl_event, cl_int, void *), |
|
void * user_data = NULL) |
|
{ |
|
return detail::errHandler( |
|
::clSetEventCallback( |
|
object_, |
|
type, |
|
pfn_notify, |
|
user_data), |
|
__SET_EVENT_CALLBACK_ERR); |
|
} |
|
#endif |
|
|
|
/*! \brief Blocks the calling thread until every event specified is complete. |
|
* |
|
* Wraps clWaitForEvents(). |
|
*/ |
|
static cl_int |
|
waitForEvents(const VECTOR_CLASS<Event>& events) |
|
{ |
|
return detail::errHandler( |
|
::clWaitForEvents( |
|
(cl_uint) events.size(), (cl_event*)&events.front()), |
|
__WAIT_FOR_EVENTS_ERR); |
|
} |
|
}; |
|
|
|
#if defined(CL_VERSION_1_1) |
|
/*! \brief Class interface for user events (a subset of cl_event's). |
|
* |
|
* See Event for details about copy semantics, etc. |
|
*/ |
|
class UserEvent : public Event |
|
{ |
|
public: |
|
/*! \brief Constructs a user event on a given context. |
|
* |
|
* Wraps clCreateUserEvent(). |
|
*/ |
|
UserEvent( |
|
const Context& context, |
|
cl_int * err = NULL) |
|
{ |
|
cl_int error; |
|
object_ = ::clCreateUserEvent( |
|
context(), |
|
&error); |
|
|
|
detail::errHandler(error, __CREATE_USER_EVENT_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
//! \brief Default constructor - initializes to NULL. |
|
UserEvent() : Event() { } |
|
|
|
//! \brief Copy constructor - performs shallow copy. |
|
UserEvent(const UserEvent& event) : Event(event) { } |
|
|
|
//! \brief Assignment Operator - performs shallow copy. |
|
UserEvent& operator = (const UserEvent& rhs) |
|
{ |
|
if (this != &rhs) { |
|
Event::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Sets the execution status of a user event object. |
|
* |
|
* Wraps clSetUserEventStatus(). |
|
*/ |
|
cl_int setStatus(cl_int status) |
|
{ |
|
return detail::errHandler( |
|
::clSetUserEventStatus(object_,status), |
|
__SET_USER_EVENT_STATUS_ERR); |
|
} |
|
}; |
|
#endif |
|
|
|
/*! \brief Blocks the calling thread until every event specified is complete. |
|
* |
|
* Wraps clWaitForEvents(). |
|
*/ |
|
inline static cl_int |
|
WaitForEvents(const VECTOR_CLASS<Event>& events) |
|
{ |
|
return detail::errHandler( |
|
::clWaitForEvents( |
|
(cl_uint) events.size(), (cl_event*)&events.front()), |
|
__WAIT_FOR_EVENTS_ERR); |
|
} |
|
|
|
/*! \brief Class interface for cl_mem. |
|
* |
|
* \note Copies of these objects are shallow, meaning that the copy will refer |
|
* to the same underlying cl_mem as the original. For details, see |
|
* clRetainMemObject() and clReleaseMemObject(). |
|
* |
|
* \see cl_mem |
|
*/ |
|
class Memory : public detail::Wrapper<cl_mem> |
|
{ |
|
public: |
|
|
|
/*! \brief Destructor. |
|
* |
|
* This calls clReleaseMemObject() on the value held by this instance. |
|
*/ |
|
~Memory() {} |
|
|
|
//! \brief Default constructor - initializes to NULL. |
|
Memory() : detail::Wrapper<cl_type>() { } |
|
|
|
/*! \brief Copy constructor - performs shallow copy. |
|
* |
|
* This calls clRetainMemObject() on the parameter's cl_mem. |
|
*/ |
|
Memory(const Memory& memory) : detail::Wrapper<cl_type>(memory) { } |
|
|
|
/*! \brief Constructor from cl_mem - takes ownership. |
|
* |
|
* This effectively transfers ownership of a refcount on the cl_mem |
|
* into the new Memory object. |
|
*/ |
|
__CL_EXPLICIT_CONSTRUCTORS Memory(const cl_mem& memory) : detail::Wrapper<cl_type>(memory) { } |
|
|
|
/*! \brief Assignment operator from Memory. |
|
* |
|
* This calls clRetainMemObject() on the parameter and clReleaseMemObject() |
|
* on the previous value held by this instance. |
|
*/ |
|
Memory& operator = (const Memory& rhs) |
|
{ |
|
if (this != &rhs) { |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment operator from cl_mem - takes ownership. |
|
* |
|
* This effectively transfers ownership of a refcount on the rhs and calls |
|
* clReleaseMemObject() on the value previously held by this instance. |
|
*/ |
|
Memory& operator = (const cl_mem& rhs) |
|
{ |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
return *this; |
|
} |
|
|
|
//! \brief Wrapper for clGetMemObjectInfo(). |
|
template <typename T> |
|
cl_int getInfo(cl_mem_info name, T* param) const |
|
{ |
|
return detail::errHandler( |
|
detail::getInfo(&::clGetMemObjectInfo, object_, name, param), |
|
__GET_MEM_OBJECT_INFO_ERR); |
|
} |
|
|
|
//! \brief Wrapper for clGetMemObjectInfo() that returns by value. |
|
template <cl_int name> typename |
|
detail::param_traits<detail::cl_mem_info, name>::param_type |
|
getInfo(cl_int* err = NULL) const |
|
{ |
|
typename detail::param_traits< |
|
detail::cl_mem_info, name>::param_type param; |
|
cl_int result = getInfo(name, ¶m); |
|
if (err != NULL) { |
|
*err = result; |
|
} |
|
return param; |
|
} |
|
|
|
#if defined(CL_VERSION_1_1) |
|
/*! \brief Registers a callback function to be called when the memory object |
|
* is no longer needed. |
|
* |
|
* Wraps clSetMemObjectDestructorCallback(). |
|
* |
|
* Repeated calls to this function, for a given cl_mem value, will append |
|
* to the list of functions called (in reverse order) when memory object's |
|
* resources are freed and the memory object is deleted. |
|
* |
|
* \note |
|
* The registered callbacks are associated with the underlying cl_mem |
|
* value - not the Memory class instance. |
|
*/ |
|
cl_int setDestructorCallback( |
|
void (CL_CALLBACK * pfn_notify)(cl_mem, void *), |
|
void * user_data = NULL) |
|
{ |
|
return detail::errHandler( |
|
::clSetMemObjectDestructorCallback( |
|
object_, |
|
pfn_notify, |
|
user_data), |
|
__SET_MEM_OBJECT_DESTRUCTOR_CALLBACK_ERR); |
|
} |
|
#endif |
|
|
|
}; |
|
|
|
// Pre-declare copy functions |
|
class Buffer; |
|
template< typename IteratorType > |
|
cl_int copy( IteratorType startIterator, IteratorType endIterator, cl::Buffer &buffer ); |
|
template< typename IteratorType > |
|
cl_int copy( const cl::Buffer &buffer, IteratorType startIterator, IteratorType endIterator ); |
|
|
|
/*! \brief Class interface for Buffer Memory Objects. |
|
* |
|
* See Memory for details about copy semantics, etc. |
|
* |
|
* \see Memory |
|
*/ |
|
class Buffer : public Memory |
|
{ |
|
public: |
|
|
|
/*! \brief Constructs a Buffer in a specified context. |
|
* |
|
* Wraps clCreateBuffer(). |
|
* |
|
* \param host_ptr Storage to be used if the CL_MEM_USE_HOST_PTR flag was |
|
* specified. Note alignment & exclusivity requirements. |
|
*/ |
|
Buffer( |
|
const Context& context, |
|
cl_mem_flags flags, |
|
::size_t size, |
|
void* host_ptr = NULL, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
object_ = ::clCreateBuffer(context(), flags, size, host_ptr, &error); |
|
|
|
detail::errHandler(error, __CREATE_BUFFER_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
/*! \brief Constructs a Buffer in the default context. |
|
* |
|
* Wraps clCreateBuffer(). |
|
* |
|
* \param host_ptr Storage to be used if the CL_MEM_USE_HOST_PTR flag was |
|
* specified. Note alignment & exclusivity requirements. |
|
* |
|
* \see Context::getDefault() |
|
*/ |
|
Buffer( |
|
cl_mem_flags flags, |
|
::size_t size, |
|
void* host_ptr = NULL, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
|
|
Context context = Context::getDefault(err); |
|
|
|
object_ = ::clCreateBuffer(context(), flags, size, host_ptr, &error); |
|
|
|
detail::errHandler(error, __CREATE_BUFFER_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
/*! |
|
* \brief Construct a Buffer from a host container via iterators. |
|
* If useHostPtr is specified iterators must be random access. |
|
*/ |
|
template< typename IteratorType > |
|
Buffer( |
|
IteratorType startIterator, |
|
IteratorType endIterator, |
|
bool readOnly, |
|
bool useHostPtr = false, |
|
cl_int* err = NULL) |
|
{ |
|
typedef typename std::iterator_traits<IteratorType>::value_type DataType; |
|
cl_int error; |
|
|
|
cl_mem_flags flags = 0; |
|
if( readOnly ) { |
|
flags |= CL_MEM_READ_ONLY; |
|
} |
|
else { |
|
flags |= CL_MEM_READ_WRITE; |
|
} |
|
if( useHostPtr ) { |
|
flags |= CL_MEM_USE_HOST_PTR; |
|
} |
|
|
|
::size_t size = sizeof(DataType)*(endIterator - startIterator); |
|
|
|
Context context = Context::getDefault(err); |
|
|
|
if( useHostPtr ) { |
|
object_ = ::clCreateBuffer(context(), flags, size, static_cast<DataType*>(&*startIterator), &error); |
|
} else { |
|
object_ = ::clCreateBuffer(context(), flags, size, 0, &error); |
|
} |
|
|
|
detail::errHandler(error, __CREATE_BUFFER_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
|
|
if( !useHostPtr ) { |
|
error = cl::copy(startIterator, endIterator, *this); |
|
detail::errHandler(error, __CREATE_BUFFER_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
} |
|
|
|
//! \brief Default constructor - initializes to NULL. |
|
Buffer() : Memory() { } |
|
|
|
/*! \brief Copy constructor - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Buffer(const Buffer& buffer) : Memory(buffer) { } |
|
|
|
/*! \brief Constructor from cl_mem - takes ownership. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
__CL_EXPLICIT_CONSTRUCTORS Buffer(const cl_mem& buffer) : Memory(buffer) { } |
|
|
|
/*! \brief Assignment from Buffer - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Buffer& operator = (const Buffer& rhs) |
|
{ |
|
if (this != &rhs) { |
|
Memory::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment from cl_mem - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Buffer& operator = (const cl_mem& rhs) |
|
{ |
|
Memory::operator=(rhs); |
|
return *this; |
|
} |
|
|
|
#if defined(CL_VERSION_1_1) |
|
/*! \brief Creates a new buffer object from this. |
|
* |
|
* Wraps clCreateSubBuffer(). |
|
*/ |
|
Buffer createSubBuffer( |
|
cl_mem_flags flags, |
|
cl_buffer_create_type buffer_create_type, |
|
const void * buffer_create_info, |
|
cl_int * err = NULL) |
|
{ |
|
Buffer result; |
|
cl_int error; |
|
result.object_ = ::clCreateSubBuffer( |
|
object_, |
|
flags, |
|
buffer_create_type, |
|
buffer_create_info, |
|
&error); |
|
|
|
detail::errHandler(error, __CREATE_SUBBUFFER_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
|
|
return result; |
|
} |
|
#endif |
|
}; |
|
|
|
#if defined (USE_DX_INTEROP) |
|
/*! \brief Class interface for creating OpenCL buffers from ID3D10Buffer's. |
|
* |
|
* This is provided to facilitate interoperability with Direct3D. |
|
* |
|
* See Memory for details about copy semantics, etc. |
|
* |
|
* \see Memory |
|
*/ |
|
class BufferD3D10 : public Buffer |
|
{ |
|
public: |
|
typedef CL_API_ENTRY cl_mem (CL_API_CALL *PFN_clCreateFromD3D10BufferKHR)( |
|
cl_context context, cl_mem_flags flags, ID3D10Buffer* buffer, |
|
cl_int* errcode_ret); |
|
|
|
/*! \brief Constructs a BufferD3D10, in a specified context, from a |
|
* given ID3D10Buffer. |
|
* |
|
* Wraps clCreateFromD3D10BufferKHR(). |
|
*/ |
|
BufferD3D10( |
|
const Context& context, |
|
cl_mem_flags flags, |
|
ID3D10Buffer* bufobj, |
|
cl_int * err = NULL) |
|
{ |
|
static PFN_clCreateFromD3D10BufferKHR pfn_clCreateFromD3D10BufferKHR = NULL; |
|
|
|
#if defined(CL_VERSION_1_2) |
|
vector<cl_context_properties> props = context.getInfo<CL_CONTEXT_PROPERTIES>(); |
|
cl_platform platform = -1; |
|
for( int i = 0; i < props.size(); ++i ) { |
|
if( props[i] == CL_CONTEXT_PLATFORM ) { |
|
platform = props[i+1]; |
|
} |
|
} |
|
__INIT_CL_EXT_FCN_PTR_PLATFORM(platform, clCreateFromD3D10BufferKHR); |
|
#endif |
|
#if defined(CL_VERSION_1_1) |
|
__INIT_CL_EXT_FCN_PTR(clCreateFromD3D10BufferKHR); |
|
#endif |
|
|
|
cl_int error; |
|
object_ = pfn_clCreateFromD3D10BufferKHR( |
|
context(), |
|
flags, |
|
bufobj, |
|
&error); |
|
|
|
detail::errHandler(error, __CREATE_GL_BUFFER_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
//! \brief Default constructor - initializes to NULL. |
|
BufferD3D10() : Buffer() { } |
|
|
|
/*! \brief Copy constructor - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
BufferD3D10(const BufferD3D10& buffer) : Buffer(buffer) { } |
|
|
|
/*! \brief Constructor from cl_mem - takes ownership. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
__CL_EXPLICIT_CONSTRUCTORS BufferD3D10(const cl_mem& buffer) : Buffer(buffer) { } |
|
|
|
/*! \brief Assignment from BufferD3D10 - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
BufferD3D10& operator = (const BufferD3D10& rhs) |
|
{ |
|
if (this != &rhs) { |
|
Buffer::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment from cl_mem - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
BufferD3D10& operator = (const cl_mem& rhs) |
|
{ |
|
Buffer::operator=(rhs); |
|
return *this; |
|
} |
|
}; |
|
#endif |
|
|
|
/*! \brief Class interface for GL Buffer Memory Objects. |
|
* |
|
* This is provided to facilitate interoperability with OpenGL. |
|
* |
|
* See Memory for details about copy semantics, etc. |
|
* |
|
* \see Memory |
|
*/ |
|
class BufferGL : public Buffer |
|
{ |
|
public: |
|
/*! \brief Constructs a BufferGL in a specified context, from a given |
|
* GL buffer. |
|
* |
|
* Wraps clCreateFromGLBuffer(). |
|
*/ |
|
BufferGL( |
|
const Context& context, |
|
cl_mem_flags flags, |
|
GLuint bufobj, |
|
cl_int * err = NULL) |
|
{ |
|
cl_int error; |
|
object_ = ::clCreateFromGLBuffer( |
|
context(), |
|
flags, |
|
bufobj, |
|
&error); |
|
|
|
detail::errHandler(error, __CREATE_GL_BUFFER_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
//! \brief Default constructor - initializes to NULL. |
|
BufferGL() : Buffer() { } |
|
|
|
/*! \brief Copy constructor - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
BufferGL(const BufferGL& buffer) : Buffer(buffer) { } |
|
|
|
/*! \brief Constructor from cl_mem - takes ownership. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
__CL_EXPLICIT_CONSTRUCTORS BufferGL(const cl_mem& buffer) : Buffer(buffer) { } |
|
|
|
/*! \brief Assignment from BufferGL - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
BufferGL& operator = (const BufferGL& rhs) |
|
{ |
|
if (this != &rhs) { |
|
Buffer::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment from cl_mem - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
BufferGL& operator = (const cl_mem& rhs) |
|
{ |
|
Buffer::operator=(rhs); |
|
return *this; |
|
} |
|
|
|
//! \brief Wrapper for clGetGLObjectInfo(). |
|
cl_int getObjectInfo( |
|
cl_gl_object_type *type, |
|
GLuint * gl_object_name) |
|
{ |
|
return detail::errHandler( |
|
::clGetGLObjectInfo(object_,type,gl_object_name), |
|
__GET_GL_OBJECT_INFO_ERR); |
|
} |
|
}; |
|
|
|
/*! \brief Class interface for GL Render Buffer Memory Objects. |
|
* |
|
* This is provided to facilitate interoperability with OpenGL. |
|
* |
|
* See Memory for details about copy semantics, etc. |
|
* |
|
* \see Memory |
|
*/ |
|
class BufferRenderGL : public Buffer |
|
{ |
|
public: |
|
/*! \brief Constructs a BufferRenderGL in a specified context, from a given |
|
* GL Renderbuffer. |
|
* |
|
* Wraps clCreateFromGLRenderbuffer(). |
|
*/ |
|
BufferRenderGL( |
|
const Context& context, |
|
cl_mem_flags flags, |
|
GLuint bufobj, |
|
cl_int * err = NULL) |
|
{ |
|
cl_int error; |
|
object_ = ::clCreateFromGLRenderbuffer( |
|
context(), |
|
flags, |
|
bufobj, |
|
&error); |
|
|
|
detail::errHandler(error, __CREATE_GL_RENDER_BUFFER_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
//! \brief Default constructor - initializes to NULL. |
|
BufferRenderGL() : Buffer() { } |
|
|
|
/*! \brief Copy constructor - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
BufferRenderGL(const BufferGL& buffer) : Buffer(buffer) { } |
|
|
|
/*! \brief Constructor from cl_mem - takes ownership. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
__CL_EXPLICIT_CONSTRUCTORS BufferRenderGL(const cl_mem& buffer) : Buffer(buffer) { } |
|
|
|
/*! \brief Assignment from BufferGL - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
BufferRenderGL& operator = (const BufferRenderGL& rhs) |
|
{ |
|
if (this != &rhs) { |
|
Buffer::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment from cl_mem - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
BufferRenderGL& operator = (const cl_mem& rhs) |
|
{ |
|
Buffer::operator=(rhs); |
|
return *this; |
|
} |
|
|
|
//! \brief Wrapper for clGetGLObjectInfo(). |
|
cl_int getObjectInfo( |
|
cl_gl_object_type *type, |
|
GLuint * gl_object_name) |
|
{ |
|
return detail::errHandler( |
|
::clGetGLObjectInfo(object_,type,gl_object_name), |
|
__GET_GL_OBJECT_INFO_ERR); |
|
} |
|
}; |
|
|
|
/*! \brief C++ base class for Image Memory objects. |
|
* |
|
* See Memory for details about copy semantics, etc. |
|
* |
|
* \see Memory |
|
*/ |
|
class Image : public Memory |
|
{ |
|
protected: |
|
//! \brief Default constructor - initializes to NULL. |
|
Image() : Memory() { } |
|
|
|
/*! \brief Copy constructor - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image(const Image& image) : Memory(image) { } |
|
|
|
/*! \brief Constructor from cl_mem - takes ownership. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
__CL_EXPLICIT_CONSTRUCTORS Image(const cl_mem& image) : Memory(image) { } |
|
|
|
/*! \brief Assignment from Image - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image& operator = (const Image& rhs) |
|
{ |
|
if (this != &rhs) { |
|
Memory::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment from cl_mem - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image& operator = (const cl_mem& rhs) |
|
{ |
|
Memory::operator=(rhs); |
|
return *this; |
|
} |
|
|
|
public: |
|
//! \brief Wrapper for clGetImageInfo(). |
|
template <typename T> |
|
cl_int getImageInfo(cl_image_info name, T* param) const |
|
{ |
|
return detail::errHandler( |
|
detail::getInfo(&::clGetImageInfo, object_, name, param), |
|
__GET_IMAGE_INFO_ERR); |
|
} |
|
|
|
//! \brief Wrapper for clGetImageInfo() that returns by value. |
|
template <cl_int name> typename |
|
detail::param_traits<detail::cl_image_info, name>::param_type |
|
getImageInfo(cl_int* err = NULL) const |
|
{ |
|
typename detail::param_traits< |
|
detail::cl_image_info, name>::param_type param; |
|
cl_int result = getImageInfo(name, ¶m); |
|
if (err != NULL) { |
|
*err = result; |
|
} |
|
return param; |
|
} |
|
}; |
|
|
|
#if defined(CL_VERSION_1_2) |
|
/*! \brief Class interface for 1D Image Memory objects. |
|
* |
|
* See Memory for details about copy semantics, etc. |
|
* |
|
* \see Memory |
|
*/ |
|
class Image1D : public Image |
|
{ |
|
public: |
|
/*! \brief Constructs a 1D Image in a specified context. |
|
* |
|
* Wraps clCreateImage(). |
|
*/ |
|
Image1D( |
|
const Context& context, |
|
cl_mem_flags flags, |
|
ImageFormat format, |
|
::size_t width, |
|
void* host_ptr = NULL, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
cl_image_desc desc; |
|
desc.image_type = CL_MEM_OBJECT_IMAGE1D; |
|
desc.image_width = width; |
|
desc.image_row_pitch = 0; |
|
desc.num_mip_levels = 0; |
|
desc.num_samples = 0; |
|
desc.buffer = 0; |
|
object_ = ::clCreateImage( |
|
context(), |
|
flags, |
|
&format, |
|
&desc, |
|
host_ptr, |
|
&error); |
|
|
|
detail::errHandler(error, __CREATE_IMAGE_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
//! \brief Default constructor - initializes to NULL. |
|
Image1D() { } |
|
|
|
/*! \brief Copy constructor - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image1D(const Image1D& image1D) : Image(image1D) { } |
|
|
|
/*! \brief Constructor from cl_mem - takes ownership. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
__CL_EXPLICIT_CONSTRUCTORS Image1D(const cl_mem& image1D) : Image(image1D) { } |
|
|
|
/*! \brief Assignment from Image1D - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image1D& operator = (const Image1D& rhs) |
|
{ |
|
if (this != &rhs) { |
|
Image::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment from cl_mem - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image1D& operator = (const cl_mem& rhs) |
|
{ |
|
Image::operator=(rhs); |
|
return *this; |
|
} |
|
}; |
|
|
|
/*! \class Image1DBuffer |
|
* \brief Image interface for 1D buffer images. |
|
*/ |
|
class Image1DBuffer : public Image |
|
{ |
|
public: |
|
Image1DBuffer( |
|
const Context& context, |
|
cl_mem_flags flags, |
|
ImageFormat format, |
|
::size_t width, |
|
const Buffer &buffer, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
cl_image_desc desc; |
|
desc.image_type = CL_MEM_OBJECT_IMAGE1D_BUFFER; |
|
desc.image_width = width; |
|
desc.image_row_pitch = 0; |
|
desc.num_mip_levels = 0; |
|
desc.num_samples = 0; |
|
desc.buffer = buffer(); |
|
object_ = ::clCreateImage( |
|
context(), |
|
flags, |
|
&format, |
|
&desc, |
|
NULL, |
|
&error); |
|
|
|
detail::errHandler(error, __CREATE_IMAGE_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
Image1DBuffer() { } |
|
|
|
Image1DBuffer(const Image1DBuffer& image1D) : Image(image1D) { } |
|
|
|
__CL_EXPLICIT_CONSTRUCTORS Image1DBuffer(const cl_mem& image1D) : Image(image1D) { } |
|
|
|
Image1DBuffer& operator = (const Image1DBuffer& rhs) |
|
{ |
|
if (this != &rhs) { |
|
Image::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
Image1DBuffer& operator = (const cl_mem& rhs) |
|
{ |
|
Image::operator=(rhs); |
|
return *this; |
|
} |
|
}; |
|
|
|
/*! \class Image1DArray |
|
* \brief Image interface for arrays of 1D images. |
|
*/ |
|
class Image1DArray : public Image |
|
{ |
|
public: |
|
Image1DArray( |
|
const Context& context, |
|
cl_mem_flags flags, |
|
ImageFormat format, |
|
::size_t arraySize, |
|
::size_t width, |
|
::size_t rowPitch, |
|
void* host_ptr = NULL, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
cl_image_desc desc; |
|
desc.image_type = CL_MEM_OBJECT_IMAGE1D_ARRAY; |
|
desc.image_array_size = arraySize; |
|
desc.image_width = width; |
|
desc.image_row_pitch = rowPitch; |
|
desc.num_mip_levels = 0; |
|
desc.num_samples = 0; |
|
desc.buffer = 0; |
|
object_ = ::clCreateImage( |
|
context(), |
|
flags, |
|
&format, |
|
&desc, |
|
host_ptr, |
|
&error); |
|
|
|
detail::errHandler(error, __CREATE_IMAGE_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
Image1DArray() { } |
|
|
|
Image1DArray(const Image1DArray& imageArray) : Image(imageArray) { } |
|
|
|
__CL_EXPLICIT_CONSTRUCTORS Image1DArray(const cl_mem& imageArray) : Image(imageArray) { } |
|
|
|
Image1DArray& operator = (const Image1DArray& rhs) |
|
{ |
|
if (this != &rhs) { |
|
Image::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
Image1DArray& operator = (const cl_mem& rhs) |
|
{ |
|
Image::operator=(rhs); |
|
return *this; |
|
} |
|
}; |
|
#endif // #if defined(CL_VERSION_1_2) |
|
|
|
|
|
/*! \brief Class interface for 2D Image Memory objects. |
|
* |
|
* See Memory for details about copy semantics, etc. |
|
* |
|
* \see Memory |
|
*/ |
|
class Image2D : public Image |
|
{ |
|
public: |
|
/*! \brief Constructs a 1D Image in a specified context. |
|
* |
|
* Wraps clCreateImage(). |
|
*/ |
|
Image2D( |
|
const Context& context, |
|
cl_mem_flags flags, |
|
ImageFormat format, |
|
::size_t width, |
|
::size_t height, |
|
::size_t row_pitch = 0, |
|
void* host_ptr = NULL, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
bool useCreateImage; |
|
|
|
#if defined(CL_VERSION_1_2) && defined(CL_USE_DEPRECATED_OPENCL_1_1_APIS) |
|
// Run-time decision based on the actual platform |
|
{ |
|
cl_uint version = detail::getContextPlatformVersion(context()); |
|
useCreateImage = (version >= 0x10002); // OpenCL 1.2 or above |
|
} |
|
#elif defined(CL_VERSION_1_2) |
|
useCreateImage = true; |
|
#else |
|
useCreateImage = false; |
|
#endif |
|
|
|
#if defined(CL_VERSION_1_2) |
|
if (useCreateImage) |
|
{ |
|
cl_image_desc desc; |
|
desc.image_type = CL_MEM_OBJECT_IMAGE2D; |
|
desc.image_width = width; |
|
desc.image_height = height; |
|
desc.image_row_pitch = row_pitch; |
|
desc.num_mip_levels = 0; |
|
desc.num_samples = 0; |
|
desc.buffer = 0; |
|
object_ = ::clCreateImage( |
|
context(), |
|
flags, |
|
&format, |
|
&desc, |
|
host_ptr, |
|
&error); |
|
|
|
detail::errHandler(error, __CREATE_IMAGE_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
#endif // #if defined(CL_VERSION_1_2) |
|
#if !defined(CL_VERSION_1_2) || defined(CL_USE_DEPRECATED_OPENCL_1_1_APIS) |
|
if (!useCreateImage) |
|
{ |
|
object_ = ::clCreateImage2D( |
|
context(), flags,&format, width, height, row_pitch, host_ptr, &error); |
|
|
|
detail::errHandler(error, __CREATE_IMAGE2D_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
#endif // #if !defined(CL_VERSION_1_2) || defined(CL_USE_DEPRECATED_OPENCL_1_1_APIS) |
|
} |
|
|
|
//! \brief Default constructor - initializes to NULL. |
|
Image2D() { } |
|
|
|
/*! \brief Copy constructor - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image2D(const Image2D& image2D) : Image(image2D) { } |
|
|
|
/*! \brief Constructor from cl_mem - takes ownership. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
__CL_EXPLICIT_CONSTRUCTORS Image2D(const cl_mem& image2D) : Image(image2D) { } |
|
|
|
/*! \brief Assignment from Image2D - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image2D& operator = (const Image2D& rhs) |
|
{ |
|
if (this != &rhs) { |
|
Image::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment from cl_mem - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image2D& operator = (const cl_mem& rhs) |
|
{ |
|
Image::operator=(rhs); |
|
return *this; |
|
} |
|
}; |
|
|
|
|
|
#if !defined(CL_VERSION_1_2) |
|
/*! \brief Class interface for GL 2D Image Memory objects. |
|
* |
|
* This is provided to facilitate interoperability with OpenGL. |
|
* |
|
* See Memory for details about copy semantics, etc. |
|
* |
|
* \see Memory |
|
* \note Deprecated for OpenCL 1.2. Please use ImageGL instead. |
|
*/ |
|
class CL_EXT_PREFIX__VERSION_1_1_DEPRECATED Image2DGL CL_EXT_SUFFIX__VERSION_1_1_DEPRECATED : public Image2D |
|
{ |
|
public: |
|
/*! \brief Constructs an Image2DGL in a specified context, from a given |
|
* GL Texture. |
|
* |
|
* Wraps clCreateFromGLTexture2D(). |
|
*/ |
|
Image2DGL( |
|
const Context& context, |
|
cl_mem_flags flags, |
|
GLenum target, |
|
GLint miplevel, |
|
GLuint texobj, |
|
cl_int * err = NULL) |
|
{ |
|
cl_int error; |
|
object_ = ::clCreateFromGLTexture2D( |
|
context(), |
|
flags, |
|
target, |
|
miplevel, |
|
texobj, |
|
&error); |
|
|
|
detail::errHandler(error, __CREATE_GL_TEXTURE_2D_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
|
|
} |
|
|
|
//! \brief Default constructor - initializes to NULL. |
|
Image2DGL() : Image2D() { } |
|
|
|
/*! \brief Copy constructor - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image2DGL(const Image2DGL& image) : Image2D(image) { } |
|
|
|
/*! \brief Constructor from cl_mem - takes ownership. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
__CL_EXPLICIT_CONSTRUCTORS Image2DGL(const cl_mem& image) : Image2D(image) { } |
|
|
|
/*! \brief Assignment from Image2DGL - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image2DGL& operator = (const Image2DGL& rhs) |
|
{ |
|
if (this != &rhs) { |
|
Image2D::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment from cl_mem - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image2DGL& operator = (const cl_mem& rhs) |
|
{ |
|
Image2D::operator=(rhs); |
|
return *this; |
|
} |
|
}; |
|
#endif // #if !defined(CL_VERSION_1_2) |
|
|
|
#if defined(CL_VERSION_1_2) |
|
/*! \class Image2DArray |
|
* \brief Image interface for arrays of 2D images. |
|
*/ |
|
class Image2DArray : public Image |
|
{ |
|
public: |
|
Image2DArray( |
|
const Context& context, |
|
cl_mem_flags flags, |
|
ImageFormat format, |
|
::size_t arraySize, |
|
::size_t width, |
|
::size_t height, |
|
::size_t rowPitch, |
|
::size_t slicePitch, |
|
void* host_ptr = NULL, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
cl_image_desc desc; |
|
desc.image_type = CL_MEM_OBJECT_IMAGE2D_ARRAY; |
|
desc.image_array_size = arraySize; |
|
desc.image_width = width; |
|
desc.image_height = height; |
|
desc.image_row_pitch = rowPitch; |
|
desc.image_slice_pitch = slicePitch; |
|
desc.num_mip_levels = 0; |
|
desc.num_samples = 0; |
|
desc.buffer = 0; |
|
object_ = ::clCreateImage( |
|
context(), |
|
flags, |
|
&format, |
|
&desc, |
|
host_ptr, |
|
&error); |
|
|
|
detail::errHandler(error, __CREATE_IMAGE_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
Image2DArray() { } |
|
|
|
Image2DArray(const Image2DArray& imageArray) : Image(imageArray) { } |
|
|
|
__CL_EXPLICIT_CONSTRUCTORS Image2DArray(const cl_mem& imageArray) : Image(imageArray) { } |
|
|
|
Image2DArray& operator = (const Image2DArray& rhs) |
|
{ |
|
if (this != &rhs) { |
|
Image::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
Image2DArray& operator = (const cl_mem& rhs) |
|
{ |
|
Image::operator=(rhs); |
|
return *this; |
|
} |
|
}; |
|
#endif // #if defined(CL_VERSION_1_2) |
|
|
|
/*! \brief Class interface for 3D Image Memory objects. |
|
* |
|
* See Memory for details about copy semantics, etc. |
|
* |
|
* \see Memory |
|
*/ |
|
class Image3D : public Image |
|
{ |
|
public: |
|
/*! \brief Constructs a 3D Image in a specified context. |
|
* |
|
* Wraps clCreateImage(). |
|
*/ |
|
Image3D( |
|
const Context& context, |
|
cl_mem_flags flags, |
|
ImageFormat format, |
|
::size_t width, |
|
::size_t height, |
|
::size_t depth, |
|
::size_t row_pitch = 0, |
|
::size_t slice_pitch = 0, |
|
void* host_ptr = NULL, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
bool useCreateImage; |
|
|
|
#if defined(CL_VERSION_1_2) && defined(CL_USE_DEPRECATED_OPENCL_1_1_APIS) |
|
// Run-time decision based on the actual platform |
|
{ |
|
cl_uint version = detail::getContextPlatformVersion(context()); |
|
useCreateImage = (version >= 0x10002); // OpenCL 1.2 or above |
|
} |
|
#elif defined(CL_VERSION_1_2) |
|
useCreateImage = true; |
|
#else |
|
useCreateImage = false; |
|
#endif |
|
|
|
#if defined(CL_VERSION_1_2) |
|
if (useCreateImage) |
|
{ |
|
cl_image_desc desc; |
|
desc.image_type = CL_MEM_OBJECT_IMAGE3D; |
|
desc.image_width = width; |
|
desc.image_height = height; |
|
desc.image_depth = depth; |
|
desc.image_row_pitch = row_pitch; |
|
desc.image_slice_pitch = slice_pitch; |
|
desc.num_mip_levels = 0; |
|
desc.num_samples = 0; |
|
desc.buffer = 0; |
|
object_ = ::clCreateImage( |
|
context(), |
|
flags, |
|
&format, |
|
&desc, |
|
host_ptr, |
|
&error); |
|
|
|
detail::errHandler(error, __CREATE_IMAGE_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
#endif // #if defined(CL_VERSION_1_2) |
|
#if !defined(CL_VERSION_1_2) || defined(CL_USE_DEPRECATED_OPENCL_1_1_APIS) |
|
if (!useCreateImage) |
|
{ |
|
object_ = ::clCreateImage3D( |
|
context(), flags, &format, width, height, depth, row_pitch, |
|
slice_pitch, host_ptr, &error); |
|
|
|
detail::errHandler(error, __CREATE_IMAGE3D_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
#endif // #if !defined(CL_VERSION_1_2) || defined(CL_USE_DEPRECATED_OPENCL_1_1_APIS) |
|
} |
|
|
|
//! \brief Default constructor - initializes to NULL. |
|
Image3D() { } |
|
|
|
/*! \brief Copy constructor - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image3D(const Image3D& image3D) : Image(image3D) { } |
|
|
|
/*! \brief Constructor from cl_mem - takes ownership. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
__CL_EXPLICIT_CONSTRUCTORS Image3D(const cl_mem& image3D) : Image(image3D) { } |
|
|
|
/*! \brief Assignment from Image3D - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image3D& operator = (const Image3D& rhs) |
|
{ |
|
if (this != &rhs) { |
|
Image::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment from cl_mem - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image3D& operator = (const cl_mem& rhs) |
|
{ |
|
Image::operator=(rhs); |
|
return *this; |
|
} |
|
}; |
|
|
|
#if !defined(CL_VERSION_1_2) |
|
/*! \brief Class interface for GL 3D Image Memory objects. |
|
* |
|
* This is provided to facilitate interoperability with OpenGL. |
|
* |
|
* See Memory for details about copy semantics, etc. |
|
* |
|
* \see Memory |
|
*/ |
|
class Image3DGL : public Image3D |
|
{ |
|
public: |
|
/*! \brief Constructs an Image3DGL in a specified context, from a given |
|
* GL Texture. |
|
* |
|
* Wraps clCreateFromGLTexture3D(). |
|
*/ |
|
Image3DGL( |
|
const Context& context, |
|
cl_mem_flags flags, |
|
GLenum target, |
|
GLint miplevel, |
|
GLuint texobj, |
|
cl_int * err = NULL) |
|
{ |
|
cl_int error; |
|
object_ = ::clCreateFromGLTexture3D( |
|
context(), |
|
flags, |
|
target, |
|
miplevel, |
|
texobj, |
|
&error); |
|
|
|
detail::errHandler(error, __CREATE_GL_TEXTURE_3D_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
//! \brief Default constructor - initializes to NULL. |
|
Image3DGL() : Image3D() { } |
|
|
|
/*! \brief Copy constructor - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image3DGL(const Image3DGL& image) : Image3D(image) { } |
|
|
|
/*! \brief Constructor from cl_mem - takes ownership. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
__CL_EXPLICIT_CONSTRUCTORS Image3DGL(const cl_mem& image) : Image3D(image) { } |
|
|
|
/*! \brief Assignment from Image3DGL - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image3DGL& operator = (const Image3DGL& rhs) |
|
{ |
|
if (this != &rhs) { |
|
Image3D::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment from cl_mem - performs shallow copy. |
|
* |
|
* See Memory for further details. |
|
*/ |
|
Image3DGL& operator = (const cl_mem& rhs) |
|
{ |
|
Image3D::operator=(rhs); |
|
return *this; |
|
} |
|
}; |
|
#endif // #if !defined(CL_VERSION_1_2) |
|
|
|
#if defined(CL_VERSION_1_2) |
|
/*! \class ImageGL |
|
* \brief general image interface for GL interop. |
|
* We abstract the 2D and 3D GL images into a single instance here |
|
* that wraps all GL sourced images on the grounds that setup information |
|
* was performed by OpenCL anyway. |
|
*/ |
|
class ImageGL : public Image |
|
{ |
|
public: |
|
ImageGL( |
|
const Context& context, |
|
cl_mem_flags flags, |
|
GLenum target, |
|
GLint miplevel, |
|
GLuint texobj, |
|
cl_int * err = NULL) |
|
{ |
|
cl_int error; |
|
object_ = ::clCreateFromGLTexture( |
|
context(), |
|
flags, |
|
target, |
|
miplevel, |
|
texobj, |
|
&error); |
|
|
|
detail::errHandler(error, __CREATE_GL_TEXTURE_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
ImageGL() : Image() { } |
|
|
|
ImageGL(const ImageGL& image) : Image(image) { } |
|
|
|
__CL_EXPLICIT_CONSTRUCTORS ImageGL(const cl_mem& image) : Image(image) { } |
|
|
|
ImageGL& operator = (const ImageGL& rhs) |
|
{ |
|
if (this != &rhs) { |
|
Image::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
ImageGL& operator = (const cl_mem& rhs) |
|
{ |
|
Image::operator=(rhs); |
|
return *this; |
|
} |
|
}; |
|
#endif // #if defined(CL_VERSION_1_2) |
|
|
|
/*! \brief Class interface for cl_sampler. |
|
* |
|
* \note Copies of these objects are shallow, meaning that the copy will refer |
|
* to the same underlying cl_sampler as the original. For details, see |
|
* clRetainSampler() and clReleaseSampler(). |
|
* |
|
* \see cl_sampler |
|
*/ |
|
class Sampler : public detail::Wrapper<cl_sampler> |
|
{ |
|
public: |
|
/*! \brief Destructor. |
|
* |
|
* This calls clReleaseSampler() on the value held by this instance. |
|
*/ |
|
~Sampler() { } |
|
|
|
//! \brief Default constructor - initializes to NULL. |
|
Sampler() { } |
|
|
|
/*! \brief Constructs a Sampler in a specified context. |
|
* |
|
* Wraps clCreateSampler(). |
|
*/ |
|
Sampler( |
|
const Context& context, |
|
cl_bool normalized_coords, |
|
cl_addressing_mode addressing_mode, |
|
cl_filter_mode filter_mode, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
object_ = ::clCreateSampler( |
|
context(), |
|
normalized_coords, |
|
addressing_mode, |
|
filter_mode, |
|
&error); |
|
|
|
detail::errHandler(error, __CREATE_SAMPLER_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
/*! \brief Copy constructor - performs shallow copy. |
|
* |
|
* This calls clRetainSampler() on the parameter's cl_sampler. |
|
*/ |
|
Sampler(const Sampler& sampler) : detail::Wrapper<cl_type>(sampler) { } |
|
|
|
/*! \brief Constructor from cl_sampler - takes ownership. |
|
* |
|
* This effectively transfers ownership of a refcount on the cl_sampler |
|
* into the new Sampler object. |
|
*/ |
|
Sampler(const cl_sampler& sampler) : detail::Wrapper<cl_type>(sampler) { } |
|
|
|
/*! \brief Assignment operator from Sampler. |
|
* |
|
* This calls clRetainSampler() on the parameter and clReleaseSampler() |
|
* on the previous value held by this instance. |
|
*/ |
|
Sampler& operator = (const Sampler& rhs) |
|
{ |
|
if (this != &rhs) { |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment operator from cl_sampler - takes ownership. |
|
* |
|
* This effectively transfers ownership of a refcount on the rhs and calls |
|
* clReleaseSampler() on the value previously held by this instance. |
|
*/ |
|
Sampler& operator = (const cl_sampler& rhs) |
|
{ |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
return *this; |
|
} |
|
|
|
//! \brief Wrapper for clGetSamplerInfo(). |
|
template <typename T> |
|
cl_int getInfo(cl_sampler_info name, T* param) const |
|
{ |
|
return detail::errHandler( |
|
detail::getInfo(&::clGetSamplerInfo, object_, name, param), |
|
__GET_SAMPLER_INFO_ERR); |
|
} |
|
|
|
//! \brief Wrapper for clGetSamplerInfo() that returns by value. |
|
template <cl_int name> typename |
|
detail::param_traits<detail::cl_sampler_info, name>::param_type |
|
getInfo(cl_int* err = NULL) const |
|
{ |
|
typename detail::param_traits< |
|
detail::cl_sampler_info, name>::param_type param; |
|
cl_int result = getInfo(name, ¶m); |
|
if (err != NULL) { |
|
*err = result; |
|
} |
|
return param; |
|
} |
|
}; |
|
|
|
class Program; |
|
class CommandQueue; |
|
class Kernel; |
|
|
|
//! \brief Class interface for specifying NDRange values. |
|
class NDRange |
|
{ |
|
private: |
|
size_t<3> sizes_; |
|
cl_uint dimensions_; |
|
|
|
public: |
|
//! \brief Default constructor - resulting range has zero dimensions. |
|
NDRange() |
|
: dimensions_(0) |
|
{ } |
|
|
|
//! \brief Constructs one-dimensional range. |
|
NDRange(::size_t size0) |
|
: dimensions_(1) |
|
{ |
|
sizes_[0] = size0; |
|
} |
|
|
|
//! \brief Constructs two-dimensional range. |
|
NDRange(::size_t size0, ::size_t size1) |
|
: dimensions_(2) |
|
{ |
|
sizes_[0] = size0; |
|
sizes_[1] = size1; |
|
} |
|
|
|
//! \brief Constructs three-dimensional range. |
|
NDRange(::size_t size0, ::size_t size1, ::size_t size2) |
|
: dimensions_(3) |
|
{ |
|
sizes_[0] = size0; |
|
sizes_[1] = size1; |
|
sizes_[2] = size2; |
|
} |
|
|
|
/*! \brief Conversion operator to const ::size_t *. |
|
* |
|
* \returns a pointer to the size of the first dimension. |
|
*/ |
|
operator const ::size_t*() const { |
|
return (const ::size_t*) sizes_; |
|
} |
|
|
|
//! \brief Queries the number of dimensions in the range. |
|
::size_t dimensions() const { return dimensions_; } |
|
}; |
|
|
|
//! \brief A zero-dimensional range. |
|
static const NDRange NullRange; |
|
|
|
//! \brief Local address wrapper for use with Kernel::setArg |
|
struct LocalSpaceArg |
|
{ |
|
::size_t size_; |
|
}; |
|
|
|
namespace detail { |
|
|
|
template <typename T> |
|
struct KernelArgumentHandler |
|
{ |
|
static ::size_t size(const T&) { return sizeof(T); } |
|
static T* ptr(T& value) { return &value; } |
|
}; |
|
|
|
template <> |
|
struct KernelArgumentHandler<LocalSpaceArg> |
|
{ |
|
static ::size_t size(const LocalSpaceArg& value) { return value.size_; } |
|
static void* ptr(LocalSpaceArg&) { return NULL; } |
|
}; |
|
|
|
} |
|
//! \endcond |
|
|
|
/*! __local |
|
* \brief Helper function for generating LocalSpaceArg objects. |
|
* Deprecated. Replaced with Local. |
|
*/ |
|
inline CL_EXT_PREFIX__VERSION_1_1_DEPRECATED LocalSpaceArg |
|
__local(::size_t size) CL_EXT_SUFFIX__VERSION_1_1_DEPRECATED; |
|
inline LocalSpaceArg |
|
__local(::size_t size) |
|
{ |
|
LocalSpaceArg ret = { size }; |
|
return ret; |
|
} |
|
|
|
/*! Local |
|
* \brief Helper function for generating LocalSpaceArg objects. |
|
*/ |
|
inline LocalSpaceArg |
|
Local(::size_t size) |
|
{ |
|
LocalSpaceArg ret = { size }; |
|
return ret; |
|
} |
|
|
|
//class KernelFunctor; |
|
|
|
/*! \brief Class interface for cl_kernel. |
|
* |
|
* \note Copies of these objects are shallow, meaning that the copy will refer |
|
* to the same underlying cl_kernel as the original. For details, see |
|
* clRetainKernel() and clReleaseKernel(). |
|
* |
|
* \see cl_kernel |
|
*/ |
|
class Kernel : public detail::Wrapper<cl_kernel> |
|
{ |
|
public: |
|
inline Kernel(const Program& program, const char* name, cl_int* err = NULL); |
|
|
|
/*! \brief Destructor. |
|
* |
|
* This calls clReleaseKernel() on the value held by this instance. |
|
*/ |
|
~Kernel() { } |
|
|
|
//! \brief Default constructor - initializes to NULL. |
|
Kernel() { } |
|
|
|
/*! \brief Copy constructor - performs shallow copy. |
|
* |
|
* This calls clRetainKernel() on the parameter's cl_kernel. |
|
*/ |
|
Kernel(const Kernel& kernel) : detail::Wrapper<cl_type>(kernel) { } |
|
|
|
/*! \brief Constructor from cl_kernel - takes ownership. |
|
* |
|
* This effectively transfers ownership of a refcount on the cl_kernel |
|
* into the new Kernel object. |
|
*/ |
|
__CL_EXPLICIT_CONSTRUCTORS Kernel(const cl_kernel& kernel) : detail::Wrapper<cl_type>(kernel) { } |
|
|
|
/*! \brief Assignment operator from Kernel. |
|
* |
|
* This calls clRetainKernel() on the parameter and clReleaseKernel() |
|
* on the previous value held by this instance. |
|
*/ |
|
Kernel& operator = (const Kernel& rhs) |
|
{ |
|
if (this != &rhs) { |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
/*! \brief Assignment operator from cl_kernel - takes ownership. |
|
* |
|
* This effectively transfers ownership of a refcount on the rhs and calls |
|
* clReleaseKernel() on the value previously held by this instance. |
|
*/ |
|
Kernel& operator = (const cl_kernel& rhs) |
|
{ |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
return *this; |
|
} |
|
|
|
template <typename T> |
|
cl_int getInfo(cl_kernel_info name, T* param) const |
|
{ |
|
return detail::errHandler( |
|
detail::getInfo(&::clGetKernelInfo, object_, name, param), |
|
__GET_KERNEL_INFO_ERR); |
|
} |
|
|
|
template <cl_int name> typename |
|
detail::param_traits<detail::cl_kernel_info, name>::param_type |
|
getInfo(cl_int* err = NULL) const |
|
{ |
|
typename detail::param_traits< |
|
detail::cl_kernel_info, name>::param_type param; |
|
cl_int result = getInfo(name, ¶m); |
|
if (err != NULL) { |
|
*err = result; |
|
} |
|
return param; |
|
} |
|
|
|
#if defined(CL_VERSION_1_2) |
|
template <typename T> |
|
cl_int getArgInfo(cl_uint argIndex, cl_kernel_arg_info name, T* param) const |
|
{ |
|
return detail::errHandler( |
|
detail::getInfo(&::clGetKernelArgInfo, object_, argIndex, name, param), |
|
__GET_KERNEL_ARG_INFO_ERR); |
|
} |
|
|
|
template <cl_int name> typename |
|
detail::param_traits<detail::cl_kernel_arg_info, name>::param_type |
|
getArgInfo(cl_uint argIndex, cl_int* err = NULL) const |
|
{ |
|
typename detail::param_traits< |
|
detail::cl_kernel_arg_info, name>::param_type param; |
|
cl_int result = getArgInfo(argIndex, name, ¶m); |
|
if (err != NULL) { |
|
*err = result; |
|
} |
|
return param; |
|
} |
|
#endif // #if defined(CL_VERSION_1_2) |
|
|
|
template <typename T> |
|
cl_int getWorkGroupInfo( |
|
const Device& device, cl_kernel_work_group_info name, T* param) const |
|
{ |
|
return detail::errHandler( |
|
detail::getInfo( |
|
&::clGetKernelWorkGroupInfo, object_, device(), name, param), |
|
__GET_KERNEL_WORK_GROUP_INFO_ERR); |
|
} |
|
|
|
template <cl_int name> typename |
|
detail::param_traits<detail::cl_kernel_work_group_info, name>::param_type |
|
getWorkGroupInfo(const Device& device, cl_int* err = NULL) const |
|
{ |
|
typename detail::param_traits< |
|
detail::cl_kernel_work_group_info, name>::param_type param; |
|
cl_int result = getWorkGroupInfo(device, name, ¶m); |
|
if (err != NULL) { |
|
*err = result; |
|
} |
|
return param; |
|
} |
|
|
|
template <typename T> |
|
cl_int setArg(cl_uint index, T value) |
|
{ |
|
return detail::errHandler( |
|
::clSetKernelArg( |
|
object_, |
|
index, |
|
detail::KernelArgumentHandler<T>::size(value), |
|
detail::KernelArgumentHandler<T>::ptr(value)), |
|
__SET_KERNEL_ARGS_ERR); |
|
} |
|
|
|
cl_int setArg(cl_uint index, ::size_t size, void* argPtr) |
|
{ |
|
return detail::errHandler( |
|
::clSetKernelArg(object_, index, size, argPtr), |
|
__SET_KERNEL_ARGS_ERR); |
|
} |
|
}; |
|
|
|
/*! \class Program |
|
* \brief Program interface that implements cl_program. |
|
*/ |
|
class Program : public detail::Wrapper<cl_program> |
|
{ |
|
public: |
|
typedef VECTOR_CLASS<std::pair<const void*, ::size_t> > Binaries; |
|
typedef VECTOR_CLASS<std::pair<const char*, ::size_t> > Sources; |
|
|
|
Program( |
|
const STRING_CLASS& source, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
|
|
const char * strings = source.c_str(); |
|
const ::size_t length = source.size(); |
|
|
|
Context context = Context::getDefault(err); |
|
|
|
object_ = ::clCreateProgramWithSource( |
|
context(), (cl_uint)1, &strings, &length, &error); |
|
|
|
detail::errHandler(error, __CREATE_PROGRAM_WITH_SOURCE_ERR); |
|
|
|
if (error == CL_SUCCESS) { |
|
|
|
error = ::clBuildProgram( |
|
object_, |
|
0, |
|
NULL, |
|
"", |
|
NULL, |
|
NULL); |
|
|
|
detail::errHandler(error, __BUILD_PROGRAM_ERR); |
|
} |
|
|
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
Program( |
|
const STRING_CLASS& source, |
|
bool build, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
|
|
const char * strings = source.c_str(); |
|
const ::size_t length = source.size(); |
|
|
|
Context context = Context::getDefault(err); |
|
|
|
object_ = ::clCreateProgramWithSource( |
|
context(), (cl_uint)1, &strings, &length, &error); |
|
|
|
detail::errHandler(error, __CREATE_PROGRAM_WITH_SOURCE_ERR); |
|
|
|
if (error == CL_SUCCESS && build) { |
|
|
|
error = ::clBuildProgram( |
|
object_, |
|
0, |
|
NULL, |
|
"", |
|
NULL, |
|
NULL); |
|
|
|
detail::errHandler(error, __BUILD_PROGRAM_ERR); |
|
} |
|
|
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
Program( |
|
const Context& context, |
|
const STRING_CLASS& source, |
|
bool build = false, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
|
|
const char * strings = source.c_str(); |
|
const ::size_t length = source.size(); |
|
|
|
object_ = ::clCreateProgramWithSource( |
|
context(), (cl_uint)1, &strings, &length, &error); |
|
|
|
detail::errHandler(error, __CREATE_PROGRAM_WITH_SOURCE_ERR); |
|
|
|
if (error == CL_SUCCESS && build) { |
|
|
|
error = ::clBuildProgram( |
|
object_, |
|
0, |
|
NULL, |
|
"", |
|
NULL, |
|
NULL); |
|
|
|
detail::errHandler(error, __BUILD_PROGRAM_ERR); |
|
} |
|
|
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
Program( |
|
const Context& context, |
|
const Sources& sources, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
|
|
const ::size_t n = (::size_t)sources.size(); |
|
::size_t* lengths = (::size_t*) alloca(n * sizeof(::size_t)); |
|
const char** strings = (const char**) alloca(n * sizeof(const char*)); |
|
|
|
for (::size_t i = 0; i < n; ++i) { |
|
strings[i] = sources[(int)i].first; |
|
lengths[i] = sources[(int)i].second; |
|
} |
|
|
|
object_ = ::clCreateProgramWithSource( |
|
context(), (cl_uint)n, strings, lengths, &error); |
|
|
|
detail::errHandler(error, __CREATE_PROGRAM_WITH_SOURCE_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
/** |
|
* Construct a program object from a list of devices and a per-device list of binaries. |
|
* \param context A valid OpenCL context in which to construct the program. |
|
* \param devices A vector of OpenCL device objects for which the program will be created. |
|
* \param binaries A vector of pairs of a pointer to a binary object and its length. |
|
* \param binaryStatus An optional vector that on completion will be resized to |
|
* match the size of binaries and filled with values to specify if each binary |
|
* was successfully loaded. |
|
* Set to CL_SUCCESS if the binary was successfully loaded. |
|
* Set to CL_INVALID_VALUE if the length is 0 or the binary pointer is NULL. |
|
* Set to CL_INVALID_BINARY if the binary provided is not valid for the matching device. |
|
* \param err if non-NULL will be set to CL_SUCCESS on successful operation or one of the following errors: |
|
* CL_INVALID_CONTEXT if context is not a valid context. |
|
* CL_INVALID_VALUE if the length of devices is zero; or if the length of binaries does not match the length of devices; |
|
* or if any entry in binaries is NULL or has length 0. |
|
* CL_INVALID_DEVICE if OpenCL devices listed in devices are not in the list of devices associated with context. |
|
* CL_INVALID_BINARY if an invalid program binary was encountered for any device. binaryStatus will return specific status for each device. |
|
* CL_OUT_OF_HOST_MEMORY if there is a failure to allocate resources required by the OpenCL implementation on the host. |
|
*/ |
|
Program( |
|
const Context& context, |
|
const VECTOR_CLASS<Device>& devices, |
|
const Binaries& binaries, |
|
VECTOR_CLASS<cl_int>* binaryStatus = NULL, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
|
|
const ::size_t numDevices = devices.size(); |
|
|
|
// Catch size mismatch early and return |
|
if(binaries.size() != numDevices) { |
|
error = CL_INVALID_VALUE; |
|
detail::errHandler(error, __CREATE_PROGRAM_WITH_BINARY_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
return; |
|
} |
|
|
|
::size_t* lengths = (::size_t*) alloca(numDevices * sizeof(::size_t)); |
|
const unsigned char** images = (const unsigned char**) alloca(numDevices * sizeof(const unsigned char**)); |
|
|
|
for (::size_t i = 0; i < numDevices; ++i) { |
|
images[i] = (const unsigned char*)binaries[i].first; |
|
lengths[i] = binaries[(int)i].second; |
|
} |
|
|
|
cl_device_id* deviceIDs = (cl_device_id*) alloca(numDevices * sizeof(cl_device_id)); |
|
for( ::size_t deviceIndex = 0; deviceIndex < numDevices; ++deviceIndex ) { |
|
deviceIDs[deviceIndex] = (devices[deviceIndex])(); |
|
} |
|
|
|
if(binaryStatus) { |
|
binaryStatus->resize(numDevices); |
|
} |
|
|
|
object_ = ::clCreateProgramWithBinary( |
|
context(), (cl_uint) devices.size(), |
|
deviceIDs, |
|
lengths, images, binaryStatus != NULL |
|
? &binaryStatus->front() |
|
: NULL, &error); |
|
|
|
detail::errHandler(error, __CREATE_PROGRAM_WITH_BINARY_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
|
|
#if defined(CL_VERSION_1_2) |
|
/** |
|
* Create program using builtin kernels. |
|
* \param kernelNames Semi-colon separated list of builtin kernel names |
|
*/ |
|
Program( |
|
const Context& context, |
|
const VECTOR_CLASS<Device>& devices, |
|
const STRING_CLASS& kernelNames, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
|
|
|
|
::size_t numDevices = devices.size(); |
|
cl_device_id* deviceIDs = (cl_device_id*) alloca(numDevices * sizeof(cl_device_id)); |
|
for( ::size_t deviceIndex = 0; deviceIndex < numDevices; ++deviceIndex ) { |
|
deviceIDs[deviceIndex] = (devices[deviceIndex])(); |
|
} |
|
|
|
object_ = ::clCreateProgramWithBuiltInKernels( |
|
context(), |
|
(cl_uint) devices.size(), |
|
deviceIDs, |
|
kernelNames.c_str(), |
|
&error); |
|
|
|
detail::errHandler(error, __CREATE_PROGRAM_WITH_BUILT_IN_KERNELS_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
#endif // #if defined(CL_VERSION_1_2) |
|
|
|
Program() { } |
|
|
|
Program(const Program& program) : detail::Wrapper<cl_type>(program) { } |
|
|
|
__CL_EXPLICIT_CONSTRUCTORS Program(const cl_program& program) : detail::Wrapper<cl_type>(program) { } |
|
|
|
Program& operator = (const Program& rhs) |
|
{ |
|
if (this != &rhs) { |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
Program& operator = (const cl_program& rhs) |
|
{ |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
return *this; |
|
} |
|
|
|
cl_int build( |
|
const VECTOR_CLASS<Device>& devices, |
|
const char* options = NULL, |
|
void (CL_CALLBACK * notifyFptr)(cl_program, void *) = NULL, |
|
void* data = NULL) const |
|
{ |
|
::size_t numDevices = devices.size(); |
|
cl_device_id* deviceIDs = (cl_device_id*) alloca(numDevices * sizeof(cl_device_id)); |
|
for( ::size_t deviceIndex = 0; deviceIndex < numDevices; ++deviceIndex ) { |
|
deviceIDs[deviceIndex] = (devices[deviceIndex])(); |
|
} |
|
|
|
return detail::errHandler( |
|
::clBuildProgram( |
|
object_, |
|
(cl_uint) |
|
devices.size(), |
|
deviceIDs, |
|
options, |
|
notifyFptr, |
|
data), |
|
__BUILD_PROGRAM_ERR); |
|
} |
|
|
|
cl_int build( |
|
const char* options = NULL, |
|
void (CL_CALLBACK * notifyFptr)(cl_program, void *) = NULL, |
|
void* data = NULL) const |
|
{ |
|
return detail::errHandler( |
|
::clBuildProgram( |
|
object_, |
|
0, |
|
NULL, |
|
options, |
|
notifyFptr, |
|
data), |
|
__BUILD_PROGRAM_ERR); |
|
} |
|
|
|
#if defined(CL_VERSION_1_2) |
|
cl_int compile( |
|
const char* options = NULL, |
|
void (CL_CALLBACK * notifyFptr)(cl_program, void *) = NULL, |
|
void* data = NULL) const |
|
{ |
|
return detail::errHandler( |
|
::clCompileProgram( |
|
object_, |
|
0, |
|
NULL, |
|
options, |
|
0, |
|
NULL, |
|
NULL, |
|
notifyFptr, |
|
data), |
|
__COMPILE_PROGRAM_ERR); |
|
} |
|
#endif |
|
|
|
template <typename T> |
|
cl_int getInfo(cl_program_info name, T* param) const |
|
{ |
|
return detail::errHandler( |
|
detail::getInfo(&::clGetProgramInfo, object_, name, param), |
|
__GET_PROGRAM_INFO_ERR); |
|
} |
|
|
|
template <cl_int name> typename |
|
detail::param_traits<detail::cl_program_info, name>::param_type |
|
getInfo(cl_int* err = NULL) const |
|
{ |
|
typename detail::param_traits< |
|
detail::cl_program_info, name>::param_type param; |
|
cl_int result = getInfo(name, ¶m); |
|
if (err != NULL) { |
|
*err = result; |
|
} |
|
return param; |
|
} |
|
|
|
template <typename T> |
|
cl_int getBuildInfo( |
|
const Device& device, cl_program_build_info name, T* param) const |
|
{ |
|
return detail::errHandler( |
|
detail::getInfo( |
|
&::clGetProgramBuildInfo, object_, device(), name, param), |
|
__GET_PROGRAM_BUILD_INFO_ERR); |
|
} |
|
|
|
template <cl_int name> typename |
|
detail::param_traits<detail::cl_program_build_info, name>::param_type |
|
getBuildInfo(const Device& device, cl_int* err = NULL) const |
|
{ |
|
typename detail::param_traits< |
|
detail::cl_program_build_info, name>::param_type param; |
|
cl_int result = getBuildInfo(device, name, ¶m); |
|
if (err != NULL) { |
|
*err = result; |
|
} |
|
return param; |
|
} |
|
|
|
cl_int createKernels(VECTOR_CLASS<Kernel>* kernels) |
|
{ |
|
cl_uint numKernels; |
|
cl_int err = ::clCreateKernelsInProgram(object_, 0, NULL, &numKernels); |
|
if (err != CL_SUCCESS) { |
|
return detail::errHandler(err, __CREATE_KERNELS_IN_PROGRAM_ERR); |
|
} |
|
|
|
Kernel* value = (Kernel*) alloca(numKernels * sizeof(Kernel)); |
|
err = ::clCreateKernelsInProgram( |
|
object_, numKernels, (cl_kernel*) value, NULL); |
|
if (err != CL_SUCCESS) { |
|
return detail::errHandler(err, __CREATE_KERNELS_IN_PROGRAM_ERR); |
|
} |
|
|
|
kernels->assign(&value[0], &value[numKernels]); |
|
return CL_SUCCESS; |
|
} |
|
}; |
|
|
|
#if defined(CL_VERSION_1_2) |
|
inline Program linkProgram( |
|
Program input1, |
|
Program input2, |
|
const char* options = NULL, |
|
void (CL_CALLBACK * notifyFptr)(cl_program, void *) = NULL, |
|
void* data = NULL, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int err_local = CL_SUCCESS; |
|
|
|
cl_program programs[2] = { input1(), input2() }; |
|
|
|
Context ctx = input1.getInfo<CL_PROGRAM_CONTEXT>(); |
|
|
|
cl_program prog = ::clLinkProgram( |
|
ctx(), |
|
0, |
|
NULL, |
|
options, |
|
2, |
|
programs, |
|
notifyFptr, |
|
data, |
|
&err_local); |
|
|
|
detail::errHandler(err_local,__COMPILE_PROGRAM_ERR); |
|
if (err != NULL) { |
|
*err = err_local; |
|
} |
|
|
|
return Program(prog); |
|
} |
|
|
|
inline Program linkProgram( |
|
VECTOR_CLASS<Program> inputPrograms, |
|
const char* options = NULL, |
|
void (CL_CALLBACK * notifyFptr)(cl_program, void *) = NULL, |
|
void* data = NULL, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int err_local = CL_SUCCESS; |
|
|
|
cl_program * programs = (cl_program*) alloca(inputPrograms.size() * sizeof(cl_program)); |
|
|
|
if (programs != NULL) { |
|
for (unsigned int i = 0; i < inputPrograms.size(); i++) { |
|
programs[i] = inputPrograms[i](); |
|
} |
|
} |
|
|
|
cl_program prog = ::clLinkProgram( |
|
Context::getDefault()(), |
|
0, |
|
NULL, |
|
options, |
|
(cl_uint)inputPrograms.size(), |
|
programs, |
|
notifyFptr, |
|
data, |
|
&err_local); |
|
|
|
detail::errHandler(err_local,__COMPILE_PROGRAM_ERR); |
|
if (err != NULL) { |
|
*err = err_local; |
|
} |
|
|
|
return Program(prog); |
|
} |
|
#endif |
|
|
|
template<> |
|
inline VECTOR_CLASS<char *> cl::Program::getInfo<CL_PROGRAM_BINARIES>(cl_int* err) const |
|
{ |
|
VECTOR_CLASS< ::size_t> sizes = getInfo<CL_PROGRAM_BINARY_SIZES>(); |
|
VECTOR_CLASS<char *> binaries; |
|
for (VECTOR_CLASS< ::size_t>::iterator s = sizes.begin(); s != sizes.end(); ++s) |
|
{ |
|
char *ptr = NULL; |
|
if (*s != 0) |
|
ptr = new char[*s]; |
|
binaries.push_back(ptr); |
|
} |
|
|
|
cl_int result = getInfo(CL_PROGRAM_BINARIES, &binaries); |
|
if (err != NULL) { |
|
*err = result; |
|
} |
|
return binaries; |
|
} |
|
|
|
inline Kernel::Kernel(const Program& program, const char* name, cl_int* err) |
|
{ |
|
cl_int error; |
|
|
|
object_ = ::clCreateKernel(program(), name, &error); |
|
detail::errHandler(error, __CREATE_KERNEL_ERR); |
|
|
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
|
|
} |
|
|
|
/*! \class CommandQueue |
|
* \brief CommandQueue interface for cl_command_queue. |
|
*/ |
|
class CommandQueue : public detail::Wrapper<cl_command_queue> |
|
{ |
|
private: |
|
static volatile int default_initialized_; |
|
static CommandQueue default_; |
|
static volatile cl_int default_error_; |
|
public: |
|
CommandQueue( |
|
cl_command_queue_properties properties, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
|
|
Context context = Context::getDefault(&error); |
|
detail::errHandler(error, __CREATE_COMMAND_QUEUE_ERR); |
|
|
|
if (error != CL_SUCCESS) { |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
else { |
|
Device device = context.getInfo<CL_CONTEXT_DEVICES>()[0]; |
|
|
|
object_ = ::clCreateCommandQueue( |
|
context(), device(), properties, &error); |
|
|
|
detail::errHandler(error, __CREATE_COMMAND_QUEUE_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
} |
|
|
|
CommandQueue( |
|
const Context& context, |
|
const Device& device, |
|
cl_command_queue_properties properties = 0, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
object_ = ::clCreateCommandQueue( |
|
context(), device(), properties, &error); |
|
|
|
detail::errHandler(error, __CREATE_COMMAND_QUEUE_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
static CommandQueue getDefault(cl_int * err = NULL) |
|
{ |
|
int state = detail::compare_exchange( |
|
&default_initialized_, |
|
__DEFAULT_BEING_INITIALIZED, __DEFAULT_NOT_INITIALIZED); |
|
|
|
if (state & __DEFAULT_INITIALIZED) { |
|
if (err != NULL) { |
|
*err = default_error_; |
|
} |
|
return default_; |
|
} |
|
|
|
if (state & __DEFAULT_BEING_INITIALIZED) { |
|
// Assume writes will propagate eventually... |
|
while(default_initialized_ != __DEFAULT_INITIALIZED) { |
|
detail::fence(); |
|
} |
|
|
|
if (err != NULL) { |
|
*err = default_error_; |
|
} |
|
return default_; |
|
} |
|
|
|
cl_int error; |
|
|
|
Context context = Context::getDefault(&error); |
|
detail::errHandler(error, __CREATE_COMMAND_QUEUE_ERR); |
|
|
|
if (error != CL_SUCCESS) { |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
else { |
|
Device device = context.getInfo<CL_CONTEXT_DEVICES>()[0]; |
|
|
|
default_ = CommandQueue(context, device, 0, &error); |
|
|
|
detail::errHandler(error, __CREATE_COMMAND_QUEUE_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
} |
|
|
|
detail::fence(); |
|
|
|
default_error_ = error; |
|
// Assume writes will propagate eventually... |
|
default_initialized_ = __DEFAULT_INITIALIZED; |
|
|
|
detail::fence(); |
|
|
|
if (err != NULL) { |
|
*err = default_error_; |
|
} |
|
return default_; |
|
|
|
} |
|
|
|
CommandQueue() { } |
|
|
|
CommandQueue(const CommandQueue& commandQueue) : detail::Wrapper<cl_type>(commandQueue) { } |
|
|
|
CommandQueue(const cl_command_queue& commandQueue) : detail::Wrapper<cl_type>(commandQueue) { } |
|
|
|
CommandQueue& operator = (const CommandQueue& rhs) |
|
{ |
|
if (this != &rhs) { |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
} |
|
return *this; |
|
} |
|
|
|
CommandQueue& operator = (const cl_command_queue& rhs) |
|
{ |
|
detail::Wrapper<cl_type>::operator=(rhs); |
|
return *this; |
|
} |
|
|
|
template <typename T> |
|
cl_int getInfo(cl_command_queue_info name, T* param) const |
|
{ |
|
return detail::errHandler( |
|
detail::getInfo( |
|
&::clGetCommandQueueInfo, object_, name, param), |
|
__GET_COMMAND_QUEUE_INFO_ERR); |
|
} |
|
|
|
template <cl_int name> typename |
|
detail::param_traits<detail::cl_command_queue_info, name>::param_type |
|
getInfo(cl_int* err = NULL) const |
|
{ |
|
typename detail::param_traits< |
|
detail::cl_command_queue_info, name>::param_type param; |
|
cl_int result = getInfo(name, ¶m); |
|
if (err != NULL) { |
|
*err = result; |
|
} |
|
return param; |
|
} |
|
|
|
cl_int enqueueReadBuffer( |
|
const Buffer& buffer, |
|
cl_bool blocking, |
|
::size_t offset, |
|
::size_t size, |
|
void* ptr, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueReadBuffer( |
|
object_, buffer(), blocking, offset, size, |
|
ptr, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_READ_BUFFER_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
cl_int enqueueWriteBuffer( |
|
const Buffer& buffer, |
|
cl_bool blocking, |
|
::size_t offset, |
|
::size_t size, |
|
const void* ptr, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueWriteBuffer( |
|
object_, buffer(), blocking, offset, size, |
|
ptr, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_WRITE_BUFFER_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
cl_int enqueueCopyBuffer( |
|
const Buffer& src, |
|
const Buffer& dst, |
|
::size_t src_offset, |
|
::size_t dst_offset, |
|
::size_t size, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueCopyBuffer( |
|
object_, src(), dst(), src_offset, dst_offset, size, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQEUE_COPY_BUFFER_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
cl_int enqueueReadBufferRect( |
|
const Buffer& buffer, |
|
cl_bool blocking, |
|
const size_t<3>& buffer_offset, |
|
const size_t<3>& host_offset, |
|
const size_t<3>& region, |
|
::size_t buffer_row_pitch, |
|
::size_t buffer_slice_pitch, |
|
::size_t host_row_pitch, |
|
::size_t host_slice_pitch, |
|
void *ptr, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueReadBufferRect( |
|
object_, |
|
buffer(), |
|
blocking, |
|
(const ::size_t *)buffer_offset, |
|
(const ::size_t *)host_offset, |
|
(const ::size_t *)region, |
|
buffer_row_pitch, |
|
buffer_slice_pitch, |
|
host_row_pitch, |
|
host_slice_pitch, |
|
ptr, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_READ_BUFFER_RECT_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
cl_int enqueueWriteBufferRect( |
|
const Buffer& buffer, |
|
cl_bool blocking, |
|
const size_t<3>& buffer_offset, |
|
const size_t<3>& host_offset, |
|
const size_t<3>& region, |
|
::size_t buffer_row_pitch, |
|
::size_t buffer_slice_pitch, |
|
::size_t host_row_pitch, |
|
::size_t host_slice_pitch, |
|
void *ptr, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueWriteBufferRect( |
|
object_, |
|
buffer(), |
|
blocking, |
|
(const ::size_t *)buffer_offset, |
|
(const ::size_t *)host_offset, |
|
(const ::size_t *)region, |
|
buffer_row_pitch, |
|
buffer_slice_pitch, |
|
host_row_pitch, |
|
host_slice_pitch, |
|
ptr, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_WRITE_BUFFER_RECT_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
cl_int enqueueCopyBufferRect( |
|
const Buffer& src, |
|
const Buffer& dst, |
|
const size_t<3>& src_origin, |
|
const size_t<3>& dst_origin, |
|
const size_t<3>& region, |
|
::size_t src_row_pitch, |
|
::size_t src_slice_pitch, |
|
::size_t dst_row_pitch, |
|
::size_t dst_slice_pitch, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueCopyBufferRect( |
|
object_, |
|
src(), |
|
dst(), |
|
(const ::size_t *)src_origin, |
|
(const ::size_t *)dst_origin, |
|
(const ::size_t *)region, |
|
src_row_pitch, |
|
src_slice_pitch, |
|
dst_row_pitch, |
|
dst_slice_pitch, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQEUE_COPY_BUFFER_RECT_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
#if defined(CL_VERSION_1_2) |
|
/** |
|
* Enqueue a command to fill a buffer object with a pattern |
|
* of a given size. The pattern is specified a as vector. |
|
* \tparam PatternType The datatype of the pattern field. |
|
* The pattern type must be an accepted OpenCL data type. |
|
*/ |
|
template<typename PatternType> |
|
cl_int enqueueFillBuffer( |
|
const Buffer& buffer, |
|
PatternType pattern, |
|
::size_t offset, |
|
::size_t size, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueFillBuffer( |
|
object_, |
|
buffer(), |
|
static_cast<void*>(&pattern), |
|
sizeof(PatternType), |
|
offset, |
|
size, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_FILL_BUFFER_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
#endif // #if defined(CL_VERSION_1_2) |
|
|
|
cl_int enqueueReadImage( |
|
const Image& image, |
|
cl_bool blocking, |
|
const size_t<3>& origin, |
|
const size_t<3>& region, |
|
::size_t row_pitch, |
|
::size_t slice_pitch, |
|
void* ptr, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueReadImage( |
|
object_, image(), blocking, (const ::size_t *) origin, |
|
(const ::size_t *) region, row_pitch, slice_pitch, ptr, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_READ_IMAGE_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
cl_int enqueueWriteImage( |
|
const Image& image, |
|
cl_bool blocking, |
|
const size_t<3>& origin, |
|
const size_t<3>& region, |
|
::size_t row_pitch, |
|
::size_t slice_pitch, |
|
void* ptr, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueWriteImage( |
|
object_, image(), blocking, (const ::size_t *) origin, |
|
(const ::size_t *) region, row_pitch, slice_pitch, ptr, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_WRITE_IMAGE_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
cl_int enqueueCopyImage( |
|
const Image& src, |
|
const Image& dst, |
|
const size_t<3>& src_origin, |
|
const size_t<3>& dst_origin, |
|
const size_t<3>& region, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueCopyImage( |
|
object_, src(), dst(), (const ::size_t *) src_origin, |
|
(const ::size_t *)dst_origin, (const ::size_t *) region, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_COPY_IMAGE_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
#if defined(CL_VERSION_1_2) |
|
/** |
|
* Enqueue a command to fill an image object with a specified color. |
|
* \param fillColor is the color to use to fill the image. |
|
* This is a four component RGBA floating-point color value if |
|
* the image channel data type is not an unnormalized signed or |
|
* unsigned data type. |
|
*/ |
|
cl_int enqueueFillImage( |
|
const Image& image, |
|
cl_float4 fillColor, |
|
const size_t<3>& origin, |
|
const size_t<3>& region, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueFillImage( |
|
object_, |
|
image(), |
|
static_cast<void*>(&fillColor), |
|
(const ::size_t *) origin, |
|
(const ::size_t *) region, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_FILL_IMAGE_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
/** |
|
* Enqueue a command to fill an image object with a specified color. |
|
* \param fillColor is the color to use to fill the image. |
|
* This is a four component RGBA signed integer color value if |
|
* the image channel data type is an unnormalized signed integer |
|
* type. |
|
*/ |
|
cl_int enqueueFillImage( |
|
const Image& image, |
|
cl_int4 fillColor, |
|
const size_t<3>& origin, |
|
const size_t<3>& region, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueFillImage( |
|
object_, |
|
image(), |
|
static_cast<void*>(&fillColor), |
|
(const ::size_t *) origin, |
|
(const ::size_t *) region, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_FILL_IMAGE_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
/** |
|
* Enqueue a command to fill an image object with a specified color. |
|
* \param fillColor is the color to use to fill the image. |
|
* This is a four component RGBA unsigned integer color value if |
|
* the image channel data type is an unnormalized unsigned integer |
|
* type. |
|
*/ |
|
cl_int enqueueFillImage( |
|
const Image& image, |
|
cl_uint4 fillColor, |
|
const size_t<3>& origin, |
|
const size_t<3>& region, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueFillImage( |
|
object_, |
|
image(), |
|
static_cast<void*>(&fillColor), |
|
(const ::size_t *) origin, |
|
(const ::size_t *) region, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_FILL_IMAGE_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
#endif // #if defined(CL_VERSION_1_2) |
|
|
|
cl_int enqueueCopyImageToBuffer( |
|
const Image& src, |
|
const Buffer& dst, |
|
const size_t<3>& src_origin, |
|
const size_t<3>& region, |
|
::size_t dst_offset, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueCopyImageToBuffer( |
|
object_, src(), dst(), (const ::size_t *) src_origin, |
|
(const ::size_t *) region, dst_offset, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_COPY_IMAGE_TO_BUFFER_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
cl_int enqueueCopyBufferToImage( |
|
const Buffer& src, |
|
const Image& dst, |
|
::size_t src_offset, |
|
const size_t<3>& dst_origin, |
|
const size_t<3>& region, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueCopyBufferToImage( |
|
object_, src(), dst(), src_offset, |
|
(const ::size_t *) dst_origin, (const ::size_t *) region, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_COPY_BUFFER_TO_IMAGE_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
void* enqueueMapBuffer( |
|
const Buffer& buffer, |
|
cl_bool blocking, |
|
cl_map_flags flags, |
|
::size_t offset, |
|
::size_t size, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL, |
|
cl_int* err = NULL) const |
|
{ |
|
cl_int error; |
|
void * result = ::clEnqueueMapBuffer( |
|
object_, buffer(), blocking, flags, offset, size, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(cl_event*) event, |
|
&error); |
|
|
|
detail::errHandler(error, __ENQUEUE_MAP_BUFFER_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
return result; |
|
} |
|
|
|
void* enqueueMapImage( |
|
const Image& buffer, |
|
cl_bool blocking, |
|
cl_map_flags flags, |
|
const size_t<3>& origin, |
|
const size_t<3>& region, |
|
::size_t * row_pitch, |
|
::size_t * slice_pitch, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL, |
|
cl_int* err = NULL) const |
|
{ |
|
cl_int error; |
|
void * result = ::clEnqueueMapImage( |
|
object_, buffer(), blocking, flags, |
|
(const ::size_t *) origin, (const ::size_t *) region, |
|
row_pitch, slice_pitch, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(cl_event*) event, |
|
&error); |
|
|
|
detail::errHandler(error, __ENQUEUE_MAP_IMAGE_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
return result; |
|
} |
|
|
|
cl_int enqueueUnmapMemObject( |
|
const Memory& memory, |
|
void* mapped_ptr, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueUnmapMemObject( |
|
object_, memory(), mapped_ptr, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_UNMAP_MEM_OBJECT_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
#if defined(CL_VERSION_1_2) |
|
/** |
|
* Enqueues a marker command which waits for either a list of events to complete, |
|
* or all previously enqueued commands to complete. |
|
* |
|
* Enqueues a marker command which waits for either a list of events to complete, |
|
* or if the list is empty it waits for all commands previously enqueued in command_queue |
|
* to complete before it completes. This command returns an event which can be waited on, |
|
* i.e. this event can be waited on to insure that all events either in the event_wait_list |
|
* or all previously enqueued commands, queued before this command to command_queue, |
|
* have completed. |
|
*/ |
|
cl_int enqueueMarkerWithWaitList( |
|
const VECTOR_CLASS<Event> *events = 0, |
|
Event *event = 0) |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueMarkerWithWaitList( |
|
object_, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_MARKER_WAIT_LIST_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
/** |
|
* A synchronization point that enqueues a barrier operation. |
|
* |
|
* Enqueues a barrier command which waits for either a list of events to complete, |
|
* or if the list is empty it waits for all commands previously enqueued in command_queue |
|
* to complete before it completes. This command blocks command execution, that is, any |
|
* following commands enqueued after it do not execute until it completes. This command |
|
* returns an event which can be waited on, i.e. this event can be waited on to insure that |
|
* all events either in the event_wait_list or all previously enqueued commands, queued |
|
* before this command to command_queue, have completed. |
|
*/ |
|
cl_int enqueueBarrierWithWaitList( |
|
const VECTOR_CLASS<Event> *events = 0, |
|
Event *event = 0) |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueBarrierWithWaitList( |
|
object_, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_BARRIER_WAIT_LIST_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
/** |
|
* Enqueues a command to indicate with which device a set of memory objects |
|
* should be associated. |
|
*/ |
|
cl_int enqueueMigrateMemObjects( |
|
const VECTOR_CLASS<Memory> &memObjects, |
|
cl_mem_migration_flags flags, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL |
|
) |
|
{ |
|
cl_event tmp; |
|
|
|
cl_mem* localMemObjects = static_cast<cl_mem*>(alloca(memObjects.size() * sizeof(cl_mem))); |
|
for( int i = 0; i < (int)memObjects.size(); ++i ) { |
|
localMemObjects[i] = memObjects[i](); |
|
} |
|
|
|
|
|
cl_int err = detail::errHandler( |
|
::clEnqueueMigrateMemObjects( |
|
object_, |
|
(cl_uint)memObjects.size(), |
|
static_cast<const cl_mem*>(localMemObjects), |
|
flags, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_UNMAP_MEM_OBJECT_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
#endif // #if defined(CL_VERSION_1_2) |
|
|
|
cl_int enqueueNDRangeKernel( |
|
const Kernel& kernel, |
|
const NDRange& offset, |
|
const NDRange& global, |
|
const NDRange& local = NullRange, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueNDRangeKernel( |
|
object_, kernel(), (cl_uint) global.dimensions(), |
|
offset.dimensions() != 0 ? (const ::size_t*) offset : NULL, |
|
(const ::size_t*) global, |
|
local.dimensions() != 0 ? (const ::size_t*) local : NULL, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_NDRANGE_KERNEL_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
cl_int enqueueTask( |
|
const Kernel& kernel, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueTask( |
|
object_, kernel(), |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_TASK_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
cl_int enqueueNativeKernel( |
|
void (CL_CALLBACK *userFptr)(void *), |
|
std::pair<void*, ::size_t> args, |
|
const VECTOR_CLASS<Memory>* mem_objects = NULL, |
|
const VECTOR_CLASS<const void*>* mem_locs = NULL, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_mem * mems = (mem_objects != NULL && mem_objects->size() > 0) |
|
? (cl_mem*) alloca(mem_objects->size() * sizeof(cl_mem)) |
|
: NULL; |
|
|
|
if (mems != NULL) { |
|
for (unsigned int i = 0; i < mem_objects->size(); i++) { |
|
mems[i] = ((*mem_objects)[i])(); |
|
} |
|
} |
|
|
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueNativeKernel( |
|
object_, userFptr, args.first, args.second, |
|
(mem_objects != NULL) ? (cl_uint) mem_objects->size() : 0, |
|
mems, |
|
(mem_locs != NULL) ? (const void **) &mem_locs->front() : NULL, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_NATIVE_KERNEL); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
/** |
|
* Deprecated APIs for 1.2 |
|
*/ |
|
#if defined(CL_USE_DEPRECATED_OPENCL_1_1_APIS) || (defined(CL_VERSION_1_1) && !defined(CL_VERSION_1_2)) |
|
CL_EXT_PREFIX__VERSION_1_1_DEPRECATED |
|
cl_int enqueueMarker(Event* event = NULL) const CL_EXT_SUFFIX__VERSION_1_1_DEPRECATED |
|
{ |
|
return detail::errHandler( |
|
::clEnqueueMarker(object_, (cl_event*) event), |
|
__ENQUEUE_MARKER_ERR); |
|
} |
|
|
|
CL_EXT_PREFIX__VERSION_1_1_DEPRECATED |
|
cl_int enqueueWaitForEvents(const VECTOR_CLASS<Event>& events) const CL_EXT_SUFFIX__VERSION_1_1_DEPRECATED |
|
{ |
|
return detail::errHandler( |
|
::clEnqueueWaitForEvents( |
|
object_, |
|
(cl_uint) events.size(), |
|
(const cl_event*) &events.front()), |
|
__ENQUEUE_WAIT_FOR_EVENTS_ERR); |
|
} |
|
#endif // #if defined(CL_VERSION_1_1) |
|
|
|
cl_int enqueueAcquireGLObjects( |
|
const VECTOR_CLASS<Memory>* mem_objects = NULL, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueAcquireGLObjects( |
|
object_, |
|
(mem_objects != NULL) ? (cl_uint) mem_objects->size() : 0, |
|
(mem_objects != NULL) ? (const cl_mem *) &mem_objects->front(): NULL, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_ACQUIRE_GL_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
cl_int enqueueReleaseGLObjects( |
|
const VECTOR_CLASS<Memory>* mem_objects = NULL, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueReleaseGLObjects( |
|
object_, |
|
(mem_objects != NULL) ? (cl_uint) mem_objects->size() : 0, |
|
(mem_objects != NULL) ? (const cl_mem *) &mem_objects->front(): NULL, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_RELEASE_GL_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
#if defined (USE_DX_INTEROP) |
|
typedef CL_API_ENTRY cl_int (CL_API_CALL *PFN_clEnqueueAcquireD3D10ObjectsKHR)( |
|
cl_command_queue command_queue, cl_uint num_objects, |
|
const cl_mem* mem_objects, cl_uint num_events_in_wait_list, |
|
const cl_event* event_wait_list, cl_event* event); |
|
typedef CL_API_ENTRY cl_int (CL_API_CALL *PFN_clEnqueueReleaseD3D10ObjectsKHR)( |
|
cl_command_queue command_queue, cl_uint num_objects, |
|
const cl_mem* mem_objects, cl_uint num_events_in_wait_list, |
|
const cl_event* event_wait_list, cl_event* event); |
|
|
|
cl_int enqueueAcquireD3D10Objects( |
|
const VECTOR_CLASS<Memory>* mem_objects = NULL, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
static PFN_clEnqueueAcquireD3D10ObjectsKHR pfn_clEnqueueAcquireD3D10ObjectsKHR = NULL; |
|
#if defined(CL_VERSION_1_2) |
|
cl_context context = getInfo<CL_QUEUE_CONTEXT>(); |
|
cl::Device device(getInfo<CL_QUEUE_DEVICE>()); |
|
cl_platform_id platform = device.getInfo<CL_DEVICE_PLATFORM>(); |
|
__INIT_CL_EXT_FCN_PTR_PLATFORM(platform, clEnqueueAcquireD3D10ObjectsKHR); |
|
#endif |
|
#if defined(CL_VERSION_1_1) |
|
__INIT_CL_EXT_FCN_PTR(clEnqueueAcquireD3D10ObjectsKHR); |
|
#endif |
|
|
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
pfn_clEnqueueAcquireD3D10ObjectsKHR( |
|
object_, |
|
(mem_objects != NULL) ? (cl_uint) mem_objects->size() : 0, |
|
(mem_objects != NULL) ? (const cl_mem *) &mem_objects->front(): NULL, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_ACQUIRE_GL_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
cl_int enqueueReleaseD3D10Objects( |
|
const VECTOR_CLASS<Memory>* mem_objects = NULL, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) const |
|
{ |
|
static PFN_clEnqueueReleaseD3D10ObjectsKHR pfn_clEnqueueReleaseD3D10ObjectsKHR = NULL; |
|
#if defined(CL_VERSION_1_2) |
|
cl_context context = getInfo<CL_QUEUE_CONTEXT>(); |
|
cl::Device device(getInfo<CL_QUEUE_DEVICE>()); |
|
cl_platform_id platform = device.getInfo<CL_DEVICE_PLATFORM>(); |
|
__INIT_CL_EXT_FCN_PTR_PLATFORM(platform, clEnqueueReleaseD3D10ObjectsKHR); |
|
#endif // #if defined(CL_VERSION_1_2) |
|
#if defined(CL_VERSION_1_1) |
|
__INIT_CL_EXT_FCN_PTR(clEnqueueReleaseD3D10ObjectsKHR); |
|
#endif // #if defined(CL_VERSION_1_1) |
|
|
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
pfn_clEnqueueReleaseD3D10ObjectsKHR( |
|
object_, |
|
(mem_objects != NULL) ? (cl_uint) mem_objects->size() : 0, |
|
(mem_objects != NULL) ? (const cl_mem *) &mem_objects->front(): NULL, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_RELEASE_GL_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
#endif |
|
|
|
/** |
|
* Deprecated APIs for 1.2 |
|
*/ |
|
#if defined(CL_USE_DEPRECATED_OPENCL_1_1_APIS) || (defined(CL_VERSION_1_1) && !defined(CL_VERSION_1_2)) |
|
CL_EXT_PREFIX__VERSION_1_1_DEPRECATED |
|
cl_int enqueueBarrier() const CL_EXT_SUFFIX__VERSION_1_1_DEPRECATED |
|
{ |
|
return detail::errHandler( |
|
::clEnqueueBarrier(object_), |
|
__ENQUEUE_BARRIER_ERR); |
|
} |
|
#endif // #if defined(CL_VERSION_1_1) |
|
|
|
cl_int flush() const |
|
{ |
|
return detail::errHandler(::clFlush(object_), __FLUSH_ERR); |
|
} |
|
|
|
cl_int finish() const |
|
{ |
|
return detail::errHandler(::clFinish(object_), __FINISH_ERR); |
|
} |
|
}; |
|
|
|
#ifdef _WIN32 |
|
__declspec(selectany) volatile int CommandQueue::default_initialized_ = __DEFAULT_NOT_INITIALIZED; |
|
__declspec(selectany) CommandQueue CommandQueue::default_; |
|
__declspec(selectany) volatile cl_int CommandQueue::default_error_ = CL_SUCCESS; |
|
#else |
|
__attribute__((weak)) volatile int CommandQueue::default_initialized_ = __DEFAULT_NOT_INITIALIZED; |
|
__attribute__((weak)) CommandQueue CommandQueue::default_; |
|
__attribute__((weak)) volatile cl_int CommandQueue::default_error_ = CL_SUCCESS; |
|
#endif |
|
|
|
inline cl_int enqueueReadBuffer( |
|
const Buffer& buffer, |
|
cl_bool blocking, |
|
::size_t offset, |
|
::size_t size, |
|
void* ptr, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) |
|
{ |
|
cl_int error; |
|
CommandQueue queue = CommandQueue::getDefault(&error); |
|
|
|
if (error != CL_SUCCESS) { |
|
return error; |
|
} |
|
|
|
return queue.enqueueReadBuffer(buffer, blocking, offset, size, ptr, events, event); |
|
} |
|
|
|
inline cl_int enqueueWriteBuffer( |
|
const Buffer& buffer, |
|
cl_bool blocking, |
|
::size_t offset, |
|
::size_t size, |
|
const void* ptr, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) |
|
{ |
|
cl_int error; |
|
CommandQueue queue = CommandQueue::getDefault(&error); |
|
|
|
if (error != CL_SUCCESS) { |
|
return error; |
|
} |
|
|
|
return queue.enqueueWriteBuffer(buffer, blocking, offset, size, ptr, events, event); |
|
} |
|
|
|
inline void* enqueueMapBuffer( |
|
const Buffer& buffer, |
|
cl_bool blocking, |
|
cl_map_flags flags, |
|
::size_t offset, |
|
::size_t size, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL, |
|
cl_int* err = NULL) |
|
{ |
|
cl_int error; |
|
CommandQueue queue = CommandQueue::getDefault(&error); |
|
detail::errHandler(error, __ENQUEUE_MAP_BUFFER_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
|
|
void * result = ::clEnqueueMapBuffer( |
|
queue(), buffer(), blocking, flags, offset, size, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(cl_event*) event, |
|
&error); |
|
|
|
detail::errHandler(error, __ENQUEUE_MAP_BUFFER_ERR); |
|
if (err != NULL) { |
|
*err = error; |
|
} |
|
return result; |
|
} |
|
|
|
inline cl_int enqueueUnmapMemObject( |
|
const Memory& memory, |
|
void* mapped_ptr, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) |
|
{ |
|
cl_int error; |
|
CommandQueue queue = CommandQueue::getDefault(&error); |
|
detail::errHandler(error, __ENQUEUE_MAP_BUFFER_ERR); |
|
if (error != CL_SUCCESS) { |
|
return error; |
|
} |
|
|
|
cl_event tmp; |
|
cl_int err = detail::errHandler( |
|
::clEnqueueUnmapMemObject( |
|
queue(), memory(), mapped_ptr, |
|
(events != NULL) ? (cl_uint) events->size() : 0, |
|
(events != NULL && events->size() > 0) ? (cl_event*) &events->front() : NULL, |
|
(event != NULL) ? &tmp : NULL), |
|
__ENQUEUE_UNMAP_MEM_OBJECT_ERR); |
|
|
|
if (event != NULL && err == CL_SUCCESS) |
|
*event = tmp; |
|
|
|
return err; |
|
} |
|
|
|
inline cl_int enqueueCopyBuffer( |
|
const Buffer& src, |
|
const Buffer& dst, |
|
::size_t src_offset, |
|
::size_t dst_offset, |
|
::size_t size, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) |
|
{ |
|
cl_int error; |
|
CommandQueue queue = CommandQueue::getDefault(&error); |
|
|
|
if (error != CL_SUCCESS) { |
|
return error; |
|
} |
|
|
|
return queue.enqueueCopyBuffer(src, dst, src_offset, dst_offset, size, events, event); |
|
} |
|
|
|
/** |
|
* Blocking copy operation between iterators and a buffer. |
|
*/ |
|
template< typename IteratorType > |
|
inline cl_int copy( IteratorType startIterator, IteratorType endIterator, cl::Buffer &buffer ) |
|
{ |
|
typedef typename std::iterator_traits<IteratorType>::value_type DataType; |
|
cl_int error; |
|
|
|
::size_t length = endIterator-startIterator; |
|
::size_t byteLength = length*sizeof(DataType); |
|
|
|
DataType *pointer = |
|
static_cast<DataType*>(enqueueMapBuffer(buffer, CL_TRUE, CL_MAP_WRITE, 0, byteLength, 0, 0, &error)); |
|
// if exceptions enabled, enqueueMapBuffer will throw |
|
if( error != CL_SUCCESS ) { |
|
return error; |
|
} |
|
#if defined(_MSC_VER) |
|
std::copy( |
|
startIterator, |
|
endIterator, |
|
stdext::checked_array_iterator<DataType*>( |
|
pointer, length)); |
|
#else |
|
std::copy(startIterator, endIterator, pointer); |
|
#endif |
|
Event endEvent; |
|
error = enqueueUnmapMemObject(buffer, pointer, 0, &endEvent); |
|
// if exceptions enabled, enqueueUnmapMemObject will throw |
|
if( error != CL_SUCCESS ) { |
|
return error; |
|
} |
|
endEvent.wait(); |
|
return CL_SUCCESS; |
|
} |
|
|
|
/** |
|
* Blocking copy operation between iterators and a buffer. |
|
*/ |
|
template< typename IteratorType > |
|
inline cl_int copy( const cl::Buffer &buffer, IteratorType startIterator, IteratorType endIterator ) |
|
{ |
|
typedef typename std::iterator_traits<IteratorType>::value_type DataType; |
|
cl_int error; |
|
|
|
::size_t length = endIterator-startIterator; |
|
::size_t byteLength = length*sizeof(DataType); |
|
|
|
DataType *pointer = |
|
static_cast<DataType*>(enqueueMapBuffer(buffer, CL_TRUE, CL_MAP_READ, 0, byteLength, 0, 0, &error)); |
|
// if exceptions enabled, enqueueMapBuffer will throw |
|
if( error != CL_SUCCESS ) { |
|
return error; |
|
} |
|
std::copy(pointer, pointer + length, startIterator); |
|
Event endEvent; |
|
error = enqueueUnmapMemObject(buffer, pointer, 0, &endEvent); |
|
// if exceptions enabled, enqueueUnmapMemObject will throw |
|
if( error != CL_SUCCESS ) { |
|
return error; |
|
} |
|
endEvent.wait(); |
|
return CL_SUCCESS; |
|
} |
|
|
|
#if defined(CL_VERSION_1_1) |
|
inline cl_int enqueueReadBufferRect( |
|
const Buffer& buffer, |
|
cl_bool blocking, |
|
const size_t<3>& buffer_offset, |
|
const size_t<3>& host_offset, |
|
const size_t<3>& region, |
|
::size_t buffer_row_pitch, |
|
::size_t buffer_slice_pitch, |
|
::size_t host_row_pitch, |
|
::size_t host_slice_pitch, |
|
void *ptr, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) |
|
{ |
|
cl_int error; |
|
CommandQueue queue = CommandQueue::getDefault(&error); |
|
|
|
if (error != CL_SUCCESS) { |
|
return error; |
|
} |
|
|
|
return queue.enqueueReadBufferRect( |
|
buffer, |
|
blocking, |
|
buffer_offset, |
|
host_offset, |
|
region, |
|
buffer_row_pitch, |
|
buffer_slice_pitch, |
|
host_row_pitch, |
|
host_slice_pitch, |
|
ptr, |
|
events, |
|
event); |
|
} |
|
|
|
inline cl_int enqueueWriteBufferRect( |
|
const Buffer& buffer, |
|
cl_bool blocking, |
|
const size_t<3>& buffer_offset, |
|
const size_t<3>& host_offset, |
|
const size_t<3>& region, |
|
::size_t buffer_row_pitch, |
|
::size_t buffer_slice_pitch, |
|
::size_t host_row_pitch, |
|
::size_t host_slice_pitch, |
|
void *ptr, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) |
|
{ |
|
cl_int error; |
|
CommandQueue queue = CommandQueue::getDefault(&error); |
|
|
|
if (error != CL_SUCCESS) { |
|
return error; |
|
} |
|
|
|
return queue.enqueueWriteBufferRect( |
|
buffer, |
|
blocking, |
|
buffer_offset, |
|
host_offset, |
|
region, |
|
buffer_row_pitch, |
|
buffer_slice_pitch, |
|
host_row_pitch, |
|
host_slice_pitch, |
|
ptr, |
|
events, |
|
event); |
|
} |
|
|
|
inline cl_int enqueueCopyBufferRect( |
|
const Buffer& src, |
|
const Buffer& dst, |
|
const size_t<3>& src_origin, |
|
const size_t<3>& dst_origin, |
|
const size_t<3>& region, |
|
::size_t src_row_pitch, |
|
::size_t src_slice_pitch, |
|
::size_t dst_row_pitch, |
|
::size_t dst_slice_pitch, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) |
|
{ |
|
cl_int error; |
|
CommandQueue queue = CommandQueue::getDefault(&error); |
|
|
|
if (error != CL_SUCCESS) { |
|
return error; |
|
} |
|
|
|
return queue.enqueueCopyBufferRect( |
|
src, |
|
dst, |
|
src_origin, |
|
dst_origin, |
|
region, |
|
src_row_pitch, |
|
src_slice_pitch, |
|
dst_row_pitch, |
|
dst_slice_pitch, |
|
events, |
|
event); |
|
} |
|
#endif |
|
|
|
inline cl_int enqueueReadImage( |
|
const Image& image, |
|
cl_bool blocking, |
|
const size_t<3>& origin, |
|
const size_t<3>& region, |
|
::size_t row_pitch, |
|
::size_t slice_pitch, |
|
void* ptr, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) |
|
{ |
|
cl_int error; |
|
CommandQueue queue = CommandQueue::getDefault(&error); |
|
|
|
if (error != CL_SUCCESS) { |
|
return error; |
|
} |
|
|
|
return queue.enqueueReadImage( |
|
image, |
|
blocking, |
|
origin, |
|
region, |
|
row_pitch, |
|
slice_pitch, |
|
ptr, |
|
events, |
|
event); |
|
} |
|
|
|
inline cl_int enqueueWriteImage( |
|
const Image& image, |
|
cl_bool blocking, |
|
const size_t<3>& origin, |
|
const size_t<3>& region, |
|
::size_t row_pitch, |
|
::size_t slice_pitch, |
|
void* ptr, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) |
|
{ |
|
cl_int error; |
|
CommandQueue queue = CommandQueue::getDefault(&error); |
|
|
|
if (error != CL_SUCCESS) { |
|
return error; |
|
} |
|
|
|
return queue.enqueueWriteImage( |
|
image, |
|
blocking, |
|
origin, |
|
region, |
|
row_pitch, |
|
slice_pitch, |
|
ptr, |
|
events, |
|
event); |
|
} |
|
|
|
inline cl_int enqueueCopyImage( |
|
const Image& src, |
|
const Image& dst, |
|
const size_t<3>& src_origin, |
|
const size_t<3>& dst_origin, |
|
const size_t<3>& region, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) |
|
{ |
|
cl_int error; |
|
CommandQueue queue = CommandQueue::getDefault(&error); |
|
|
|
if (error != CL_SUCCESS) { |
|
return error; |
|
} |
|
|
|
return queue.enqueueCopyImage( |
|
src, |
|
dst, |
|
src_origin, |
|
dst_origin, |
|
region, |
|
events, |
|
event); |
|
} |
|
|
|
inline cl_int enqueueCopyImageToBuffer( |
|
const Image& src, |
|
const Buffer& dst, |
|
const size_t<3>& src_origin, |
|
const size_t<3>& region, |
|
::size_t dst_offset, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) |
|
{ |
|
cl_int error; |
|
CommandQueue queue = CommandQueue::getDefault(&error); |
|
|
|
if (error != CL_SUCCESS) { |
|
return error; |
|
} |
|
|
|
return queue.enqueueCopyImageToBuffer( |
|
src, |
|
dst, |
|
src_origin, |
|
region, |
|
dst_offset, |
|
events, |
|
event); |
|
} |
|
|
|
inline cl_int enqueueCopyBufferToImage( |
|
const Buffer& src, |
|
const Image& dst, |
|
::size_t src_offset, |
|
const size_t<3>& dst_origin, |
|
const size_t<3>& region, |
|
const VECTOR_CLASS<Event>* events = NULL, |
|
Event* event = NULL) |
|
{ |
|
cl_int error; |
|
CommandQueue queue = CommandQueue::getDefault(&error); |
|
|
|
if (error != CL_SUCCESS) { |
|
return error; |
|
} |
|
|
|
return queue.enqueueCopyBufferToImage( |
|
src, |
|
dst, |
|
src_offset, |
|
dst_origin, |
|
region, |
|
events, |
|
event); |
|
} |
|
|
|
|
|
inline cl_int flush(void) |
|
{ |
|
cl_int error; |
|
CommandQueue queue = CommandQueue::getDefault(&error); |
|
|
|
if (error != CL_SUCCESS) { |
|
return error; |
|
} |
|
|
|
return queue.flush(); |
|
} |
|
|
|
inline cl_int finish(void) |
|
{ |
|
cl_int error; |
|
CommandQueue queue = CommandQueue::getDefault(&error); |
|
|
|
if (error != CL_SUCCESS) { |
|
return error; |
|
} |
|
|
|
|
|
return queue.finish(); |
|
} |
|
|
|
// Kernel Functor support |
|
// New interface as of September 2011 |
|
// Requires the C++11 std::tr1::function (note do not support TR1) |
|
// Visual Studio 2010 and GCC 4.2 |
|
|
|
struct EnqueueArgs |
|
{ |
|
CommandQueue queue_; |
|
const NDRange offset_; |
|
const NDRange global_; |
|
const NDRange local_; |
|
VECTOR_CLASS<Event> events_; |
|
|
|
EnqueueArgs(NDRange global) : |
|
queue_(CommandQueue::getDefault()), |
|
offset_(NullRange), |
|
global_(global), |
|
local_(NullRange) |
|
{ |
|
|
|
} |
|
|
|
EnqueueArgs(NDRange global, NDRange local) : |
|
queue_(CommandQueue::getDefault()), |
|
offset_(NullRange), |
|
global_(global), |
|
local_(local) |
|
{ |
|
|
|
} |
|
|
|
EnqueueArgs(NDRange offset, NDRange global, NDRange local) : |
|
queue_(CommandQueue::getDefault()), |
|
offset_(offset), |
|
global_(global), |
|
local_(local) |
|
{ |
|
|
|
} |
|
|
|
EnqueueArgs(Event e, NDRange global) : |
|
queue_(CommandQueue::getDefault()), |
|
offset_(NullRange), |
|
global_(global), |
|
local_(NullRange) |
|
{ |
|
events_.push_back(e); |
|
} |
|
|
|
EnqueueArgs(Event e, NDRange global, NDRange local) : |
|
queue_(CommandQueue::getDefault()), |
|
offset_(NullRange), |
|
global_(global), |
|
local_(local) |
|
{ |
|
events_.push_back(e); |
|
} |
|
|
|
EnqueueArgs(Event e, NDRange offset, NDRange global, NDRange local) : |
|
queue_(CommandQueue::getDefault()), |
|
offset_(offset), |
|
global_(global), |
|
local_(local) |
|
{ |
|
events_.push_back(e); |
|
} |
|
|
|
EnqueueArgs(const VECTOR_CLASS<Event> &events, NDRange global) : |
|
queue_(CommandQueue::getDefault()), |
|
offset_(NullRange), |
|
global_(global), |
|
local_(NullRange), |
|
events_(events) |
|
{ |
|
|
|
} |
|
|
|
EnqueueArgs(const VECTOR_CLASS<Event> &events, NDRange global, NDRange local) : |
|
queue_(CommandQueue::getDefault()), |
|
offset_(NullRange), |
|
global_(global), |
|
local_(local), |
|
events_(events) |
|
{ |
|
|
|
} |
|
|
|
EnqueueArgs(const VECTOR_CLASS<Event> &events, NDRange offset, NDRange global, NDRange local) : |
|
queue_(CommandQueue::getDefault()), |
|
offset_(offset), |
|
global_(global), |
|
local_(local), |
|
events_(events) |
|
{ |
|
|
|
} |
|
|
|
EnqueueArgs(CommandQueue &queue, NDRange global) : |
|
queue_(queue), |
|
offset_(NullRange), |
|
global_(global), |
|
local_(NullRange) |
|
{ |
|
|
|
} |
|
|
|
EnqueueArgs(CommandQueue &queue, NDRange global, NDRange local) : |
|
queue_(queue), |
|
offset_(NullRange), |
|
global_(global), |
|
local_(local) |
|
{ |
|
|
|
} |
|
|
|
EnqueueArgs(CommandQueue &queue, NDRange offset, NDRange global, NDRange local) : |
|
queue_(queue), |
|
offset_(offset), |
|
global_(global), |
|
local_(local) |
|
{ |
|
|
|
} |
|
|
|
EnqueueArgs(CommandQueue &queue, Event e, NDRange global) : |
|
queue_(queue), |
|
offset_(NullRange), |
|
global_(global), |
|
local_(NullRange) |
|
{ |
|
events_.push_back(e); |
|
} |
|
|
|
EnqueueArgs(CommandQueue &queue, Event e, NDRange global, NDRange local) : |
|
queue_(queue), |
|
offset_(NullRange), |
|
global_(global), |
|
local_(local) |
|
{ |
|
events_.push_back(e); |
|
} |
|
|
|
EnqueueArgs(CommandQueue &queue, Event e, NDRange offset, NDRange global, NDRange local) : |
|
queue_(queue), |
|
offset_(offset), |
|
global_(global), |
|
local_(local) |
|
{ |
|
events_.push_back(e); |
|
} |
|
|
|
EnqueueArgs(CommandQueue &queue, const VECTOR_CLASS<Event> &events, NDRange global) : |
|
queue_(queue), |
|
offset_(NullRange), |
|
global_(global), |
|
local_(NullRange), |
|
events_(events) |
|
{ |
|
|
|
} |
|
|
|
EnqueueArgs(CommandQueue &queue, const VECTOR_CLASS<Event> &events, NDRange global, NDRange local) : |
|
queue_(queue), |
|
offset_(NullRange), |
|
global_(global), |
|
local_(local), |
|
events_(events) |
|
{ |
|
|
|
} |
|
|
|
EnqueueArgs(CommandQueue &queue, const VECTOR_CLASS<Event> &events, NDRange offset, NDRange global, NDRange local) : |
|
queue_(queue), |
|
offset_(offset), |
|
global_(global), |
|
local_(local), |
|
events_(events) |
|
{ |
|
|
|
} |
|
}; |
|
|
|
namespace detail { |
|
|
|
class NullType {}; |
|
|
|
template<int index, typename T0> |
|
struct SetArg |
|
{ |
|
static void set (Kernel kernel, T0 arg) |
|
{ |
|
kernel.setArg(index, arg); |
|
} |
|
}; |
|
|
|
template<int index> |
|
struct SetArg<index, NullType> |
|
{ |
|
static void set (Kernel, NullType) |
|
{ |
|
} |
|
}; |
|
|
|
template < |
|
typename T0, typename T1, typename T2, typename T3, |
|
typename T4, typename T5, typename T6, typename T7, |
|
typename T8, typename T9, typename T10, typename T11, |
|
typename T12, typename T13, typename T14, typename T15, |
|
typename T16, typename T17, typename T18, typename T19, |
|
typename T20, typename T21, typename T22, typename T23, |
|
typename T24, typename T25, typename T26, typename T27, |
|
typename T28, typename T29, typename T30, typename T31 |
|
> |
|
class KernelFunctorGlobal |
|
{ |
|
private: |
|
Kernel kernel_; |
|
|
|
public: |
|
KernelFunctorGlobal( |
|
Kernel kernel) : |
|
kernel_(kernel) |
|
{} |
|
|
|
KernelFunctorGlobal( |
|
const Program& program, |
|
const STRING_CLASS name, |
|
cl_int * err = NULL) : |
|
kernel_(program, name.c_str(), err) |
|
{} |
|
|
|
Event operator() ( |
|
const EnqueueArgs& args, |
|
T0 t0, |
|
T1 t1 = NullType(), |
|
T2 t2 = NullType(), |
|
T3 t3 = NullType(), |
|
T4 t4 = NullType(), |
|
T5 t5 = NullType(), |
|
T6 t6 = NullType(), |
|
T7 t7 = NullType(), |
|
T8 t8 = NullType(), |
|
T9 t9 = NullType(), |
|
T10 t10 = NullType(), |
|
T11 t11 = NullType(), |
|
T12 t12 = NullType(), |
|
T13 t13 = NullType(), |
|
T14 t14 = NullType(), |
|
T15 t15 = NullType(), |
|
T16 t16 = NullType(), |
|
T17 t17 = NullType(), |
|
T18 t18 = NullType(), |
|
T19 t19 = NullType(), |
|
T20 t20 = NullType(), |
|
T21 t21 = NullType(), |
|
T22 t22 = NullType(), |
|
T23 t23 = NullType(), |
|
T24 t24 = NullType(), |
|
T25 t25 = NullType(), |
|
T26 t26 = NullType(), |
|
T27 t27 = NullType(), |
|
T28 t28 = NullType(), |
|
T29 t29 = NullType(), |
|
T30 t30 = NullType(), |
|
T31 t31 = NullType() |
|
) |
|
{ |
|
Event event; |
|
SetArg<0, T0>::set(kernel_, t0); |
|
SetArg<1, T1>::set(kernel_, t1); |
|
SetArg<2, T2>::set(kernel_, t2); |
|
SetArg<3, T3>::set(kernel_, t3); |
|
SetArg<4, T4>::set(kernel_, t4); |
|
SetArg<5, T5>::set(kernel_, t5); |
|
SetArg<6, T6>::set(kernel_, t6); |
|
SetArg<7, T7>::set(kernel_, t7); |
|
SetArg<8, T8>::set(kernel_, t8); |
|
SetArg<9, T9>::set(kernel_, t9); |
|
SetArg<10, T10>::set(kernel_, t10); |
|
SetArg<11, T11>::set(kernel_, t11); |
|
SetArg<12, T12>::set(kernel_, t12); |
|
SetArg<13, T13>::set(kernel_, t13); |
|
SetArg<14, T14>::set(kernel_, t14); |
|
SetArg<15, T15>::set(kernel_, t15); |
|
SetArg<16, T16>::set(kernel_, t16); |
|
SetArg<17, T17>::set(kernel_, t17); |
|
SetArg<18, T18>::set(kernel_, t18); |
|
SetArg<19, T19>::set(kernel_, t19); |
|
SetArg<20, T20>::set(kernel_, t20); |
|
SetArg<21, T21>::set(kernel_, t21); |
|
SetArg<22, T22>::set(kernel_, t22); |
|
SetArg<23, T23>::set(kernel_, t23); |
|
SetArg<24, T24>::set(kernel_, t24); |
|
SetArg<25, T25>::set(kernel_, t25); |
|
SetArg<26, T26>::set(kernel_, t26); |
|
SetArg<27, T27>::set(kernel_, t27); |
|
SetArg<28, T28>::set(kernel_, t28); |
|
SetArg<29, T29>::set(kernel_, t29); |
|
SetArg<30, T30>::set(kernel_, t30); |
|
SetArg<31, T31>::set(kernel_, t31); |
|
|
|
args.queue_.enqueueNDRangeKernel( |
|
kernel_, |
|
args.offset_, |
|
args.global_, |
|
args.local_, |
|
&args.events_, |
|
&event); |
|
|
|
return event; |
|
} |
|
|
|
}; |
|
|
|
//------------------------------------------------------------------------------------------------------ |
|
|
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15, |
|
typename T16, |
|
typename T17, |
|
typename T18, |
|
typename T19, |
|
typename T20, |
|
typename T21, |
|
typename T22, |
|
typename T23, |
|
typename T24, |
|
typename T25, |
|
typename T26, |
|
typename T27, |
|
typename T28, |
|
typename T29, |
|
typename T30, |
|
typename T31> |
|
struct functionImplementation_ |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26, |
|
T27, |
|
T28, |
|
T29, |
|
T30, |
|
T31> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 32)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26, |
|
T27, |
|
T28, |
|
T29, |
|
T30, |
|
T31); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15, |
|
T16 arg16, |
|
T17 arg17, |
|
T18 arg18, |
|
T19 arg19, |
|
T20 arg20, |
|
T21 arg21, |
|
T22 arg22, |
|
T23 arg23, |
|
T24 arg24, |
|
T25 arg25, |
|
T26 arg26, |
|
T27 arg27, |
|
T28 arg28, |
|
T29 arg29, |
|
T30 arg30, |
|
T31 arg31) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15, |
|
arg16, |
|
arg17, |
|
arg18, |
|
arg19, |
|
arg20, |
|
arg21, |
|
arg22, |
|
arg23, |
|
arg24, |
|
arg25, |
|
arg26, |
|
arg27, |
|
arg28, |
|
arg29, |
|
arg30, |
|
arg31); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15, |
|
typename T16, |
|
typename T17, |
|
typename T18, |
|
typename T19, |
|
typename T20, |
|
typename T21, |
|
typename T22, |
|
typename T23, |
|
typename T24, |
|
typename T25, |
|
typename T26, |
|
typename T27, |
|
typename T28, |
|
typename T29, |
|
typename T30> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26, |
|
T27, |
|
T28, |
|
T29, |
|
T30, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26, |
|
T27, |
|
T28, |
|
T29, |
|
T30, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 31)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26, |
|
T27, |
|
T28, |
|
T29, |
|
T30); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15, |
|
T16 arg16, |
|
T17 arg17, |
|
T18 arg18, |
|
T19 arg19, |
|
T20 arg20, |
|
T21 arg21, |
|
T22 arg22, |
|
T23 arg23, |
|
T24 arg24, |
|
T25 arg25, |
|
T26 arg26, |
|
T27 arg27, |
|
T28 arg28, |
|
T29 arg29, |
|
T30 arg30) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15, |
|
arg16, |
|
arg17, |
|
arg18, |
|
arg19, |
|
arg20, |
|
arg21, |
|
arg22, |
|
arg23, |
|
arg24, |
|
arg25, |
|
arg26, |
|
arg27, |
|
arg28, |
|
arg29, |
|
arg30); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15, |
|
typename T16, |
|
typename T17, |
|
typename T18, |
|
typename T19, |
|
typename T20, |
|
typename T21, |
|
typename T22, |
|
typename T23, |
|
typename T24, |
|
typename T25, |
|
typename T26, |
|
typename T27, |
|
typename T28, |
|
typename T29> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26, |
|
T27, |
|
T28, |
|
T29, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26, |
|
T27, |
|
T28, |
|
T29, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 30)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26, |
|
T27, |
|
T28, |
|
T29); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15, |
|
T16 arg16, |
|
T17 arg17, |
|
T18 arg18, |
|
T19 arg19, |
|
T20 arg20, |
|
T21 arg21, |
|
T22 arg22, |
|
T23 arg23, |
|
T24 arg24, |
|
T25 arg25, |
|
T26 arg26, |
|
T27 arg27, |
|
T28 arg28, |
|
T29 arg29) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15, |
|
arg16, |
|
arg17, |
|
arg18, |
|
arg19, |
|
arg20, |
|
arg21, |
|
arg22, |
|
arg23, |
|
arg24, |
|
arg25, |
|
arg26, |
|
arg27, |
|
arg28, |
|
arg29); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15, |
|
typename T16, |
|
typename T17, |
|
typename T18, |
|
typename T19, |
|
typename T20, |
|
typename T21, |
|
typename T22, |
|
typename T23, |
|
typename T24, |
|
typename T25, |
|
typename T26, |
|
typename T27, |
|
typename T28> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26, |
|
T27, |
|
T28, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26, |
|
T27, |
|
T28, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 29)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26, |
|
T27, |
|
T28); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15, |
|
T16 arg16, |
|
T17 arg17, |
|
T18 arg18, |
|
T19 arg19, |
|
T20 arg20, |
|
T21 arg21, |
|
T22 arg22, |
|
T23 arg23, |
|
T24 arg24, |
|
T25 arg25, |
|
T26 arg26, |
|
T27 arg27, |
|
T28 arg28) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15, |
|
arg16, |
|
arg17, |
|
arg18, |
|
arg19, |
|
arg20, |
|
arg21, |
|
arg22, |
|
arg23, |
|
arg24, |
|
arg25, |
|
arg26, |
|
arg27, |
|
arg28); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15, |
|
typename T16, |
|
typename T17, |
|
typename T18, |
|
typename T19, |
|
typename T20, |
|
typename T21, |
|
typename T22, |
|
typename T23, |
|
typename T24, |
|
typename T25, |
|
typename T26, |
|
typename T27> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26, |
|
T27, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26, |
|
T27, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 28)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26, |
|
T27); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15, |
|
T16 arg16, |
|
T17 arg17, |
|
T18 arg18, |
|
T19 arg19, |
|
T20 arg20, |
|
T21 arg21, |
|
T22 arg22, |
|
T23 arg23, |
|
T24 arg24, |
|
T25 arg25, |
|
T26 arg26, |
|
T27 arg27) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15, |
|
arg16, |
|
arg17, |
|
arg18, |
|
arg19, |
|
arg20, |
|
arg21, |
|
arg22, |
|
arg23, |
|
arg24, |
|
arg25, |
|
arg26, |
|
arg27); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15, |
|
typename T16, |
|
typename T17, |
|
typename T18, |
|
typename T19, |
|
typename T20, |
|
typename T21, |
|
typename T22, |
|
typename T23, |
|
typename T24, |
|
typename T25, |
|
typename T26> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 27)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
T26); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15, |
|
T16 arg16, |
|
T17 arg17, |
|
T18 arg18, |
|
T19 arg19, |
|
T20 arg20, |
|
T21 arg21, |
|
T22 arg22, |
|
T23 arg23, |
|
T24 arg24, |
|
T25 arg25, |
|
T26 arg26) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15, |
|
arg16, |
|
arg17, |
|
arg18, |
|
arg19, |
|
arg20, |
|
arg21, |
|
arg22, |
|
arg23, |
|
arg24, |
|
arg25, |
|
arg26); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15, |
|
typename T16, |
|
typename T17, |
|
typename T18, |
|
typename T19, |
|
typename T20, |
|
typename T21, |
|
typename T22, |
|
typename T23, |
|
typename T24, |
|
typename T25> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 26)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
T25); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15, |
|
T16 arg16, |
|
T17 arg17, |
|
T18 arg18, |
|
T19 arg19, |
|
T20 arg20, |
|
T21 arg21, |
|
T22 arg22, |
|
T23 arg23, |
|
T24 arg24, |
|
T25 arg25) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15, |
|
arg16, |
|
arg17, |
|
arg18, |
|
arg19, |
|
arg20, |
|
arg21, |
|
arg22, |
|
arg23, |
|
arg24, |
|
arg25); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15, |
|
typename T16, |
|
typename T17, |
|
typename T18, |
|
typename T19, |
|
typename T20, |
|
typename T21, |
|
typename T22, |
|
typename T23, |
|
typename T24> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 25)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
T24); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15, |
|
T16 arg16, |
|
T17 arg17, |
|
T18 arg18, |
|
T19 arg19, |
|
T20 arg20, |
|
T21 arg21, |
|
T22 arg22, |
|
T23 arg23, |
|
T24 arg24) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15, |
|
arg16, |
|
arg17, |
|
arg18, |
|
arg19, |
|
arg20, |
|
arg21, |
|
arg22, |
|
arg23, |
|
arg24); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15, |
|
typename T16, |
|
typename T17, |
|
typename T18, |
|
typename T19, |
|
typename T20, |
|
typename T21, |
|
typename T22, |
|
typename T23> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 24)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
T23); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15, |
|
T16 arg16, |
|
T17 arg17, |
|
T18 arg18, |
|
T19 arg19, |
|
T20 arg20, |
|
T21 arg21, |
|
T22 arg22, |
|
T23 arg23) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15, |
|
arg16, |
|
arg17, |
|
arg18, |
|
arg19, |
|
arg20, |
|
arg21, |
|
arg22, |
|
arg23); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15, |
|
typename T16, |
|
typename T17, |
|
typename T18, |
|
typename T19, |
|
typename T20, |
|
typename T21, |
|
typename T22> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 23)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
T22); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15, |
|
T16 arg16, |
|
T17 arg17, |
|
T18 arg18, |
|
T19 arg19, |
|
T20 arg20, |
|
T21 arg21, |
|
T22 arg22) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15, |
|
arg16, |
|
arg17, |
|
arg18, |
|
arg19, |
|
arg20, |
|
arg21, |
|
arg22); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15, |
|
typename T16, |
|
typename T17, |
|
typename T18, |
|
typename T19, |
|
typename T20, |
|
typename T21> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 22)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
T21); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15, |
|
T16 arg16, |
|
T17 arg17, |
|
T18 arg18, |
|
T19 arg19, |
|
T20 arg20, |
|
T21 arg21) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15, |
|
arg16, |
|
arg17, |
|
arg18, |
|
arg19, |
|
arg20, |
|
arg21); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15, |
|
typename T16, |
|
typename T17, |
|
typename T18, |
|
typename T19, |
|
typename T20> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 21)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
T20); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15, |
|
T16 arg16, |
|
T17 arg17, |
|
T18 arg18, |
|
T19 arg19, |
|
T20 arg20) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15, |
|
arg16, |
|
arg17, |
|
arg18, |
|
arg19, |
|
arg20); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15, |
|
typename T16, |
|
typename T17, |
|
typename T18, |
|
typename T19> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 20)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
T19); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15, |
|
T16 arg16, |
|
T17 arg17, |
|
T18 arg18, |
|
T19 arg19) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15, |
|
arg16, |
|
arg17, |
|
arg18, |
|
arg19); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15, |
|
typename T16, |
|
typename T17, |
|
typename T18> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 19)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
T18); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15, |
|
T16 arg16, |
|
T17 arg17, |
|
T18 arg18) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15, |
|
arg16, |
|
arg17, |
|
arg18); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15, |
|
typename T16, |
|
typename T17> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 18)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
T17); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15, |
|
T16 arg16, |
|
T17 arg17) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15, |
|
arg16, |
|
arg17); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15, |
|
typename T16> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 17)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
T16); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15, |
|
T16 arg16) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15, |
|
arg16); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14, |
|
typename T15> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 16)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
T15); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14, |
|
T15 arg15) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14, |
|
arg15); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13, |
|
typename T14> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 15)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
T14); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13, |
|
T14 arg14) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13, |
|
arg14); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12, |
|
typename T13> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 14)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
T13); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12, |
|
T13 arg13) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12, |
|
arg13); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11, |
|
typename T12> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 13)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
T12); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11, |
|
T12 arg12) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11, |
|
arg12); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10, |
|
typename T11> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 12)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
T11); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10, |
|
T11 arg11) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10, |
|
arg11); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9, |
|
typename T10> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 11)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
T10); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9, |
|
T10 arg10) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9, |
|
arg10); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8, |
|
typename T9> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 10)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
T9); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8, |
|
T9 arg9) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8, |
|
arg9); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7, |
|
typename T8> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 9)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
T8); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7, |
|
T8 arg8) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7, |
|
arg8); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6, |
|
typename T7> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 8)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
T7); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6, |
|
T7 arg7) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6, |
|
arg7); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5, |
|
typename T6> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 7)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
T6); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5, |
|
T6 arg6) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5, |
|
arg6); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4, |
|
typename T5> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 6)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
T5); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4, |
|
T5 arg5) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4, |
|
arg5); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3, |
|
typename T4> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 5)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
T4); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3, |
|
T4 arg4) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3, |
|
arg4); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2, |
|
typename T3> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
T3, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
T3, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 4)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2, |
|
T3); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2, |
|
T3 arg3) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2, |
|
arg3); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1, |
|
typename T2> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
T2, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
T2, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 3)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1, |
|
T2); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1, |
|
T2 arg2) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1, |
|
arg2); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0, |
|
typename T1> |
|
struct functionImplementation_ |
|
< T0, |
|
T1, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
T1, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 2)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0, |
|
T1); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0, |
|
T1 arg1) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0, |
|
arg1); |
|
} |
|
|
|
|
|
}; |
|
|
|
template< |
|
typename T0> |
|
struct functionImplementation_ |
|
< T0, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> |
|
{ |
|
typedef detail::KernelFunctorGlobal< |
|
T0, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType, |
|
NullType> FunctorType; |
|
|
|
FunctorType functor_; |
|
|
|
functionImplementation_(const FunctorType &functor) : |
|
functor_(functor) |
|
{ |
|
|
|
#if (defined(_WIN32) && defined(_VARIADIC_MAX) && (_VARIADIC_MAX < 1)) |
|
// Fail variadic expansion for dev11 |
|
static_assert(0, "Visual Studio has a hard limit of argument count for a std::function expansion. Please define _VARIADIC_MAX to be 10. If you need more arguments than that VC12 and below cannot support it."); |
|
#endif |
|
|
|
} |
|
|
|
//! \brief Return type of the functor |
|
typedef Event result_type; |
|
|
|
//! \brief Function signature of kernel functor with no event dependency. |
|
typedef Event type_( |
|
const EnqueueArgs&, |
|
T0); |
|
|
|
Event operator()( |
|
const EnqueueArgs& enqueueArgs, |
|
T0 arg0) |
|
{ |
|
return functor_( |
|
enqueueArgs, |
|
arg0); |
|
} |
|
|
|
|
|
}; |
|
|
|
|
|
|
|
|
|
|
|
} // namespace detail |
|
|
|
//---------------------------------------------------------------------------------------------- |
|
|
|
template < |
|
typename T0, typename T1 = detail::NullType, typename T2 = detail::NullType, |
|
typename T3 = detail::NullType, typename T4 = detail::NullType, |
|
typename T5 = detail::NullType, typename T6 = detail::NullType, |
|
typename T7 = detail::NullType, typename T8 = detail::NullType, |
|
typename T9 = detail::NullType, typename T10 = detail::NullType, |
|
typename T11 = detail::NullType, typename T12 = detail::NullType, |
|
typename T13 = detail::NullType, typename T14 = detail::NullType, |
|
typename T15 = detail::NullType, typename T16 = detail::NullType, |
|
typename T17 = detail::NullType, typename T18 = detail::NullType, |
|
typename T19 = detail::NullType, typename T20 = detail::NullType, |
|
typename T21 = detail::NullType, typename T22 = detail::NullType, |
|
typename T23 = detail::NullType, typename T24 = detail::NullType, |
|
typename T25 = detail::NullType, typename T26 = detail::NullType, |
|
typename T27 = detail::NullType, typename T28 = detail::NullType, |
|
typename T29 = detail::NullType, typename T30 = detail::NullType, |
|
typename T31 = detail::NullType |
|
> |
|
struct make_kernel : |
|
public detail::functionImplementation_< |
|
T0, T1, T2, T3, |
|
T4, T5, T6, T7, |
|
T8, T9, T10, T11, |
|
T12, T13, T14, T15, |
|
T16, T17, T18, T19, |
|
T20, T21, T22, T23, |
|
T24, T25, T26, T27, |
|
T28, T29, T30, T31 |
|
> |
|
{ |
|
public: |
|
typedef detail::KernelFunctorGlobal< |
|
T0, T1, T2, T3, |
|
T4, T5, T6, T7, |
|
T8, T9, T10, T11, |
|
T12, T13, T14, T15, |
|
T16, T17, T18, T19, |
|
T20, T21, T22, T23, |
|
T24, T25, T26, T27, |
|
T28, T29, T30, T31 |
|
> FunctorType; |
|
|
|
make_kernel( |
|
const Program& program, |
|
const STRING_CLASS name, |
|
cl_int * err = NULL) : |
|
detail::functionImplementation_< |
|
T0, T1, T2, T3, |
|
T4, T5, T6, T7, |
|
T8, T9, T10, T11, |
|
T12, T13, T14, T15, |
|
T16, T17, T18, T19, |
|
T20, T21, T22, T23, |
|
T24, T25, T26, T27, |
|
T28, T29, T30, T31 |
|
>( |
|
FunctorType(program, name, err)) |
|
{} |
|
|
|
make_kernel( |
|
const Kernel kernel) : |
|
detail::functionImplementation_< |
|
T0, T1, T2, T3, |
|
T4, T5, T6, T7, |
|
T8, T9, T10, T11, |
|
T12, T13, T14, T15, |
|
T16, T17, T18, T19, |
|
T20, T21, T22, T23, |
|
T24, T25, T26, T27, |
|
T28, T29, T30, T31 |
|
>( |
|
FunctorType(kernel)) |
|
{} |
|
}; |
|
|
|
|
|
//---------------------------------------------------------------------------------------------------------------------- |
|
|
|
#undef __ERR_STR |
|
#if !defined(__CL_USER_OVERRIDE_ERROR_STRINGS) |
|
#undef __GET_DEVICE_INFO_ERR |
|
#undef __GET_PLATFORM_INFO_ERR |
|
#undef __GET_DEVICE_IDS_ERR |
|
#undef __GET_CONTEXT_INFO_ERR |
|
#undef __GET_EVENT_INFO_ERR |
|
#undef __GET_EVENT_PROFILE_INFO_ERR |
|
#undef __GET_MEM_OBJECT_INFO_ERR |
|
#undef __GET_IMAGE_INFO_ERR |
|
#undef __GET_SAMPLER_INFO_ERR |
|
#undef __GET_KERNEL_INFO_ERR |
|
#undef __GET_KERNEL_ARG_INFO_ERR |
|
#undef __GET_KERNEL_WORK_GROUP_INFO_ERR |
|
#undef __GET_PROGRAM_INFO_ERR |
|
#undef __GET_PROGRAM_BUILD_INFO_ERR |
|
#undef __GET_COMMAND_QUEUE_INFO_ERR |
|
|
|
#undef __CREATE_CONTEXT_ERR |
|
#undef __CREATE_CONTEXT_FROM_TYPE_ERR |
|
#undef __GET_SUPPORTED_IMAGE_FORMATS_ERR |
|
|
|
#undef __CREATE_BUFFER_ERR |
|
#undef __CREATE_SUBBUFFER_ERR |
|
#undef __CREATE_IMAGE2D_ERR |
|
#undef __CREATE_IMAGE3D_ERR |
|
#undef __CREATE_SAMPLER_ERR |
|
#undef __SET_MEM_OBJECT_DESTRUCTOR_CALLBACK_ERR |
|
|
|
#undef __CREATE_USER_EVENT_ERR |
|
#undef __SET_USER_EVENT_STATUS_ERR |
|
#undef __SET_EVENT_CALLBACK_ERR |
|
#undef __SET_PRINTF_CALLBACK_ERR |
|
|
|
#undef __WAIT_FOR_EVENTS_ERR |
|
|
|
#undef __CREATE_KERNEL_ERR |
|
#undef __SET_KERNEL_ARGS_ERR |
|
#undef __CREATE_PROGRAM_WITH_SOURCE_ERR |
|
#undef __CREATE_PROGRAM_WITH_BINARY_ERR |
|
#undef __CREATE_PROGRAM_WITH_BUILT_IN_KERNELS_ERR |
|
#undef __BUILD_PROGRAM_ERR |
|
#undef __CREATE_KERNELS_IN_PROGRAM_ERR |
|
|
|
#undef __CREATE_COMMAND_QUEUE_ERR |
|
#undef __SET_COMMAND_QUEUE_PROPERTY_ERR |
|
#undef __ENQUEUE_READ_BUFFER_ERR |
|
#undef __ENQUEUE_WRITE_BUFFER_ERR |
|
#undef __ENQUEUE_READ_BUFFER_RECT_ERR |
|
#undef __ENQUEUE_WRITE_BUFFER_RECT_ERR |
|
#undef __ENQEUE_COPY_BUFFER_ERR |
|
#undef __ENQEUE_COPY_BUFFER_RECT_ERR |
|
#undef __ENQUEUE_READ_IMAGE_ERR |
|
#undef __ENQUEUE_WRITE_IMAGE_ERR |
|
#undef __ENQUEUE_COPY_IMAGE_ERR |
|
#undef __ENQUEUE_COPY_IMAGE_TO_BUFFER_ERR |
|
#undef __ENQUEUE_COPY_BUFFER_TO_IMAGE_ERR |
|
#undef __ENQUEUE_MAP_BUFFER_ERR |
|
#undef __ENQUEUE_MAP_IMAGE_ERR |
|
#undef __ENQUEUE_UNMAP_MEM_OBJECT_ERR |
|
#undef __ENQUEUE_NDRANGE_KERNEL_ERR |
|
#undef __ENQUEUE_TASK_ERR |
|
#undef __ENQUEUE_NATIVE_KERNEL |
|
|
|
#undef __CL_EXPLICIT_CONSTRUCTORS |
|
|
|
#undef __UNLOAD_COMPILER_ERR |
|
#endif //__CL_USER_OVERRIDE_ERROR_STRINGS |
|
|
|
#undef __CL_FUNCTION_TYPE |
|
|
|
// Extensions |
|
/** |
|
* Deprecated APIs for 1.2 |
|
*/ |
|
#if defined(CL_VERSION_1_1) |
|
#undef __INIT_CL_EXT_FCN_PTR |
|
#endif // #if defined(CL_VERSION_1_1) |
|
#undef __CREATE_SUB_DEVICES |
|
|
|
#if defined(USE_CL_DEVICE_FISSION) |
|
#undef __PARAM_NAME_DEVICE_FISSION |
|
#endif // USE_CL_DEVICE_FISSION |
|
|
|
#undef __DEFAULT_NOT_INITIALIZED |
|
#undef __DEFAULT_BEING_INITIALIZED |
|
#undef __DEFAULT_INITIALIZED |
|
|
|
} // namespace cl |
|
|
|
#ifdef _WIN32 |
|
#pragma pop_macro("max") |
|
#endif // _WIN32 |
|
|
|
#endif // CL_HPP_
|
|
|