@ -54,7 +54,7 @@ namespace cv { namespace cuda { namespace device
template < typename T >
__device__ __forceinline__ T shfl ( T val , int srcLane , int width = warpSize )
{
# if __CUDA_ARCH__ >= 300
# if defined __CUDA_ARCH__ && __CUDA_ARCH__ >= 300
return __shfl ( val , srcLane , width ) ;
# else
return T ( ) ;
@ -62,7 +62,7 @@ namespace cv { namespace cuda { namespace device
}
__device__ __forceinline__ unsigned int shfl ( unsigned int val , int srcLane , int width = warpSize )
{
# if __CUDA_ARCH__ >= 300
# if defined __CUDA_ARCH__ && __CUDA_ARCH__ >= 300
return ( unsigned int ) __shfl ( ( int ) val , srcLane , width ) ;
# else
return 0 ;
@ -70,7 +70,7 @@ namespace cv { namespace cuda { namespace device
}
__device__ __forceinline__ double shfl ( double val , int srcLane , int width = warpSize )
{
# if __CUDA_ARCH__ >= 300
# if defined __CUDA_ARCH__ && __CUDA_ARCH__ >= 300
int lo = __double2loint ( val ) ;
int hi = __double2hiint ( val ) ;
@ -86,7 +86,7 @@ namespace cv { namespace cuda { namespace device
template < typename T >
__device__ __forceinline__ T shfl_down ( T val , unsigned int delta , int width = warpSize )
{
# if __CUDA_ARCH__ >= 300
# if defined __CUDA_ARCH__ && __CUDA_ARCH__ >= 300
return __shfl_down ( val , delta , width ) ;
# else
return T ( ) ;
@ -94,7 +94,7 @@ namespace cv { namespace cuda { namespace device
}
__device__ __forceinline__ unsigned int shfl_down ( unsigned int val , unsigned int delta , int width = warpSize )
{
# if __CUDA_ARCH__ >= 300
# if defined __CUDA_ARCH__ && __CUDA_ARCH__ >= 300
return ( unsigned int ) __shfl_down ( ( int ) val , delta , width ) ;
# else
return 0 ;
@ -102,7 +102,7 @@ namespace cv { namespace cuda { namespace device
}
__device__ __forceinline__ double shfl_down ( double val , unsigned int delta , int width = warpSize )
{
# if __CUDA_ARCH__ >= 300
# if defined __CUDA_ARCH__ && __CUDA_ARCH__ >= 300
int lo = __double2loint ( val ) ;
int hi = __double2hiint ( val ) ;
@ -118,7 +118,7 @@ namespace cv { namespace cuda { namespace device
template < typename T >
__device__ __forceinline__ T shfl_up ( T val , unsigned int delta , int width = warpSize )
{
# if __CUDA_ARCH__ >= 300
# if defined __CUDA_ARCH__ && __CUDA_ARCH__ >= 300
return __shfl_up ( val , delta , width ) ;
# else
return T ( ) ;
@ -126,7 +126,7 @@ namespace cv { namespace cuda { namespace device
}
__device__ __forceinline__ unsigned int shfl_up ( unsigned int val , unsigned int delta , int width = warpSize )
{
# if __CUDA_ARCH__ >= 300
# if defined __CUDA_ARCH__ && __CUDA_ARCH__ >= 300
return ( unsigned int ) __shfl_up ( ( int ) val , delta , width ) ;
# else
return 0 ;
@ -134,7 +134,7 @@ namespace cv { namespace cuda { namespace device
}
__device__ __forceinline__ double shfl_up ( double val , unsigned int delta , int width = warpSize )
{
# if __CUDA_ARCH__ >= 300
# if defined __CUDA_ARCH__ && __CUDA_ARCH__ >= 300
int lo = __double2loint ( val ) ;
int hi = __double2hiint ( val ) ;