|  | 
| template<typename T> | 
| __device__ __forceinline__ T | cv::gpu::device::shfl (T val, int srcLane, int width=warpSize) | 
|  | 
| __device__ __forceinline__ unsigned int | cv::gpu::device::shfl (unsigned int val, int srcLane, int width=warpSize) | 
|  | 
| __device__ __forceinline__ double | cv::gpu::device::shfl (double val, int srcLane, int width=warpSize) | 
|  | 
| template<typename T> | 
| __device__ __forceinline__ T | cv::gpu::device::shfl_down (T val, unsigned int delta, int width=warpSize) | 
|  | 
| __device__ __forceinline__ unsigned int | cv::gpu::device::shfl_down (unsigned int val, unsigned int delta, int width=warpSize) | 
|  | 
| __device__ __forceinline__ double | cv::gpu::device::shfl_down (double val, unsigned int delta, int width=warpSize) | 
|  | 
| template<typename T> | 
| __device__ __forceinline__ T | cv::gpu::device::shfl_up (T val, unsigned int delta, int width=warpSize) | 
|  | 
| __device__ __forceinline__ unsigned int | cv::gpu::device::shfl_up (unsigned int val, unsigned int delta, int width=warpSize) | 
|  | 
| __device__ __forceinline__ double | cv::gpu::device::shfl_up (double val, unsigned int delta, int width=warpSize) | 
|  |