10 #define GPUGENIE_SCAN_THREADBLOCK_SIZE (256)
11 #define GPUGENIE_SCAN_MIN_SHORT_ARRAY_SIZE (4)
12 #define GPUGENIE_SCAN_MAX_SHORT_ARRAY_SIZE (4*GPUGENIE_SCAN_THREADBLOCK_SIZE) // 1024
13 #define GPUGENIE_SCAN_MIN_LARGE_ARRAY_SIZE (8*GPUGENIE_SCAN_THREADBLOCK_SIZE) // 2048
14 #define GPUGENIE_SCAN_MAX_LARGE_ARRAY_SIZE (4*GPUGENIE_SCAN_THREADBLOCK_SIZE*GPUGENIE_SCAN_THREADBLOCK_SIZE) // 262144
73 unsigned int arrayLength);
78 unsigned int arrayLength);
83 unsigned int arrayLength);
const unsigned int SCAN_THREADBLOCK_SIZE
__device__ void d_scanExclusivePerBlockShared(uint4 *d_Dst, uint4 *d_Src, uint activeThreads, uint pow2size)
This is the top-level namespace of the project.
__device__ void d_scanInclusivePerBlockShared(uint4 *d_Dst, uint4 *d_Src, uint activeThreads, uint pow2size)
const unsigned int SCAN_MIN_LARGE_ARRAY_SIZE
uint h_pow2ceil_32(uint x)
size_t scanExclusiveShort(unsigned int *d_Dst, unsigned int *d_Src, unsigned int arrayLength)
__device__ void d_scanExclusiveShared(uint4 *d_Dst, uint4 *d_Src, uint activeThreads, uint pow2size)
size_t scanExclusiveLarge(unsigned int *d_Dst, unsigned int *d_Src, unsigned int arrayLength)
__global__ void g_scanExclusiveShared(uint4 *d_Dst, uint4 *d_Src, uint activeThreads, uint pow2size)
__device__ uint d_pow2ceil_32(uint x)
__device__ void d_scanInclusiveShared(uint4 *d_Dst, uint4 *d_Src, uint activeThreads, uint pow2size)
__global__ void g_scanInclusiveShared(uint4 *d_Dst, uint4 *d_Src, uint activeThreads, uint pow2size)
const unsigned int SCAN_MAX_SHORT_ARRAY_SIZE
void scanExclusiveHost(unsigned int *dst, unsigned int *src, unsigned int arrayLength)
const unsigned int SCAN_MIN_SHORT_ARRAY_SIZE
const unsigned int SCAN_MAX_LARGE_ARRAY_SIZE