OpenFPM_pdata  4.1.0
Project that contain the implementation of distributed structures
 
Loading...
Searching...
No Matches
cub::BlockLoad< InputT, BLOCK_DIM_X, ITEMS_PER_THREAD, ALGORITHM, BLOCK_DIM_Y, BLOCK_DIM_Z, PTX_ARCH >::LoadInternal< BLOCK_LOAD_VECTORIZE, DUMMY > Struct Template Reference

Detailed Description

template<typename InputT, int BLOCK_DIM_X, int ITEMS_PER_THREAD, BlockLoadAlgorithm ALGORITHM = BLOCK_LOAD_DIRECT, int BLOCK_DIM_Y = 1, int BLOCK_DIM_Z = 1, int PTX_ARCH = CUB_PTX_ARCH>
template<int DUMMY>
struct cub::BlockLoad< InputT, BLOCK_DIM_X, ITEMS_PER_THREAD, ALGORITHM, BLOCK_DIM_Y, BLOCK_DIM_Z, PTX_ARCH >::LoadInternal< BLOCK_LOAD_VECTORIZE, DUMMY >

BLOCK_LOAD_VECTORIZE specialization of load helper

Definition at line 722 of file block_load.cuh.

Public Types

typedef NullType TempStorage
 Shared memory storage layout type.
 

Public Member Functions

__device__ __forceinline__ LoadInternal (TempStorage &, int linear_tid)
 Constructor.
 
template<typename InputIteratorT >
__device__ __forceinline__ void Load (InputT *block_ptr, InputT(&items)[ITEMS_PER_THREAD])
 Load a linear segment of items from memory, specialized for native pointer types (attempts vectorization)
 
template<typename InputIteratorT >
__device__ __forceinline__ void Load (const InputT *block_ptr, InputT(&items)[ITEMS_PER_THREAD])
 Load a linear segment of items from memory, specialized for native pointer types (attempts vectorization)
 
template<CacheLoadModifier MODIFIER, typename ValueType , typename OffsetT >
__device__ __forceinline__ void Load (CacheModifiedInputIterator< MODIFIER, ValueType, OffsetT > block_itr, InputT(&items)[ITEMS_PER_THREAD])
 Load a linear segment of items from memory, specialized for native pointer types (attempts vectorization)
 
template<typename _InputIteratorT >
__device__ __forceinline__ void Load (_InputIteratorT block_itr, InputT(&items)[ITEMS_PER_THREAD])
 Load a linear segment of items from memory, specialized for opaque input iterators (skips vectorization)
 
template<typename InputIteratorT >
__device__ __forceinline__ void Load (InputIteratorT block_itr, InputT(&items)[ITEMS_PER_THREAD], int valid_items)
 Load a linear segment of items from memory, guarded by range (skips vectorization)
 
template<typename InputIteratorT , typename DefaultT >
__device__ __forceinline__ void Load (InputIteratorT block_itr, InputT(&items)[ITEMS_PER_THREAD], int valid_items, DefaultT oob_default)
 Load a linear segment of items from memory, guarded by range, with a fall-back assignment of out-of-bound elements (skips vectorization)
 

Data Fields

int linear_tid
 Linear thread-id.
 

The documentation for this struct was generated from the following file: