Signed integer type for global offsets. More...
Signed integer type for global offsets.
Utility class for dispatching the appropriately-tuned kernels for DeviceRle
Definition at line 121 of file dispatch_rle.cuh.
| Data Structures | |
| struct | KernelConfig | 
| struct | Policy100 | 
| SM10.  More... | |
| struct | Policy130 | 
| SM13.  More... | |
| struct | Policy200 | 
| SM20.  More... | |
| struct | Policy300 | 
| SM30.  More... | |
| struct | Policy350 | 
| SM35.  More... | |
| struct | PtxRleSweepPolicy | 
| Public Types | |
| enum | { INIT_KERNEL_THREADS = 128 } | 
| typedef std::iterator_traits< InputIteratorT >::value_type | T | 
| typedef If<(Equals< typename std::iterator_traits< LengthsOutputIteratorT >::value_type, void >::VALUE), OffsetT, typename std::iterator_traits< LengthsOutputIteratorT >::value_type >::Type | LengthT | 
| typedef ReduceByKeyScanTileState< LengthT, OffsetT > | ScanTileStateT | 
| typedef Policy100 | PtxPolicy | 
| Static Public Member Functions | |
| template<typename KernelConfig > | |
| CUB_RUNTIME_FUNCTION static __forceinline__ void | InitConfigs (int ptx_version, KernelConfig &device_rle_config) | 
| template<typename DeviceScanInitKernelPtr , typename DeviceRleSweepKernelPtr > | |
| CUB_RUNTIME_FUNCTION static __forceinline__ cudaError_t | Dispatch (void *d_temp_storage, size_t &temp_storage_bytes, InputIteratorT d_in, OffsetsOutputIteratorT d_offsets_out, LengthsOutputIteratorT d_lengths_out, NumRunsOutputIteratorT d_num_runs_out, EqualityOpT equality_op, OffsetT num_items, cudaStream_t stream, bool debug_synchronous, int ptx_version, DeviceScanInitKernelPtr device_scan_init_kernel, DeviceRleSweepKernelPtr device_rle_sweep_kernel, KernelConfig device_rle_config) | 
| Function type of cub::DeviceRleSweepKernelPtr | |
| CUB_RUNTIME_FUNCTION static __forceinline__ cudaError_t | Dispatch (void *d_temp_storage, size_t &temp_storage_bytes, InputIteratorT d_in, OffsetsOutputIteratorT d_offsets_out, LengthsOutputIteratorT d_lengths_out, NumRunsOutputIteratorT d_num_runs_out, EqualityOpT equality_op, OffsetT num_items, cudaStream_t stream, bool debug_synchronous) | 
| typedef If<(Equals<typename std::iterator_traits<LengthsOutputIteratorT>::value_type,void>::VALUE),OffsetT,typename std::iterator_traits<LengthsOutputIteratorT>::value_type>::Type cub::DeviceRleDispatch< InputIteratorT, OffsetsOutputIteratorT, LengthsOutputIteratorT, NumRunsOutputIteratorT, EqualityOpT, OffsetT >::LengthT | 
Definition at line 133 of file dispatch_rle.cuh.
| typedef Policy100 cub::DeviceRleDispatch< InputIteratorT, OffsetsOutputIteratorT, LengthsOutputIteratorT, NumRunsOutputIteratorT, EqualityOpT, OffsetT >::PtxPolicy | 
Definition at line 256 of file dispatch_rle.cuh.
| typedef ReduceByKeyScanTileState<LengthT, OffsetT> cub::DeviceRleDispatch< InputIteratorT, OffsetsOutputIteratorT, LengthsOutputIteratorT, NumRunsOutputIteratorT, EqualityOpT, OffsetT >::ScanTileStateT | 
Definition at line 141 of file dispatch_rle.cuh.
| typedef std::iterator_traits<InputIteratorT>::value_type cub::DeviceRleDispatch< InputIteratorT, OffsetsOutputIteratorT, LengthsOutputIteratorT, NumRunsOutputIteratorT, EqualityOpT, OffsetT >::T | 
Definition at line 128 of file dispatch_rle.cuh.
| anonymous enum | 
Definition at line 135 of file dispatch_rle.cuh.
| 
 | inline static | 
Internal dispatch routine
| [in] | d_temp_storage | Device-accessible allocation of temporary storage. When NULL, the required allocation size is written to temp_storage_bytes and no work is done. | 
| [in,out] | temp_storage_bytes | Reference to size in bytes of d_temp_storage allocation | 
| [in] | d_in | Pointer to input sequence of data items | 
| [out] | d_offsets_out | Pointer to output sequence of run-offsets | 
| [out] | d_lengths_out | Pointer to output sequence of run-lengths | 
| [out] | d_num_runs_out | Pointer to total number of runs (i.e., length of d_offsets_out) | 
| [in] | equality_op | Equality operator for input items | 
| [in] | num_items | Total number of input items (i.e., length of d_in) | 
| [in] | stream | [optional] CUDA stream to launch kernels within. Default is stream 0. | 
| [in] | debug_synchronous | [optional] Whether or not to synchronize the stream after every kernel launch to check for errors. Also causes launch configurations to be printed to the console. Default is false. | 
Definition at line 484 of file dispatch_rle.cuh.
| 
 | inline static | 
Function type of cub::DeviceRleSweepKernelPtr
Internal dispatch routine for computing a device-wide run-length-encode using the specified kernel functions.
| [in] | d_temp_storage | Device-accessible allocation of temporary storage. When NULL, the required allocation size is written to temp_storage_bytes and no work is done. | 
| [in,out] | temp_storage_bytes | Reference to size in bytes of d_temp_storage allocation | 
| [in] | d_in | Pointer to the input sequence of data items | 
| [out] | d_offsets_out | Pointer to the output sequence of run-offsets | 
| [out] | d_lengths_out | Pointer to the output sequence of run-lengths | 
| [out] | d_num_runs_out | Pointer to the total number of runs encountered (i.e., length of d_offsets_out) | 
| [in] | equality_op | Equality operator for input items | 
| [in] | num_items | Total number of input items (i.e., length of d_in) | 
| [in] | stream | CUDA stream to launch kernels within. Default is stream 0. | 
| [in] | debug_synchronous | Whether or not to synchronize the stream after every kernel launch to check for errors. Also causes launch configurations to be printed to the console. Default is false. | 
| [in] | ptx_version | PTX version of dispatch kernels | 
| [in] | device_scan_init_kernel | Kernel function pointer to parameterization of cub::DeviceScanInitKernel | 
| [in] | device_rle_sweep_kernel | Kernel function pointer to parameterization of cub::DeviceRleSweepKernel | 
| [in] | device_rle_config | Dispatch parameters that match the policy that device_rle_sweep_kernel was compiled for | 
Definition at line 357 of file dispatch_rle.cuh.
| 
 | inline static | 
Initialize kernel dispatch configurations with the policies corresponding to the PTX assembly we will use
Definition at line 273 of file dispatch_rle.cuh.