template<bool IS_DESCENDING, typename KeyT, typename ValueT, typename OffsetT>
struct cub::DispatchRadixSort< IS_DESCENDING, KeyT, ValueT, OffsetT >
Template parameter OffsetT: signed integer type for global offsets.
Utility class for dispatching the appropriately-tuned kernels for device-wide radix sort
Definition at line 807 of file dispatch_radix_sort.cuh.
|
CUB_RUNTIME_FUNCTION __forceinline__ | DispatchRadixSort (void *d_temp_storage, size_t &temp_storage_bytes, DoubleBuffer< KeyT > &d_keys, DoubleBuffer< ValueT > &d_values, OffsetT num_items, int begin_bit, int end_bit, bool is_overwrite_okay, cudaStream_t stream, bool debug_synchronous, int ptx_version) |
| Constructor.
|
|
template<typename ActivePolicyT , typename SingleTileKernelT > |
CUB_RUNTIME_FUNCTION __forceinline__ cudaError_t | InvokeSingleTile (SingleTileKernelT single_tile_kernel) |
| Invoke a single block to sort in-core. More...
|
|
template<typename PassConfigT > |
CUB_RUNTIME_FUNCTION __forceinline__ cudaError_t | InvokePass (const KeyT *d_keys_in, KeyT *d_keys_out, const ValueT *d_values_in, ValueT *d_values_out, OffsetT *d_spine, int spine_length, int &current_bit, PassConfigT &pass_config) |
|
template<typename ActivePolicyT , typename UpsweepKernelT , typename ScanKernelT , typename DownsweepKernelT > |
CUB_RUNTIME_FUNCTION __forceinline__ cudaError_t | InvokePasses (UpsweepKernelT upsweep_kernel, UpsweepKernelT alt_upsweep_kernel, ScanKernelT scan_kernel, DownsweepKernelT downsweep_kernel, DownsweepKernelT alt_downsweep_kernel) |
| Invocation (run multiple digit passes) More...
|
|
template<typename ActivePolicyT > |
CUB_RUNTIME_FUNCTION __forceinline__ cudaError_t | Invoke () |
| Invocation.
|
|
|
void * | d_temp_storage |
| [in] Device-accessible allocation of temporary storage. When NULL, the required allocation size is written to temp_storage_bytes and no work is done.
|
|
size_t & | temp_storage_bytes |
| [in,out] Reference to size in bytes of d_temp_storage allocation
|
|
DoubleBuffer< KeyT > & | d_keys |
| [in,out] Double-buffer whose current buffer contains the unsorted input keys and, upon return, is updated to point to the sorted output keys
|
|
DoubleBuffer< ValueT > & | d_values |
| [in,out] Double-buffer whose current buffer contains the unsorted input values and, upon return, is updated to point to the sorted output values
|
|
OffsetT | num_items |
| [in] Number of items to sort
|
|
int | begin_bit |
| [in] The beginning (least-significant) bit index needed for key comparison
|
|
int | end_bit |
| [in] The past-the-end (most-significant) bit index needed for key comparison
|
|
cudaStream_t | stream |
| [in] CUDA stream to launch kernels within. Default is stream 0.
|
|
bool | debug_synchronous |
| [in] Whether or not to synchronize the stream after every kernel launch to check for errors. Also causes launch configurations to be printed to the console. Default is false.
|
|
int | ptx_version |
| [in] PTX version
|
|
bool | is_overwrite_okay |
| [in] Whether it is okay to overwrite source buffers
|
|
template<bool IS_DESCENDING, typename KeyT , typename ValueT , typename OffsetT >
template<typename PassConfigT >
CUB_RUNTIME_FUNCTION __forceinline__ cudaError_t cub::DispatchRadixSort< IS_DESCENDING, KeyT, ValueT, OffsetT >::InvokePass |
( |
const KeyT * |
d_keys_in, |
|
|
KeyT * |
d_keys_out, |
|
|
const ValueT * |
d_values_in, |
|
|
ValueT * |
d_values_out, |
|
|
OffsetT * |
d_spine, |
|
|
int |
spine_length, |
|
|
int & |
current_bit, |
|
|
PassConfigT & |
pass_config |
|
) |
| |
|
inline |
template<bool IS_DESCENDING, typename KeyT , typename ValueT , typename OffsetT >
template<typename ActivePolicyT , typename UpsweepKernelT , typename ScanKernelT , typename DownsweepKernelT >
CUB_RUNTIME_FUNCTION __forceinline__ cudaError_t cub::DispatchRadixSort< IS_DESCENDING, KeyT, ValueT, OffsetT >::InvokePasses |
( |
UpsweepKernelT |
upsweep_kernel, |
|
|
UpsweepKernelT |
alt_upsweep_kernel, |
|
|
ScanKernelT |
scan_kernel, |
|
|
DownsweepKernelT |
downsweep_kernel, |
|
|
DownsweepKernelT |
alt_downsweep_kernel |
|
) |
| |
|
inline |
Invocation (run multiple digit passes)
Template parameter DownsweepKernelT: function type of cub::DeviceRadixSortDownsweepKernel
- Parameters
-
[in] | upsweep_kernel | Kernel function pointer to parameterization of cub::DeviceRadixSortUpsweepKernel |
[in] | alt_upsweep_kernel | Alternate kernel function pointer to parameterization of cub::DeviceRadixSortUpsweepKernel |
[in] | scan_kernel | Kernel function pointer to parameterization of cub::SpineScanKernel |
[in] | downsweep_kernel | Kernel function pointer to parameterization of cub::DeviceRadixSortDownsweepKernel |
[in] | alt_downsweep_kernel | Alternate kernel function pointer to parameterization of cub::DeviceRadixSortDownsweepKernel |
Definition at line 1096 of file dispatch_radix_sort.cuh.
template<bool IS_DESCENDING, typename KeyT , typename ValueT , typename OffsetT >
template<typename ActivePolicyT , typename SingleTileKernelT >
CUB_RUNTIME_FUNCTION __forceinline__ cudaError_t cub::DispatchRadixSort< IS_DESCENDING, KeyT, ValueT, OffsetT >::InvokeSingleTile |
( |
SingleTileKernelT |
single_tile_kernel | ) |
|
|
inline |
Invoke a single block to sort in-core.
Template parameter SingleTileKernelT: function type of cub::DeviceRadixSortSingleTileKernel
- Parameters
-
[in] | single_tile_kernel | Kernel function pointer to parameterization of cub::DeviceRadixSortSingleTileKernel |
Definition at line 880 of file dispatch_radix_sort.cuh.