doxygen/openfpm/device__partition_8cuh_source.html

/******************************************************************************

 * Copyright (c) 2011, Duane Merrill.  All rights reserved.

 * Copyright (c) 2011-2018, NVIDIA CORPORATION.  All rights reserved.

 *

 * Redistribution and use in source and binary forms, with or without

 * modification, are permitted provided that the following conditions are met:

 *     * Redistributions of source code must retain the above copyright

 *       notice, this list of conditions and the following disclaimer.

 *     * Redistributions in binary form must reproduce the above copyright

 *       notice, this list of conditions and the following disclaimer in the

 *       documentation and/or other materials provided with the distribution.

 *     * Neither the name of the NVIDIA CORPORATION nor the

 *       names of its contributors may be used to endorse or promote products

 *       derived from this software without specific prior written permission.

 *

 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND

 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED

 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE

 * DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE FOR ANY

 * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES

 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;

 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND

 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS

 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 *

 ******************************************************************************/


#pragma once


#include <stdio.h>

#include <iterator>


#include "dispatch/dispatch_select_if.cuh"

#include "../util_namespace.cuh"


CUB_NS_PREFIX


namespace cub {


/**
 * \brief DevicePartition provides device-wide, parallel operations for
 *        partitioning sequences of data items.
 *
 * Both entry points are thin, stateless forwarders: they choose the template
 * arguments for DispatchSelectIf and hand every runtime argument through to
 * DispatchSelectIf::Dispatch unchanged.
 *
 * NOTE(review): the trailing `true` template argument given to
 * DispatchSelectIf is presumably what selects partition (keep-rejects)
 * behaviour rather than plain selection -- confirm against
 * dispatch_select_if.cuh.
 */
struct DevicePartition
{
    /**
     * \brief Uses the \p d_flags sequence to split the corresponding items
     *        from \p d_in into a partitioned sequence \p d_out.
     *
     * \param d_temp_storage      Temporary storage pointer, forwarded as-is to
     *                            the dispatch layer (see DispatchSelectIf::Dispatch
     *                            for its exact contract).
     * \param temp_storage_bytes  Reference to the size of \p d_temp_storage,
     *                            forwarded as-is to the dispatch layer.
     * \param d_in                Input sequence of data items.
     * \param d_flags             Flag sequence that drives the split.
     * \param d_out               Destination of the partitioned sequence.
     * \param d_num_selected_out  [out] Pointer to the total number of items selected.
     * \param num_items           [in] Total number of input data items.
     * \param stream              CUDA stream handed to the dispatch layer (default 0).
     * \param debug_synchronous   Debug switch handed to the dispatch layer (default false).
     *
     * \return The cudaError_t produced by DispatchSelectIf::Dispatch.
     */
    template <
        typename InputIteratorT,
        typename FlagIterator,
        typename OutputIteratorT,
        typename NumSelectedIteratorT>
    CUB_RUNTIME_FUNCTION __forceinline__
    static cudaError_t Flagged(
        void*                   d_temp_storage,
        size_t&                 temp_storage_bytes,
        InputIteratorT          d_in,
        FlagIterator            d_flags,
        OutputIteratorT         d_out,
        NumSelectedIteratorT    d_num_selected_out,
        int                     num_items,
        cudaStream_t            stream            = 0,
        bool                    debug_synchronous = false)
    {
        // Signed integer type used for global offsets.
        typedef int      OffsetT;

        // Flag-driven partitioning needs neither a predicate nor an equality
        // functor; NullType placeholders fill those template slots.
        typedef NullType UnusedSelectOp;
        typedef NullType UnusedEqualityOp;

        // Name the dispatch specialization once so the call below stays readable.
        typedef DispatchSelectIf<
            InputIteratorT,
            FlagIterator,
            OutputIteratorT,
            NumSelectedIteratorT,
            UnusedSelectOp,
            UnusedEqualityOp,
            OffsetT,
            true> PartitionDispatchT;

        return PartitionDispatchT::Dispatch(
            d_temp_storage, temp_storage_bytes,
            d_in, d_flags, d_out, d_num_selected_out,
            UnusedSelectOp(), UnusedEqualityOp(),
            num_items, stream, debug_synchronous);
    }

    /**
     * \brief Uses the \p select_op functor to split the corresponding items
     *        from \p d_in into a partitioned sequence \p d_out.
     *
     * \param d_temp_storage      Temporary storage pointer, forwarded as-is to
     *                            the dispatch layer (see DispatchSelectIf::Dispatch
     *                            for its exact contract).
     * \param temp_storage_bytes  Reference to the size of \p d_temp_storage,
     *                            forwarded as-is to the dispatch layer.
     * \param d_in                Input sequence of data items.
     * \param d_out               Destination of the partitioned sequence.
     * \param d_num_selected_out  [out] Pointer to the total number of items selected.
     * \param num_items           [in] Total number of input data items.
     * \param select_op           [in] Selection operator.
     * \param stream              CUDA stream handed to the dispatch layer (default 0).
     * \param debug_synchronous   Debug switch handed to the dispatch layer (default false).
     *
     * \return The cudaError_t produced by DispatchSelectIf::Dispatch.
     */
    template <
        typename InputIteratorT,
        typename OutputIteratorT,
        typename NumSelectedIteratorT,
        typename SelectOp>
    CUB_RUNTIME_FUNCTION __forceinline__
    static cudaError_t If(
        void*                   d_temp_storage,
        size_t&                 temp_storage_bytes,
        InputIteratorT          d_in,
        OutputIteratorT         d_out,
        NumSelectedIteratorT    d_num_selected_out,
        int                     num_items,
        SelectOp                select_op,
        cudaStream_t            stream            = 0,
        bool                    debug_synchronous = false)
    {
        // Signed integer type used for global offsets.
        typedef int       OffsetT;

        // Predicate-driven partitioning reads no flag sequence and needs no
        // equality functor; NullType-based placeholders fill those slots.
        typedef NullType* UnusedFlagIterator;
        typedef NullType  UnusedEqualityOp;

        // Name the dispatch specialization once so the call below stays readable.
        typedef DispatchSelectIf<
            InputIteratorT,
            UnusedFlagIterator,
            OutputIteratorT,
            NumSelectedIteratorT,
            SelectOp,
            UnusedEqualityOp,
            OffsetT,
            true> PartitionDispatchT;

        // Null pointer standing in for the flag sequence this overload does not take.
        UnusedFlagIterator no_flags = NULL;

        return PartitionDispatchT::Dispatch(
            d_temp_storage, temp_storage_bytes,
            d_in, no_flags, d_out, d_num_selected_out,
            select_op, UnusedEqualityOp(),
            num_items, stream, debug_synchronous);
    }
};


}               // CUB namespace

CUB_NS_POSTFIX  // Optional outer namespace(s)


dispatch_select_if.cuh

cub
Optional outer namespace(s)
Definition agent_histogram.cuh:48

cub::select_op
FlagsInputIteratorT SelectedOutputIteratorT NumSelectedIteratorT ScanTileStateT SelectOpT select_op
[in] Selection operator
Definition dispatch_select_if.cuh:82

cub::num_items
KeyT const ValueT ValueT OffsetT OffsetT num_items
[in] Total number of input data items
Definition dispatch_radix_sort.cuh:168

cub::d_num_selected_out
FlagsInputIteratorT SelectedOutputIteratorT NumSelectedIteratorT d_num_selected_out
[out] Pointer to the total number of items selected (i.e., length of d_selected_out)
Definition dispatch_select_if.cuh:80

cub::d_flags
FlagsInputIteratorT d_flags
[in] Pointer to the input sequence of selection flags
Definition dispatch_select_if.cuh:78

cub::OffsetT
OffsetT OffsetT
[in] Total number of input data items
Definition dispatch_radix_sort.cuh:75

cub::d_out
OutputIteratorT d_out
[out] Pointer to the output sequence of data items
Definition dispatch_reduce.cuh:71

cub::DevicePartition
DevicePartition provides device-wide, parallel operations for partitioning sequences of data items re...
Definition device_partition.cuh:74

cub::DevicePartition::Flagged
CUB_RUNTIME_FUNCTION static __forceinline__ cudaError_t Flagged(void *d_temp_storage, size_t &temp_storage_bytes, InputIteratorT d_in, FlagIterator d_flags, OutputIteratorT d_out, NumSelectedIteratorT d_num_selected_out, int num_items, cudaStream_t stream=0, bool debug_synchronous=false)
Uses the d_flags sequence to split the corresponding items from d_in into a partitioned sequence d_ou...
Definition device_partition.cuh:126

cub::DevicePartition::If
CUB_RUNTIME_FUNCTION static __forceinline__ cudaError_t If(void *d_temp_storage, size_t &temp_storage_bytes, InputIteratorT d_in, OutputIteratorT d_out, NumSelectedIteratorT d_num_selected_out, int num_items, SelectOp select_op, cudaStream_t stream=0, bool debug_synchronous=false)
Uses the select_op functor to split the corresponding items from d_in into a partitioned sequence d_o...
Definition device_partition.cuh:234

cub::DispatchSelectIf::Dispatch
CUB_RUNTIME_FUNCTION static __forceinline__ cudaError_t Dispatch(void *d_temp_storage, size_t &temp_storage_bytes, InputIteratorT d_in, FlagsInputIteratorT d_flags, SelectedOutputIteratorT d_selected_out, NumSelectedIteratorT d_num_selected_out, SelectOpT select_op, EqualityOpT equality_op, OffsetT num_items, cudaStream_t stream, bool debug_synchronous, int, ScanInitKernelPtrT scan_init_kernel, SelectIfKernelPtrT select_if_kernel, KernelConfig select_if_config)
Function type of cub::SelectIfKernelPtrT
Definition dispatch_select_if.cuh:344

cub::NullType
A simple "NULL" marker type.
Definition util_type.cuh:257