// Extracted from: doxygen/openfpm/util__type_8cuh_source.html

/******************************************************************************

 * Copyright (c) 2011, Duane Merrill.  All rights reserved.

 * Copyright (c) 2011-2018, NVIDIA CORPORATION.  All rights reserved.

 *

 * Redistribution and use in source and binary forms, with or without

 * modification, are permitted provided that the following conditions are met:

 *     * Redistributions of source code must retain the above copyright

 *       notice, this list of conditions and the following disclaimer.

 *     * Redistributions in binary form must reproduce the above copyright

 *       notice, this list of conditions and the following disclaimer in the

 *       documentation and/or other materials provided with the distribution.

 *     * Neither the name of the NVIDIA CORPORATION nor the

 *       names of its contributors may be used to endorse or promote products

 *       derived from this software without specific prior written permission.

 *

 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND

 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED

 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE

 * DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE FOR ANY

 * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES

 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;

 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND

 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS

 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 *

 ******************************************************************************/


#pragma once


#include <iostream>

#include <limits>

#include <cfloat>


#if (__CUDACC_VER_MAJOR__ >= 9)

    #include <cuda_fp16.h>

#endif


#include "util_macro.cuh"

#include "util_arch.cuh"

#include "util_namespace.cuh"


CUB_NS_PREFIX


namespace cub {


/******************************************************************************

 * Conditional types (compile-time type selection)

 ******************************************************************************/


/**
 * \brief Compile-time type selection: <tt>IF ? ThenType : ElseType</tt>.
 *
 * \tparam IF        Boolean selector evaluated at compile time
 * \tparam ThenType  Type exposed as \p Type when \p IF is true
 * \tparam ElseType  Type exposed as \p Type when \p IF is false
 */
template <bool IF, typename ThenType, typename ElseType>
struct If
{
    /// Selected type. The primary template handles the <tt>IF == true</tt> case.
    typedef ThenType Type;
};

#ifndef DOXYGEN_SHOULD_SKIP_THIS    // Do not document

// Partial specialization picked when the selector is false.
template <typename TrueT, typename FalseT>
struct If<false, TrueT, FalseT>
{
    typedef FalseT Type;
};

#endif // DOXYGEN_SHOULD_SKIP_THIS


/******************************************************************************

 * Type equality

 ******************************************************************************/


/**
 * \brief Compile-time test of whether two types are the same type.
 *
 * \p VALUE is 1 when \p A and \p B are identical and 0 otherwise;
 * \p NEGATE is always the logical complement of \p VALUE.
 */
template <typename A, typename B>
struct Equals
{
    // Primary template: the two types differ.
    enum { VALUE = 0, NEGATE = 1 };
};

#ifndef DOXYGEN_SHOULD_SKIP_THIS    // Do not document

// Partial specialization matched only when both arguments are the same type.
template <typename SameT>
struct Equals <SameT, SameT>
{
    enum { VALUE = 1, NEGATE = 0 };
};

#endif // DOXYGEN_SHOULD_SKIP_THIS


/******************************************************************************

 * Static math

 ******************************************************************************/


/**
 * \brief Compile-time base-2 logarithm of \p N, rounded up.
 *
 * The recursion shifts \p CURRENT_VAL right one bit per step while counting
 * the steps in \p COUNT; when the running value reaches zero the base case
 * decides whether the result has to be rounded up.
 *
 * \tparam N            Value whose logarithm is computed
 * \tparam CURRENT_VAL  Recursion state (callers leave this defaulted)
 * \tparam COUNT        Recursion state (callers leave this defaulted)
 */
template <int N, int CURRENT_VAL = N, int COUNT = 0>
struct Log2
{
    // Inductive case: drop one bit, count one more shift.
    enum
    {
        VALUE = Log2<N, (CURRENT_VAL >> 1), (COUNT + 1)>::VALUE
    };
};

#ifndef DOXYGEN_SHOULD_SKIP_THIS    // Do not document

// Base case: the running value has been shifted down to zero.
// COUNT - 1 is the index of N's highest set bit; one is added back when
// 2^(COUNT - 1) is still strictly below N (i.e. N is not a power of two).
template <int N, int COUNT>
struct Log2<N, 0, COUNT>
{
    enum
    {
        VALUE = ((1 << (COUNT - 1)) < N) ? COUNT : (COUNT - 1)
    };
};

#endif // DOXYGEN_SHOULD_SKIP_THIS


/**
 * \brief Compile-time test of whether \p N has at most one bit set.
 *
 * \p VALUE is 1 when <tt>N & (N - 1)</tt> is zero and 0 otherwise.
 * Note that this check also yields 1 for <tt>N == 0</tt>.
 */
template <int N>
struct PowerOfTwo
{
    enum
    {
        VALUE = (N & (N - 1)) ? 0 : 1
    };
};


/******************************************************************************

 * Pointer vs. iterator detection

 ******************************************************************************/


/**
 * \brief Compile-time test of whether \p Tp is a raw pointer type.
 *
 * \p VALUE is 1 for types of the form <tt>U*</tt> and 0 for everything else.
 */
template <typename Tp>
struct IsPointer
{
    // Primary template: not a pointer.
    enum { VALUE = 0 };
};

#ifndef DOXYGEN_SHOULD_SKIP_THIS    // Do not document

// Partial specialization matched by any unqualified pointer type.
template <typename PointeeT>
struct IsPointer<PointeeT*>
{
    enum { VALUE = 1 };
};

#endif // DOXYGEN_SHOULD_SKIP_THIS


/******************************************************************************

 * Qualifier detection

 ******************************************************************************/


/**
 * \brief Compile-time test of whether \p Tp is volatile-qualified.
 *
 * \p VALUE is 1 when the top-level type carries \p volatile, 0 otherwise.
 */
template <typename Tp>
struct IsVolatile
{
    // Primary template: no volatile qualifier.
    enum { VALUE = 0 };
};

#ifndef DOXYGEN_SHOULD_SKIP_THIS    // Do not document

// Partial specialization matched by any volatile-qualified type.
template <typename BareT>
struct IsVolatile<volatile BareT>
{
    enum { VALUE = 1 };
};

#endif // DOXYGEN_SHOULD_SKIP_THIS


/******************************************************************************

 * Qualifier removal

 ******************************************************************************/


/**
 * \brief Strips top-level \p const / \p volatile from \p Tp.
 *
 * The second parameter defaults to \p Tp and exists only so that partial
 * specializations can pattern-match on the qualifiers; callers supply just
 * the first argument and read the result from \p Type.
 */
template <typename Tp, typename Up = Tp>
struct RemoveQualifiers
{
    /// Primary template: nothing to strip, so the type is passed through.
    typedef Up Type;
};


#ifndef DOXYGEN_SHOULD_SKIP_THIS    // Do not document


// RemoveQualifiers: the deduced type is volatile-qualified.
template <typename Tp, typename Up>
struct RemoveQualifiers<Tp, Up volatile>
{
    typedef Up Type;
};

// RemoveQualifiers: the deduced type is const-qualified.
template <typename Tp, typename Up>
struct RemoveQualifiers<Tp, Up const>
{
    typedef Up Type;
};

// RemoveQualifiers: the deduced type is both const- and volatile-qualified.
template <typename Tp, typename Up>
struct RemoveQualifiers<Tp, Up const volatile>
{
    typedef Up Type;
};


/******************************************************************************

 * Marker types

 ******************************************************************************/


/**
 * \brief Empty marker type used where a template argument or value is
 *        intentionally absent.
 *
 * Assignment from any type is accepted and ignored, and all NullType values
 * compare equal to one another.
 */
struct NullType
{
#ifndef DOXYGEN_SHOULD_SKIP_THIS    // Do not document

    /// Accepts assignment from any value and discards it.
    template <typename T>
    __host__ __device__ __forceinline__ NullType& operator =(const T&) { return *this; }

    /// Always true. Const-qualified so it can be applied to const operands.
    __host__ __device__ __forceinline__ bool operator ==(const NullType&) const { return true; }

    /// Always false. Const-qualified so it can be applied to const operands.
    __host__ __device__ __forceinline__ bool operator !=(const NullType&) const { return false; }

#endif // DOXYGEN_SHOULD_SKIP_THIS
};


/**
 * \brief Wraps an integral constant in a distinct type so that it can be
 *        used for overload selection at compile time.
 *
 * \tparam A  The constant, exposed again as \p VALUE
 */
template <int A>
struct Int2Type
{
    enum
    {
        VALUE = A
    };
};


#ifndef DOXYGEN_SHOULD_SKIP_THIS    // Do not document


/******************************************************************************

 * Size and alignment

 ******************************************************************************/


/**
 * \brief Reports the alignment of \p T as observed through struct layout.
 *
 * \p ALIGN_BYTES is the number of bytes by which a struct grows when a
 * single \p char is appended after a \p T member; \p Type is \p T itself.
 */
template <typename T>
struct AlignBytes
{
    /// Type to use for storage; the primary template passes \p T through.
    typedef T Type;

    /// Layout probe: a T followed by one byte plus any tail padding.
    struct Pad
    {
        T       val;
        char    byte;
    };

    enum
    {
        /// Growth caused by the trailing byte (the byte itself plus padding).
        ALIGN_BYTES = sizeof(Pad) - sizeof(T)
    };
};


// Specializations where host C++ compilers (e.g., 32-bit Windows) may disagree

// with device C++ compilers (EDG) on types passed as template parameters through

// kernel functions


// Declares an explicit AlignBytes specialization for type `t` with a fixed
// alignment of `b` bytes; `Type` becomes `t` decorated with __align__(b).
// The continuation backslashes must be immediately followed by the next line
// of the macro body: a blank line after a backslash ends the definition.
#define __CUB_ALIGN_BYTES(t, b)         \
    template <> struct AlignBytes<t>    \
    { enum { ALIGN_BYTES = b }; typedef __align__(b) t Type; };


// Types pinned to 8-byte alignment.
__CUB_ALIGN_BYTES(short4, 8)
__CUB_ALIGN_BYTES(ushort4, 8)
__CUB_ALIGN_BYTES(int2, 8)
__CUB_ALIGN_BYTES(uint2, 8)
__CUB_ALIGN_BYTES(long long, 8)
__CUB_ALIGN_BYTES(unsigned long long, 8)
__CUB_ALIGN_BYTES(float2, 8)
__CUB_ALIGN_BYTES(double, 8)
// long2 / ulong2 are pinned to 8 bytes when _WIN32 is defined and to 16 bytes
// otherwise.
#ifdef _WIN32
    __CUB_ALIGN_BYTES(long2, 8)
    __CUB_ALIGN_BYTES(ulong2, 8)
#else
    __CUB_ALIGN_BYTES(long2, 16)
    __CUB_ALIGN_BYTES(ulong2, 16)
#endif
// Types pinned to 16-byte alignment.
__CUB_ALIGN_BYTES(int4, 16)
__CUB_ALIGN_BYTES(uint4, 16)
__CUB_ALIGN_BYTES(float4, 16)
__CUB_ALIGN_BYTES(long4, 16)
__CUB_ALIGN_BYTES(ulong4, 16)
__CUB_ALIGN_BYTES(longlong2, 16)
__CUB_ALIGN_BYTES(ulonglong2, 16)
__CUB_ALIGN_BYTES(double2, 16)
__CUB_ALIGN_BYTES(longlong4, 16)
__CUB_ALIGN_BYTES(ulonglong4, 16)
__CUB_ALIGN_BYTES(double4, 16)


// cv-qualified types report the same alignment as their unqualified form.
template <typename T>
struct AlignBytes<T volatile> : AlignBytes<T>
{};

template <typename T>
struct AlignBytes<T const> : AlignBytes<T>
{};

template <typename T>
struct AlignBytes<T const volatile> : AlignBytes<T>
{};


/**
 * \brief Chooses unsigned "word" types into which a \p T can be divided.
 *
 * A candidate word qualifies when sizeof(T) is a multiple of the word's size
 * and T's alignment is a multiple of the word's alignment. Each typedef
 * below picks the widest qualifying candidate from its own candidate list.
 */
template <typename T>
struct UnitWord
{
    enum
    {
        ALIGN_BYTES = AlignBytes<T>::ALIGN_BYTES
    };

    /// Tests whether T can be tiled exactly with words of type \p Unit.
    template <typename Unit>
    struct IsMultiple
    {
        enum
        {
            UNIT_ALIGN_BYTES    = AlignBytes<Unit>::ALIGN_BYTES,
            IS_MULTIPLE         = ((sizeof(T) % sizeof(Unit)) == 0) && ((ALIGN_BYTES % UNIT_ALIGN_BYTES) == 0)
        };
    };

    /// Widest of {unsigned int, unsigned short, unsigned char} that tiles T
    typedef typename If<
        IsMultiple<int>::IS_MULTIPLE,
        unsigned int,
        typename If<
            IsMultiple<short>::IS_MULTIPLE,
            unsigned short,
            unsigned char>::Type>::Type
        ShuffleWord;

    /// unsigned long long when it tiles T, otherwise ShuffleWord
    typedef typename If<
        IsMultiple<long long>::IS_MULTIPLE,
        unsigned long long,
        ShuffleWord>::Type
        VolatileWord;

    /// ulonglong2 when it tiles T, otherwise VolatileWord
    typedef typename If<
        IsMultiple<longlong2>::IS_MULTIPLE,
        ulonglong2,
        VolatileWord>::Type
        DeviceWord;

    /// uint4, then uint2, when they tile T; otherwise ShuffleWord
    typedef typename If<
        IsMultiple<int4>::IS_MULTIPLE,
        uint4,
        typename If<
            IsMultiple<int2>::IS_MULTIPLE,
            uint2,
            ShuffleWord>::Type>::Type
        TextureWord;
};


// Explicit word choices for float2. The first preprocessor branch is taken
// only when CUB_PTX_ARCH is in the range (0, 130], i.e. the SM10-SM13
// workaround; every other build uses 64-bit words.
template <>
struct UnitWord <float2>
{
    // Architecture-independent choices
    typedef int                 ShuffleWord;
    typedef float2              TextureWord;

#if (CUB_PTX_ARCH > 0) && (CUB_PTX_ARCH <= 130)
    typedef float               VolatileWord;
    typedef uint2               DeviceWord;
#else
    typedef unsigned long long  VolatileWord;
    typedef unsigned long long  DeviceWord;
#endif
};


// Explicit word choices for float4. The first preprocessor branch is taken
// only when CUB_PTX_ARCH is in the range (0, 130], i.e. the SM10-SM13
// workaround; every other build uses 64-bit / 128-bit integer words.
template <>
struct UnitWord <float4>
{
    // Architecture-independent choices
    typedef int                 ShuffleWord;
    typedef float4              TextureWord;

#if (CUB_PTX_ARCH > 0) && (CUB_PTX_ARCH <= 130)
    typedef float               VolatileWord;
    typedef uint4               DeviceWord;
#else
    typedef unsigned long long  VolatileWord;
    typedef ulonglong2          DeviceWord;
#endif
};


// Explicit word choices for char2. Only DeviceWord depends on the target:
// it is (signed) short when CUB_PTX_ARCH is in the range (0, 130], i.e. the
// SM10-SM13 workaround, and unsigned short otherwise.
template <>
struct UnitWord <char2>
{
    // Architecture-independent choices
    typedef unsigned short      ShuffleWord;
    typedef unsigned short      VolatileWord;
    typedef unsigned short      TextureWord;

#if (CUB_PTX_ARCH > 0) && (CUB_PTX_ARCH <= 130)
    typedef short               DeviceWord;
#else
    typedef unsigned short      DeviceWord;
#endif
};


// cv-qualified types use the same word types as their unqualified form.
template <typename T>
struct UnitWord<T volatile> : UnitWord<T>
{};

template <typename T>
struct UnitWord<T const> : UnitWord<T>
{};

template <typename T>
struct UnitWord<T const volatile> : UnitWord<T>
{};


#endif // DOXYGEN_SHOULD_SKIP_THIS


/******************************************************************************

 * Vector type inference utilities.

 ******************************************************************************/


/**
 * \brief Vector of \p vec_elements components of type \p T.
 *
 * Only declared here; the usable definitions are the specializations for
 * one to four elements that follow.
 */
template <typename T, int vec_elements> struct CubVector;


#ifndef DOXYGEN_SHOULD_SKIP_THIS    // Do not document


// Largest element count for which a CubVector specialization is defined in this file.
enum { MAX_VEC_ELEMENTS = 4 };


// Generic one-component vector for arbitrary element types.
template <typename T>
struct CubVector<T, 1>
{
    typedef T                   BaseType;   // element type
    typedef CubVector<T, 1>     Type;       // the vector type itself

    T x;
};


// Generic two-component vector for arbitrary element types.
template <typename T>
struct CubVector<T, 2>
{
    typedef T                   BaseType;   // element type
    typedef CubVector<T, 2>     Type;       // the vector type itself

    T x;
    T y;
};


// Generic three-component vector for arbitrary element types.
template <typename T>
struct CubVector<T, 3>
{
    typedef T                   BaseType;   // element type
    typedef CubVector<T, 3>     Type;       // the vector type itself

    T x;
    T y;
    T z;
};


// Generic four-component vector for arbitrary element types.
template <typename T>
struct CubVector<T, 4>
{
    typedef T                   BaseType;   // element type
    typedef CubVector<T, 4>     Type;       // the vector type itself

    T x;
    T y;
    T z;
    T w;
};


// Defines CubVector<base_type, 1..4> as thin wrappers deriving from the
// built-in vector structs short_type##1 .. short_type##4. Each wrapper
// exposes BaseType / Type typedefs and component-wise operator+ / operator-.
// Every line of the macro body must end in a backslash that is directly
// followed by the next body line; a blank line would end the definition.
#define CUB_DEFINE_VECTOR_TYPE(base_type,short_type)                                                    \
                                                                                                        \
    template<> struct CubVector<base_type, 1> : short_type##1                                           \
    {                                                                                                   \
        typedef base_type       BaseType;                                                               \
        typedef short_type##1   Type;                                                                   \
        __host__ __device__ __forceinline__ CubVector operator+(const CubVector &other) const {         \
            CubVector retval;                                                                           \
            retval.x = x + other.x;                                                                     \
            return retval;                                                                              \
        }                                                                                               \
        __host__ __device__ __forceinline__ CubVector operator-(const CubVector &other) const {         \
            CubVector retval;                                                                           \
            retval.x = x - other.x;                                                                     \
            return retval;                                                                              \
        }                                                                                               \
    };                                                                                                  \
                                                                                                        \
    template<> struct CubVector<base_type, 2> : short_type##2                                           \
    {                                                                                                   \
        typedef base_type       BaseType;                                                               \
        typedef short_type##2   Type;                                                                   \
        __host__ __device__ __forceinline__ CubVector operator+(const CubVector &other) const {         \
            CubVector retval;                                                                           \
            retval.x = x + other.x;                                                                     \
            retval.y = y + other.y;                                                                     \
            return retval;                                                                              \
        }                                                                                               \
        __host__ __device__ __forceinline__ CubVector operator-(const CubVector &other) const {         \
            CubVector retval;                                                                           \
            retval.x = x - other.x;                                                                     \
            retval.y = y - other.y;                                                                     \
            return retval;                                                                              \
        }                                                                                               \
    };                                                                                                  \
                                                                                                        \
    template<> struct CubVector<base_type, 3> : short_type##3                                           \
    {                                                                                                   \
        typedef base_type       BaseType;                                                               \
        typedef short_type##3   Type;                                                                   \
        __host__ __device__ __forceinline__ CubVector operator+(const CubVector &other) const {         \
            CubVector retval;                                                                           \
            retval.x = x + other.x;                                                                     \
            retval.y = y + other.y;                                                                     \
            retval.z = z + other.z;                                                                     \
            return retval;                                                                              \
        }                                                                                               \
        __host__ __device__ __forceinline__ CubVector operator-(const CubVector &other) const {         \
            CubVector retval;                                                                           \
            retval.x = x - other.x;                                                                     \
            retval.y = y - other.y;                                                                     \
            retval.z = z - other.z;                                                                     \
            return retval;                                                                              \
        }                                                                                               \
    };                                                                                                  \
                                                                                                        \
    template<> struct CubVector<base_type, 4> : short_type##4                                           \
    {                                                                                                   \
        typedef base_type       BaseType;                                                               \
        typedef short_type##4   Type;                                                                   \
        __host__ __device__ __forceinline__ CubVector operator+(const CubVector &other) const {         \
            CubVector retval;                                                                           \
            retval.x = x + other.x;                                                                     \
            retval.y = y + other.y;                                                                     \
            retval.z = z + other.z;                                                                     \
            retval.w = w + other.w;                                                                     \
            return retval;                                                                              \
        }                                                                                               \
        __host__ __device__ __forceinline__ CubVector operator-(const CubVector &other) const {         \
            CubVector retval;                                                                           \
            retval.x = x - other.x;                                                                     \
            retval.y = y - other.y;                                                                     \
            retval.z = z - other.z;                                                                     \
            retval.w = w - other.w;                                                                     \
            return retval;                                                                              \
        }                                                                                               \
    };


// Expand CUDA vector types for built-in primitives.
// First argument: the element type used as the CubVector key.
// Second argument: the prefix of the built-in vector struct family
// (prefix##1 .. prefix##4) that the specializations derive from.
// Note that `char` and `signed char` both map onto the char family, and
// `bool` maps onto the uchar family.
CUB_DEFINE_VECTOR_TYPE(char,               char)
CUB_DEFINE_VECTOR_TYPE(signed char,        char)
CUB_DEFINE_VECTOR_TYPE(short,              short)
CUB_DEFINE_VECTOR_TYPE(int,                int)
CUB_DEFINE_VECTOR_TYPE(long,               long)
CUB_DEFINE_VECTOR_TYPE(long long,          longlong)
CUB_DEFINE_VECTOR_TYPE(unsigned char,      uchar)
CUB_DEFINE_VECTOR_TYPE(unsigned short,     ushort)
CUB_DEFINE_VECTOR_TYPE(unsigned int,       uint)
CUB_DEFINE_VECTOR_TYPE(unsigned long,      ulong)
CUB_DEFINE_VECTOR_TYPE(unsigned long long, ulonglong)
CUB_DEFINE_VECTOR_TYPE(float,              float)
CUB_DEFINE_VECTOR_TYPE(double,             double)
CUB_DEFINE_VECTOR_TYPE(bool,               uchar)

// Undefine macros: the helper is not needed past this point.
#undef CUB_DEFINE_VECTOR_TYPE


#endif // DOXYGEN_SHOULD_SKIP_THIS


/******************************************************************************

 * Wrapper types

 ******************************************************************************/


/**
 * \brief Raw backing store with the size of a \p T, declared as an array of
 *        words so that no \p T constructor runs.
 *
 * The storage consists of <tt>sizeof(T) / sizeof(DeviceWord)</tt> elements of
 * <tt>UnitWord<T>::DeviceWord</tt>; Alias() reinterprets it as a \p T.
 */
template <typename T>
struct Uninitialized
{
    /// Word type the storage is built from
    typedef typename UnitWord<T>::DeviceWord DeviceWord;

    enum
    {
        /// Number of DeviceWord elements needed to cover one T
        WORDS = sizeof(T) / sizeof(DeviceWord)
    };

    /// Backing words
    DeviceWord storage[WORDS];

    /// Returns a reference that views this object as a \p T.
    __host__ __device__ __forceinline__ T& Alias()
    {
        return *reinterpret_cast<T*>(this);
    }
};


/**
 * \brief Simple key/value aggregate.
 *
 * \tparam _Key    Type of the \p key member
 * \tparam _Value  Type of the \p value member
 *
 * On 32-bit Windows builds two extra defaulted boolean parameters record
 * which of the two types has the smaller AlignBytes alignment; they select
 * the explicitly padded specializations and are never supplied by callers.
 */
template <
    typename    _Key,
    typename    _Value
#if defined(_WIN32) && !defined(_WIN64)
    , bool KeyIsLT = (AlignBytes<_Key>::ALIGN_BYTES < AlignBytes<_Value>::ALIGN_BYTES)
    , bool ValIsLT = (AlignBytes<_Value>::ALIGN_BYTES < AlignBytes<_Key>::ALIGN_BYTES)
#endif // #if defined(_WIN32) && !defined(_WIN64)
    >
struct KeyValuePair
{
    typedef _Key    Key;        ///< Key data type
    typedef _Value  Value;      ///< Value data type

    Key     key;                ///< Item key
    Value   value;              ///< Item value

    /// Default constructor; leaves both members default-initialized.
    __host__ __device__ __forceinline__
    KeyValuePair() {}

    /// Constructs the pair from copies of \p key and \p value.
    __host__ __device__ __forceinline__
    KeyValuePair(Key const& key, Value const& value) : key(key), value(value) {}

    /// True when either the values or the keys differ.
    /// Const-qualified so that const pairs can be compared.
    __host__ __device__ __forceinline__ bool operator !=(const KeyValuePair &b) const
    {
        return (value != b.value) || (key != b.key);
    }
};


#if defined(_WIN32) && !defined(_WIN64)


// KeyValuePair layout used when the key's AlignBytes alignment is smaller
// than the value's: the value is stored first and explicit tail padding of
// (value alignment - key alignment) bytes is appended.
template <typename K, typename V>
struct KeyValuePair<K, V, true, false>
{
    typedef K Key;
    typedef V Value;

    // Explicit padding sized by the difference of the two alignments
    typedef char Pad[AlignBytes<V>::ALIGN_BYTES - AlignBytes<K>::ALIGN_BYTES];

    Value   value;  // Value has larger would-be alignment and goes first
    Key     key;
    Pad     pad;

    /// Default constructor; leaves all members default-initialized.
    __host__ __device__ __forceinline__
    KeyValuePair() {}

    /// Constructs the pair from copies of \p key and \p value.
    /// Initializers are listed in declaration order (value, then key).
    __host__ __device__ __forceinline__
    KeyValuePair(Key const& key, Value const& value) : value(value), key(key) {}

    /// True when either the values or the keys differ.
    /// Const-qualified so that const pairs can be compared.
    __host__ __device__ __forceinline__ bool operator !=(const KeyValuePair &b) const
    {
        return (value != b.value) || (key != b.key);
    }
};


// KeyValuePair layout used when the value's AlignBytes alignment is smaller
// than the key's: the key is stored first and explicit tail padding of
// (key alignment - value alignment) bytes is appended.
template <typename K, typename V>
struct KeyValuePair<K, V, false, true>
{
    typedef K Key;
    typedef V Value;

    // Explicit padding sized by the difference of the two alignments
    typedef char Pad[AlignBytes<K>::ALIGN_BYTES - AlignBytes<V>::ALIGN_BYTES];

    Key     key;    // Key has larger would-be alignment and goes first
    Value   value;
    Pad     pad;

    /// Default constructor; leaves all members default-initialized.
    __host__ __device__ __forceinline__
    KeyValuePair() {}

    /// Constructs the pair from copies of \p key and \p value.
    __host__ __device__ __forceinline__
    KeyValuePair(Key const& key, Value const& value) : key(key), value(value) {}

    /// True when either the values or the keys differ.
    /// Const-qualified so that const pairs can be compared.
    __host__ __device__ __forceinline__ bool operator !=(const KeyValuePair &b) const
    {
        return (value != b.value) || (key != b.key);
    }
};


#endif // #if defined(_WIN32) && !defined(_WIN64)


#ifndef DOXYGEN_SHOULD_SKIP_THIS    // Do not document


/**
 * \brief Struct wrapper around a fixed-size C array of \p COUNT elements of
 *        type \p T.
 */
template <typename T, int COUNT>
struct ArrayWrapper
{
    /// The wrapped storage
    T array[COUNT];

    /// Default constructor; the elements are default-initialized.
    __host__ __device__ __forceinline__
    ArrayWrapper()
    {}
};


#endif // DOXYGEN_SHOULD_SKIP_THIS


/**
 * \brief Pair of buffer pointers plus a selector naming the "current" one.
 *
 * \p selector indexes \p d_buffers: Current() returns the selected pointer
 * and Alternate() returns the other one. Both constructors start with
 * selector 0.
 */
template <typename T>
struct DoubleBuffer
{
    /// The two buffer pointers
    T *d_buffers[2];

    /// Index into \p d_buffers of the current buffer
    int selector;

    /// Constructs an empty pair: both pointers NULL, selector 0.
    __host__ __device__ __forceinline__ DoubleBuffer()
        : selector(0)
    {
        d_buffers[0] = NULL;
        d_buffers[1] = NULL;
    }

    /// Constructs from two pointers; \p d_current becomes the current buffer.
    __host__ __device__ __forceinline__ DoubleBuffer(
        T *d_current,
        T *d_alternate)
        : selector(0)
    {
        d_buffers[0] = d_current;
        d_buffers[1] = d_alternate;
    }

    /// Pointer selected by \p selector. Const-qualified: reads state only.
    __host__ __device__ __forceinline__ T* Current() const { return d_buffers[selector]; }

    /// Pointer not selected by \p selector. Const-qualified: reads state only.
    __host__ __device__ __forceinline__ T* Alternate() const { return d_buffers[selector ^ 1]; }

};


/******************************************************************************

 * Typedef-detection

 ******************************************************************************/


// Defines a class template `detector_name<T>` whose VALUE is 1 when T has a
// nested type called `nested_type_name` and 0 otherwise. The char&-returning
// overload of test() is viable only when `typename C::nested_type_name*` is
// well formed; otherwise the variadic int& overload is chosen, and the two
// are told apart by the size of the returned type.
// Every line of the macro body must end in a backslash that is directly
// followed by the next body line; a blank line would end the definition.
#define CUB_DEFINE_DETECT_NESTED_TYPE(detector_name, nested_type_name)  \
    template <typename T>                                               \
    struct detector_name                                                \
    {                                                                   \
        template <typename C>                                           \
        static char& test(typename C::nested_type_name*);               \
        template <typename>                                             \
        static int& test(...);                                          \
        enum                                                            \
        {                                                               \
            VALUE = sizeof(test<T>(0)) < sizeof(int)                    \
        };                                                              \
    };


/******************************************************************************

 * Simple enable-if (similar to Boost)

 ******************************************************************************/


/**
 * \brief Exposes \p T as \p Type only when \p Condition is true.
 *
 * With a false condition the nested \p Type does not exist, which removes
 * the enclosing declaration from consideration during substitution.
 */
template <bool Condition, class T = void>
struct EnableIf
{
    /// Present only for a true condition
    typedef T Type;
};

// False condition: intentionally empty, no nested Type.
template <class T>
struct EnableIf<false, T>
{};


/******************************************************************************

 * Binary-operator index-parameter detection

 ******************************************************************************/


/**
 * \brief Detects whether \p BinaryOp has an <tt>operator()</tt> that returns
 *        \p bool and takes two \p T operands followed by an \p int index.
 *
 * HAS_PARAM is true when <tt>&BinaryOp::operator()</tt> matches one of the
 * four member-function-pointer signatures below (operands by const reference
 * or by value, member function const or non-const). Variants taking an
 * <tt>unsigned int</tt> index are present but commented out, so they are not
 * detected.
 */
template <typename T, typename BinaryOp>
struct BinaryOpHasIdxParam
{
private:
/*
    template <typename BinaryOpT, bool (BinaryOpT::*)(const T &a, const T &b, unsigned int idx) const>  struct SFINAE1 {};
    template <typename BinaryOpT, bool (BinaryOpT::*)(const T &a, const T &b, unsigned int idx)>        struct SFINAE2 {};
    template <typename BinaryOpT, bool (BinaryOpT::*)(T a, T b, unsigned int idx) const>                struct SFINAE3 {};
    template <typename BinaryOpT, bool (BinaryOpT::*)(T a, T b, unsigned int idx)>                      struct SFINAE4 {};
*/
    // Helper templates whose second (non-type) parameter can only be formed
    // from a member function pointer of exactly the listed signature.
    template <typename BinaryOpT, bool (BinaryOpT::*)(const T &a, const T &b, int idx) const>           struct SFINAE5 {};
    template <typename BinaryOpT, bool (BinaryOpT::*)(const T &a, const T &b, int idx)>                 struct SFINAE6 {};
    template <typename BinaryOpT, bool (BinaryOpT::*)(T a, T b, int idx) const>                         struct SFINAE7 {};
    template <typename BinaryOpT, bool (BinaryOpT::*)(T a, T b, int idx)>                               struct SFINAE8 {};
/*
    template <typename BinaryOpT> static char Test(SFINAE1<BinaryOpT, &BinaryOpT::operator()> *);
    template <typename BinaryOpT> static char Test(SFINAE2<BinaryOpT, &BinaryOpT::operator()> *);
    template <typename BinaryOpT> static char Test(SFINAE3<BinaryOpT, &BinaryOpT::operator()> *);
    template <typename BinaryOpT> static char Test(SFINAE4<BinaryOpT, &BinaryOpT::operator()> *);
*/
    // char-returning overloads: each one is viable only when operator() has
    // the signature required by the corresponding helper template.
    // Declared but never defined; they appear only inside sizeof below.
    template <typename BinaryOpT> __host__ __device__ static char Test(SFINAE5<BinaryOpT, &BinaryOpT::operator()> *);
    template <typename BinaryOpT> __host__ __device__ static char Test(SFINAE6<BinaryOpT, &BinaryOpT::operator()> *);
    template <typename BinaryOpT> __host__ __device__ static char Test(SFINAE7<BinaryOpT, &BinaryOpT::operator()> *);
    template <typename BinaryOpT> __host__ __device__ static char Test(SFINAE8<BinaryOpT, &BinaryOpT::operator()> *);

    // Fallback overload selected when none of the signatures above match.
    template <typename BinaryOpT> static int Test(...);

public:

    /// True when the selected Test overload is one of the char-returning ones
    static const bool HAS_PARAM = sizeof(Test<BinaryOp>(NULL)) == sizeof(char);
};


/******************************************************************************

 * Simple type traits utilities.

 *

 * For example:

 *     Traits<int>::CATEGORY             // SIGNED_INTEGER

 *     Traits<NullType>::NULL_TYPE       // true

 *     Traits<uint4>::CATEGORY           // NOT_A_NUMBER

 *     Traits<uint4>::PRIMITIVE;         // false

 *

 ******************************************************************************/


/// Coarse classification of a type, used as the first BaseTraits argument.
enum Category
{
    NOT_A_NUMBER        = 0,    // not a numeric type
    SIGNED_INTEGER      = 1,    // signed integer type
    UNSIGNED_INTEGER    = 2,    // unsigned integer type
    FLOATING_POINT      = 3     // floating-point type
};


/**
 * \brief Generic traits carrier; simply republishes its template arguments.
 *
 * This primary template exposes only CATEGORY, PRIMITIVE and NULL_TYPE; the
 * partial specializations for primitive numeric categories add key-related
 * members.
 */
template <Category _CATEGORY, bool _PRIMITIVE, bool _NULL_TYPE, typename _UnsignedBits, typename T>
struct BaseTraits
{
    /// Category supplied by the instantiator
    static const Category CATEGORY = _CATEGORY;

    enum
    {
        PRIMITIVE = _PRIMITIVE,
        NULL_TYPE = _NULL_TYPE
    };
};


/**
 * \brief Traits for primitive unsigned integer types.
 *
 * \tparam _UnsignedBits  Unsigned integer type holding the key's bits
 * \tparam T              The described type
 */
template <typename _UnsignedBits, typename T>
struct BaseTraits<UNSIGNED_INTEGER, true, false, _UnsignedBits, T>
{
    typedef _UnsignedBits       UnsignedBits;

    static const Category       CATEGORY    = UNSIGNED_INTEGER;
    static const UnsignedBits   LOWEST_KEY  = UnsignedBits(0);      // all bits clear
    static const UnsignedBits   MAX_KEY     = UnsignedBits(-1);     // all bits set

    enum
    {
        PRIMITIVE = true,
        NULL_TYPE = false
    };

    /// Identity: the bits are returned unchanged.
    static __device__ __forceinline__ UnsignedBits TwiddleIn(UnsignedBits key)
    {
        return key;
    }

    /// Identity: the bits are returned unchanged.
    static __device__ __forceinline__ UnsignedBits TwiddleOut(UnsignedBits key)
    {
        return key;
    }

    /// Returns the value of type T whose bit pattern is MAX_KEY.
    static __host__ __device__ __forceinline__ T Max()
    {
        UnsignedBits bits = MAX_KEY;
        return *reinterpret_cast<T*>(&bits);
    }

    /// Returns the value of type T whose bit pattern is LOWEST_KEY.
    static __host__ __device__ __forceinline__ T Lowest()
    {
        UnsignedBits bits = LOWEST_KEY;
        return *reinterpret_cast<T*>(&bits);
    }
};


/**
 * \brief Traits for primitive signed integer types.
 *
 * \tparam _UnsignedBits  Unsigned integer type holding the key's bits
 * \tparam T              The described type
 */
template <typename _UnsignedBits, typename T>
struct BaseTraits<SIGNED_INTEGER, true, false, _UnsignedBits, T>
{
    typedef _UnsignedBits       UnsignedBits;

    static const Category       CATEGORY    = SIGNED_INTEGER;
    static const UnsignedBits   HIGH_BIT    = UnsignedBits(1) << ((sizeof(UnsignedBits) * 8) - 1);  // most significant bit only
    static const UnsignedBits   LOWEST_KEY  = HIGH_BIT;                                             // only the top bit set
    static const UnsignedBits   MAX_KEY     = UnsignedBits(-1) ^ HIGH_BIT;                          // every bit except the top one

    enum
    {
        PRIMITIVE = true,
        NULL_TYPE = false
    };

    /// Flips the most significant bit of \p key.
    static __device__ __forceinline__ UnsignedBits TwiddleIn(UnsignedBits key)
    {
        return key ^ HIGH_BIT;
    }

    /// Flips the most significant bit of \p key (undoes TwiddleIn).
    static __device__ __forceinline__ UnsignedBits TwiddleOut(UnsignedBits key)
    {
        return key ^ HIGH_BIT;
    }

    /// Returns the value of type T whose bit pattern is MAX_KEY.
    static __host__ __device__ __forceinline__ T Max()
    {
        UnsignedBits bits = MAX_KEY;
        return *reinterpret_cast<T*>(&bits);
    }

    /// Returns the value of type T whose bit pattern is LOWEST_KEY.
    static __host__ __device__ __forceinline__ T Lowest()
    {
        UnsignedBits bits = LOWEST_KEY;
        return *reinterpret_cast<T*>(&bits);
    }
};


/// Largest and lowest finite values of a floating-point type.
/// Declared only; each supported type provides an explicit specialization.
template <typename _T>
struct FpLimits;

/// Limits for \p float, taken from FLT_MAX.
template <>
struct FpLimits<float>
{
    static __host__ __device__ __forceinline__ float Max()
    {
        return FLT_MAX;
    }

    static __host__ __device__ __forceinline__ float Lowest()
    {
        return -FLT_MAX;    // sign flip only, so exactly FLT_MAX * -1
    }
};

/// Limits for \p double, taken from DBL_MAX.
template <>
struct FpLimits<double>
{
    static __host__ __device__ __forceinline__ double Max()
    {
        return DBL_MAX;
    }

    static __host__ __device__ __forceinline__ double Lowest()
    {
        return -DBL_MAX;    // sign flip only, so exactly DBL_MAX * -1
    }
};


#if (__CUDACC_VER_MAJOR__ >= 9)

/// Limits for \p __half, produced by reinterpreting fixed 16-bit patterns.
template <>
struct FpLimits<__half>
{
    /// Bit pattern 0x7BFF: sign clear, exponent field 0x1E, mantissa all ones.
    static __host__ __device__ __forceinline__ __half Max()
    {
        unsigned short bits = 0x7BFF;
        return *reinterpret_cast<__half*>(&bits);
    }

    /// Bit pattern 0xFBFF: the same pattern as Max() with the sign bit set.
    static __host__ __device__ __forceinline__ __half Lowest()
    {
        unsigned short bits = 0xFBFF;
        return *reinterpret_cast<__half*>(&bits);
    }
};

#endif


/**
 * \brief Traits for primitive floating-point types.
 *
 * \tparam _UnsignedBits  Unsigned integer type holding the key's bits
 * \tparam T              The described type
 */
template <typename _UnsignedBits, typename T>
struct BaseTraits<FLOATING_POINT, true, false, _UnsignedBits, T>
{
    typedef _UnsignedBits       UnsignedBits;

    static const Category       CATEGORY    = FLOATING_POINT;
    static const UnsignedBits   HIGH_BIT    = UnsignedBits(1) << ((sizeof(UnsignedBits) * 8) - 1);  // most significant bit only
    static const UnsignedBits   LOWEST_KEY  = UnsignedBits(-1);                                     // all bits set
    static const UnsignedBits   MAX_KEY     = UnsignedBits(-1) ^ HIGH_BIT;                          // every bit except the top one

    enum
    {
        PRIMITIVE = true,
        NULL_TYPE = false
    };

    /// Top bit set: flip every bit. Top bit clear: flip only the top bit.
    static __device__ __forceinline__ UnsignedBits TwiddleIn(UnsignedBits key)
    {
        if (key & HIGH_BIT)
        {
            return key ^ UnsignedBits(-1);
        }
        return key ^ HIGH_BIT;
    }

    /// Top bit set: flip only the top bit. Top bit clear: flip every bit.
    /// This undoes TwiddleIn.
    static __device__ __forceinline__ UnsignedBits TwiddleOut(UnsignedBits key)
    {
        if (key & HIGH_BIT)
        {
            return key ^ HIGH_BIT;
        }
        return key ^ UnsignedBits(-1);
    }

    /// Forwards to FpLimits<T>::Max().
    static __host__ __device__ __forceinline__ T Max()
    {
        return FpLimits<T>::Max();
    }

    /// Forwards to FpLimits<T>::Lowest().
    static __host__ __device__ __forceinline__ T Lowest()
    {
        return FpLimits<T>::Lowest();
    }
};


/// Default numeric traits: any type without an explicit specialization is
/// categorized as NOT_A_NUMBER and uses T itself as the bits type.
template <typename T>
struct NumericTraits
    : BaseTraits<NOT_A_NUMBER, false, false, T, T>
{};

/// NullType: also NOT_A_NUMBER, but with the third (boolean) BaseTraits argument set to true.
template <>
struct NumericTraits<NullType>
    : BaseTraits<NOT_A_NUMBER, false, true, NullType, NullType>
{};


/// Plain char: the category follows the platform's signedness of char.
template <>
struct NumericTraits<char>
    : BaseTraits<(std::numeric_limits<char>::is_signed ? SIGNED_INTEGER : UNSIGNED_INTEGER),
                 true, false, unsigned char, char>
{};

/// Signed integer types, each paired with the unsigned type of the same keyword width.
template <>
struct NumericTraits<signed char>
    : BaseTraits<SIGNED_INTEGER, true, false, unsigned char, signed char>
{};

template <>
struct NumericTraits<short>
    : BaseTraits<SIGNED_INTEGER, true, false, unsigned short, short>
{};

template <>
struct NumericTraits<int>
    : BaseTraits<SIGNED_INTEGER, true, false, unsigned int, int>
{};

template <>
struct NumericTraits<long>
    : BaseTraits<SIGNED_INTEGER, true, false, unsigned long, long>
{};

template <>
struct NumericTraits<long long>
    : BaseTraits<SIGNED_INTEGER, true, false, unsigned long long, long long>
{};


/// Unsigned integer types: the bits type is the type itself.
template <>
struct NumericTraits<unsigned char>
    : BaseTraits<UNSIGNED_INTEGER, true, false, unsigned char, unsigned char>
{};

template <>
struct NumericTraits<unsigned short>
    : BaseTraits<UNSIGNED_INTEGER, true, false, unsigned short, unsigned short>
{};

template <>
struct NumericTraits<unsigned int>
    : BaseTraits<UNSIGNED_INTEGER, true, false, unsigned int, unsigned int>
{};

template <>
struct NumericTraits<unsigned long>
    : BaseTraits<UNSIGNED_INTEGER, true, false, unsigned long, unsigned long>
{};

template <>
struct NumericTraits<unsigned long long>
    : BaseTraits<UNSIGNED_INTEGER, true, false, unsigned long long, unsigned long long>
{};


/// float: FLOATING_POINT category, raw bits held in unsigned int.
template <>
struct NumericTraits<float>
    : BaseTraits<FLOATING_POINT, true, false, unsigned int, float>
{};

/// double: FLOATING_POINT category, raw bits held in unsigned long long.
template <>
struct NumericTraits<double>
    : BaseTraits<FLOATING_POINT, true, false, unsigned long long, double>
{};

#if (__CUDACC_VER_MAJOR__ >= 9)

    /// __half: FLOATING_POINT category, raw bits held in unsigned short.
    template <>
    struct NumericTraits<__half>
        : BaseTraits<FLOATING_POINT, true, false, unsigned short, __half>
    {};

#endif


/// bool: treated as an UNSIGNED_INTEGER whose bits type is UnitWord<bool>::VolatileWord.
template <>
struct NumericTraits<bool>
    : BaseTraits<UNSIGNED_INTEGER, true, false, typename UnitWord<bool>::VolatileWord, bool>
{};


/// Type traits for T: the NumericTraits of RemoveQualifiers<T>::Type, so
/// qualified and unqualified forms of a type resolve to the same traits.
template <typename T>
struct Traits
    : NumericTraits<typename RemoveQualifiers<T>::Type>
{};


#endif // DOXYGEN_SHOULD_SKIP_THIS


       // end group UtilModule


}               // CUB namespace

CUB_NS_POSTFIX  // Optional outer namespace(s)

cub::BlockRadixRank
BlockRadixRank provides operations for ranking unsigned integer types within a CUDA thread block.
Definition block_radix_rank.cuh:98

CUB_DEFINE_VECTOR_TYPE
#define CUB_DEFINE_VECTOR_TYPE(base_type, short_type)
Definition util_type.cuh:523

cub::Category
Category
Basic type traits categories.
Definition util_type.cuh:929

cub::MAX_VEC_ELEMENTS
@ MAX_VEC_ELEMENTS
The maximum number of elements in CUDA vector types.
Definition util_type.cuh:461

cub
Optional outer namespace(s)
Definition agent_histogram.cuh:48

cub::int
KeyT const ValueT ValueT OffsetIteratorT OffsetIteratorT int
[in] The number of segments that comprise the sorting data
Definition dispatch_radix_sort.cuh:336

cub::AlignBytes::Pad
Definition util_type.cuh:293

cub::AlignBytes
Structure alignment.
Definition util_type.cuh:291

cub::AlignBytes::Type
T Type
The "truly aligned" type.
Definition util_type.cuh:305

cub::AlignBytes::ALIGN_BYTES
@ ALIGN_BYTES
The "true CUDA" alignment of T in bytes.
Definition util_type.cuh:301

cub::ArrayWrapper
A wrapper for passing simple static arrays as kernel parameters.
Definition util_type.cuh:771

cub::ArrayWrapper::ArrayWrapper
__host__ __device__ __forceinline__ ArrayWrapper()
Constructor.
Definition util_type.cuh:777

cub::BaseTraits
Basic type traits.
Definition util_type.cuh:942

cub::BinaryOpHasIdxParam::SFINAE5
Definition util_type.cuh:888

cub::BinaryOpHasIdxParam::SFINAE6
Definition util_type.cuh:889

cub::BinaryOpHasIdxParam::SFINAE7
Definition util_type.cuh:890

cub::BinaryOpHasIdxParam::SFINAE8
Definition util_type.cuh:891

cub::BinaryOpHasIdxParam
Determine whether or not BinaryOp's functor is of the form bool operator()(const T& a,...
Definition util_type.cuh:880

cub::CubVector< T, 1 >
Definition util_type.cuh:470

cub::CubVector< T, 2 >
Definition util_type.cuh:482

cub::CubVector< T, 3 >
Definition util_type.cuh:495

cub::CubVector< T, 4 >
Definition util_type.cuh:509

cub::CubVector
Exposes a member typedef Type that names the corresponding CUDA vector type if one exists....
Definition util_type.cuh:454

cub::DoubleBuffer
Double-buffer storage wrapper for multi-pass stream transformations that require more than one storag...
Definition util_type.cuh:792

cub::DoubleBuffer::Current
__host__ __device__ __forceinline__ T * Current()
Return pointer to the currently valid buffer.
Definition util_type.cuh:818

cub::DoubleBuffer::DoubleBuffer
__host__ __device__ __forceinline__ DoubleBuffer(T *d_current, T *d_alternate)
Constructor.
Definition util_type.cuh:808

cub::DoubleBuffer::DoubleBuffer
__host__ __device__ __forceinline__ DoubleBuffer()
Constructor.
Definition util_type.cuh:800

cub::DoubleBuffer::selector
int selector
Selector into d_buffers (i.e., the active/valid buffer)
Definition util_type.cuh:797

cub::DoubleBuffer::Alternate
__host__ __device__ __forceinline__ T * Alternate()
Return pointer to the currently invalid buffer.
Definition util_type.cuh:821

cub::EnableIf
Simple enable-if (similar to Boost)
Definition util_type.cuh:860

cub::EnableIf::Type
T Type
Enable-if type for SFINAE dummy variables.
Definition util_type.cuh:862

cub::Equals
Type equality test.
Definition util_type.cuh:99

cub::FpLimits
Definition util_type.cuh:1039

cub::If
Type selection (IF ? ThenType : ElseType)
Definition util_type.cuh:73

cub::If::Type
ThenType Type
Conditional type result.
Definition util_type.cuh:75

cub::Int2Type
Allows for the treatment of an integral constant as a type at compile-time (e.g., to achieve static c...
Definition util_type.cuh:276

cub::IsPointer
Pointer vs. iterator.
Definition util_type.cuh:171

cub::IsVolatile
Volatile modifier test.
Definition util_type.cuh:196

cub::KeyValuePair
A key identifier paired with a corresponding value.
Definition util_type.cuh:667

cub::KeyValuePair::KeyValuePair
__host__ __device__ __forceinline__ KeyValuePair()
Constructor.
Definition util_type.cuh:676

cub::KeyValuePair::Key
_Key Key
Key data type.
Definition util_type.cuh:668

cub::KeyValuePair::value
Value value
Item value.
Definition util_type.cuh:672

cub::KeyValuePair::key
Key key
Item key.
Definition util_type.cuh:671

cub::KeyValuePair::KeyValuePair
__host__ __device__ __forceinline__ KeyValuePair(Key const &key, Value const &value)
Constructor.
Definition util_type.cuh:680

cub::KeyValuePair::Value
_Value Value
Value data type.
Definition util_type.cuh:669

cub::Log2
Statically determine log2(N), rounded up.
Definition util_type.cuh:133

cub::Max
Default max functor.
Definition thread_operators.cuh:124

cub::NullType
A simple "NULL" marker type.
Definition util_type.cuh:257

cub::NumericTraits
Numeric type traits.
Definition util_type.cuh:1127

cub::PowerOfTwo
Statically determine if N is a power-of-two.
Definition util_type.cuh:156

cub::RemoveQualifiers
Removes const and volatile qualifiers from type Tp.
Definition util_type.cuh:223

cub::RemoveQualifiers::Type
Up Type
Type without const and volatile qualifiers.
Definition util_type.cuh:225

cub::Traits
Type traits.
Definition util_type.cuh:1158

cub::Uninitialized
A storage-backing wrapper that allows types with non-trivial constructors to be aliased in unions.
Definition util_type.cuh:635

cub::Uninitialized::storage
DeviceWord storage[WORDS]
Backing storage.
Definition util_type.cuh:645

cub::Uninitialized::Alias
__host__ __device__ __forceinline__ T & Alias()
Alias.
Definition util_type.cuh:648

cub::Uninitialized::DeviceWord
UnitWord< T >::DeviceWord DeviceWord
Biggest memory-access word that T is a whole multiple of and is not larger than the alignment of T.
Definition util_type.cuh:637

cub::UnitWord::IsMultiple
Definition util_type.cuh:358

cub::UnitWord
Unit-words of data movement.
Definition util_type.cuh:351

cub::UnitWord::DeviceWord
If< IsMultiple< longlong2 >::IS_MULTIPLE, ulonglong2, VolatileWord >::Type DeviceWord
Biggest memory-access word that T is a whole multiple of and is not larger than the alignment of T.
Definition util_type.cuh:380

cub::UnitWord::VolatileWord
If< IsMultiple< longlong >::IS_MULTIPLE, unsigned long long, ShuffleWord >::Type VolatileWord
Biggest volatile word that T is a whole multiple of and is not larger than the alignment of T.
Definition util_type.cuh:375

cub::UnitWord::TextureWord
If< IsMultiple< int4 >::IS_MULTIPLE, uint4, typename If< IsMultiple< int2 >::IS_MULTIPLE, uint2, ShuffleWord >::Type >::Type TextureWord
Biggest texture reference word that T is a whole multiple of and is not larger than the alignment of ...
Definition util_type.cuh:387

cub::UnitWord::ShuffleWord
If< IsMultiple< int >::IS_MULTIPLE, unsigned int, typename If< IsMultiple< short >::IS_MULTIPLE, unsigned short, unsigned char >::Type >::Type ShuffleWord
Biggest shuffle word that T is a whole multiple of and is not larger than the alignment of T.
Definition util_type.cuh:370

util_arch.cuh

util_namespace.cuh