OpenFPM_pdata  4.1.0
Project that contains the implementation of distributed structures
tex_obj_input_iterator.cuh
1 /******************************************************************************
2  * Copyright (c) 2011, Duane Merrill. All rights reserved.
3  * Copyright (c) 2011-2018, NVIDIA CORPORATION. All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions are met:
7  * * Redistributions of source code must retain the above copyright
8  * notice, this list of conditions and the following disclaimer.
9  * * Redistributions in binary form must reproduce the above copyright
10  * notice, this list of conditions and the following disclaimer in the
11  * documentation and/or other materials provided with the distribution.
12  * * Neither the name of the NVIDIA CORPORATION nor the
13  * names of its contributors may be used to endorse or promote products
14  * derived from this software without specific prior written permission.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
17  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
18  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
19  * DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE FOR ANY
20  * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
21  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
22  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
23  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
25  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26  *
27  ******************************************************************************/
28 
34 #pragma once
35 
36 #include <iterator>
37 #include <iostream>
38 
39 #include "../thread/thread_load.cuh"
40 #include "../thread/thread_store.cuh"
41 #include "../util_device.cuh"
42 #include "../util_debug.cuh"
43 #include "../util_namespace.cuh"
44 
45 #if (THRUST_VERSION >= 100700)
46  // This iterator is compatible with Thrust API 1.7 and newer
47  #include <thrust/iterator/iterator_facade.h>
48  #include <thrust/iterator/iterator_traits.h>
49 #endif // THRUST_VERSION
50 
51 
53 CUB_NS_PREFIX
54 
56 namespace cub {
57 
108 template <
109  typename T,
110  typename OffsetT = ptrdiff_t>
111 class TexObjInputIterator
112 {
113 public:
114 
115  // Required iterator traits
116  typedef TexObjInputIterator self_type;
117  typedef OffsetT difference_type;
118  typedef T value_type;
119  typedef T* pointer;
120  typedef T reference;
121 
122 #if (THRUST_VERSION >= 100700)
123  // Use Thrust's iterator categories so we can use these iterators in Thrust 1.7 (or newer) methods
124  typedef typename thrust::detail::iterator_facade_category<
125  thrust::device_system_tag,
126  thrust::random_access_traversal_tag,
127  value_type,
128  reference
129  >::type iterator_category;
130 #else
131  typedef std::random_access_iterator_tag iterator_category;
132 #endif // THRUST_VERSION
133 
134 private:
135 
136  // Largest texture word we can use in device
137  typedef typename UnitWord<T>::TextureWord TextureWord;
138 
139  // Number of texture words per T
140  enum {
141  TEXTURE_MULTIPLE = sizeof(T) / sizeof(TextureWord)
142  };
143 
144 private:
145 
146  T* ptr;
147  difference_type tex_offset;
148  cudaTextureObject_t tex_obj;
149 
150 public:
151 
153  __host__ __device__ __forceinline__ TexObjInputIterator()
154  :
155  ptr(NULL),
156  tex_offset(0),
157  tex_obj(0)
158  {}
159 
161  template <typename QualifiedT>
162  cudaError_t BindTexture(
163  QualifiedT *ptr,
164  size_t bytes = size_t(-1),
165  size_t tex_offset = 0)
166  {
167  this->ptr = const_cast<typename RemoveQualifiers<QualifiedT>::Type *>(ptr);
168  this->tex_offset = tex_offset;
169 
170  cudaChannelFormatDesc channel_desc = cudaCreateChannelDesc<TextureWord>();
171  cudaResourceDesc res_desc;
172  cudaTextureDesc tex_desc;
173  memset(&res_desc, 0, sizeof(cudaResourceDesc));
174  memset(&tex_desc, 0, sizeof(cudaTextureDesc));
175  res_desc.resType = cudaResourceTypeLinear;
176  res_desc.res.linear.devPtr = this->ptr;
177  res_desc.res.linear.desc = channel_desc;
178  res_desc.res.linear.sizeInBytes = bytes;
179  tex_desc.readMode = cudaReadModeElementType;
180  return cudaCreateTextureObject(&tex_obj, &res_desc, &tex_desc, NULL);
181  }
182 
184  cudaError_t UnbindTexture()
185  {
186  return cudaDestroyTextureObject(tex_obj);
187  }
188 
190  __host__ __device__ __forceinline__ self_type operator++(int)
191  {
192  self_type retval = *this;
193  tex_offset++;
194  return retval;
195  }
196 
198  __host__ __device__ __forceinline__ self_type operator++()
199  {
200  tex_offset++;
201  return *this;
202  }
203 
205  __host__ __device__ __forceinline__ reference operator*() const
206  {
207 #if (CUB_PTX_ARCH == 0)
208  // Simply dereference the pointer on the host
209  return ptr[tex_offset];
210 #else
211  // Move array of uninitialized words, then alias and assign to return value
212  TextureWord words[TEXTURE_MULTIPLE];
213 
214  #pragma unroll
215  for (int i = 0; i < TEXTURE_MULTIPLE; ++i)
216  {
217  words[i] = tex1Dfetch<TextureWord>(
218  tex_obj,
219  (tex_offset * TEXTURE_MULTIPLE) + i);
220  }
221 
222  // Load from words
223  return *reinterpret_cast<T*>(words);
224 #endif
225  }
226 
228  template <typename Distance>
229  __host__ __device__ __forceinline__ self_type operator+(Distance n) const
230  {
231  self_type retval;
232  retval.ptr = ptr;
233  retval.tex_obj = tex_obj;
234  retval.tex_offset = tex_offset + n;
235  return retval;
236  }
237 
239  template <typename Distance>
240  __host__ __device__ __forceinline__ self_type& operator+=(Distance n)
241  {
242  tex_offset += n;
243  return *this;
244  }
245 
247  template <typename Distance>
248  __host__ __device__ __forceinline__ self_type operator-(Distance n) const
249  {
250  self_type retval;
251  retval.ptr = ptr;
252  retval.tex_obj = tex_obj;
253  retval.tex_offset = tex_offset - n;
254  return retval;
255  }
256 
258  template <typename Distance>
259  __host__ __device__ __forceinline__ self_type& operator-=(Distance n)
260  {
261  tex_offset -= n;
262  return *this;
263  }
264 
266  __host__ __device__ __forceinline__ difference_type operator-(self_type other) const
267  {
268  return tex_offset - other.tex_offset;
269  }
270 
272  template <typename Distance>
273  __host__ __device__ __forceinline__ reference operator[](Distance n) const
274  {
275  self_type offset = (*this) + n;
276  return *offset;
277  }
278 
280  __host__ __device__ __forceinline__ pointer operator->()
281  {
282  return &(*(*this));
283  }
284 
286  __host__ __device__ __forceinline__ bool operator==(const self_type& rhs)
287  {
288  return ((ptr == rhs.ptr) && (tex_offset == rhs.tex_offset) && (tex_obj == rhs.tex_obj));
289  }
290 
292  __host__ __device__ __forceinline__ bool operator!=(const self_type& rhs)
293  {
294  return ((ptr != rhs.ptr) || (tex_offset != rhs.tex_offset) || (tex_obj != rhs.tex_obj));
295  }
296 
298  friend std::ostream& operator<<(std::ostream& os, const self_type& itr)
299  {
300  return os;
301  }
302 
303 };
304 
305 
306  // end group UtilIterator
308 
309 } // CUB namespace
310 CUB_NS_POSTFIX // Optional outer namespace(s)
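
A minimal usage sketch, not part of the original header: it assumes the bundled CUB headers are reachable on the include path and uses illustrative names (copy_through_texture, d_in, d_out). It shows the typical lifecycle: bind the texture on the host, read through the iterator in device code, then unbind.

#include <cub/iterator/tex_obj_input_iterator.cuh>
#include <cuda_runtime.h>

// Hypothetical kernel: copy num_items floats out through the texture-backed iterator.
__global__ void copy_through_texture(cub::TexObjInputIterator<float> in,
                                     float *out, int num_items)
{
    int i = blockIdx.x * blockDim.x + threadIdx.x;
    if (i < num_items)
        out[i] = in[i];   // operator[] fetches via tex1Dfetch on the device
}

int main()
{
    const int num_items = 1024;
    float *d_in = NULL, *d_out = NULL;
    cudaMalloc(&d_in,  num_items * sizeof(float));
    cudaMalloc(&d_out, num_items * sizeof(float));

    cub::TexObjInputIterator<float> itr;
    itr.BindTexture(d_in, num_items * sizeof(float));   // creates the cudaTextureObject_t

    copy_through_texture<<<(num_items + 255) / 256, 256>>>(itr, d_out, num_items);
    cudaDeviceSynchronize();

    itr.UnbindTexture();                                 // destroys the texture object
    cudaFree(d_in);
    cudaFree(d_out);
    return 0;
}

BindTexture and UnbindTexture are host-side calls (they create and destroy a cudaTextureObject_t), while the dereference operators work in both host and device code.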
Member documentation for cub::TexObjInputIterator:

A random-access input wrapper for dereferencing array values through texture cache.

TexObjInputIterator self_type
My own type.

OffsetT difference_type
Type to express the result of subtracting one iterator from another.

T value_type
The type of the element the iterator can point to.

T * pointer
The type of a pointer to an element the iterator can point to.

T reference
The type of a reference to an element the iterator can point to.

std::random_access_iterator_tag iterator_category
The iterator category.

__host__ __device__ __forceinline__ TexObjInputIterator()
Constructor.

cudaError_t BindTexture(QualifiedT *ptr, size_t bytes=size_t(-1), size_t tex_offset=0)
Use this iterator to bind ptr with a texture reference.

cudaError_t UnbindTexture()
Unbind this iterator from its texture reference.

__host__ __device__ __forceinline__ reference operator*() const
Indirection.

__host__ __device__ __forceinline__ self_type operator++(int)
Postfix increment.

__host__ __device__ __forceinline__ self_type operator++()
Prefix increment.

__host__ __device__ __forceinline__ self_type operator+(Distance n) const
Addition.

__host__ __device__ __forceinline__ self_type & operator+=(Distance n)
Addition assignment.

__host__ __device__ __forceinline__ self_type operator-(Distance n) const
Subtraction.

__host__ __device__ __forceinline__ self_type & operator-=(Distance n)
Subtraction assignment.

__host__ __device__ __forceinline__ difference_type operator-(self_type other) const
Distance.

__host__ __device__ __forceinline__ reference operator[](Distance n) const
Array subscript.

__host__ __device__ __forceinline__ pointer operator->()
Structure dereference.

__host__ __device__ __forceinline__ bool operator==(const self_type &rhs)
Equal to.

__host__ __device__ __forceinline__ bool operator!=(const self_type &rhs)
Not equal to.

friend std::ostream & operator<<(std::ostream &os, const self_type &itr)
ostream operator.
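
Because the iterator exposes the random-access traits listed above, it can also be handed directly to device-wide CUB algorithms. The sketch below is illustrative rather than taken from the file: it assumes <cub/cub.cuh> is available and that d_in already holds num_items integers, and it sums them through the texture path with cub::DeviceReduce::Sum using the usual two-phase temporary-storage pattern.

#include <cub/cub.cuh>
#include <cuda_runtime.h>

// Illustrative helper: reduce num_items ints read through the texture cache.
cudaError_t sum_through_texture(int *d_in, int *d_sum, int num_items)
{
    cub::TexObjInputIterator<int> itr;
    cudaError_t error = itr.BindTexture(d_in, num_items * sizeof(int));
    if (error != cudaSuccess) return error;

    // First call sizes the temporary storage, second call runs the reduction.
    void  *d_temp_storage = NULL;
    size_t temp_storage_bytes = 0;
    cub::DeviceReduce::Sum(d_temp_storage, temp_storage_bytes, itr, d_sum, num_items);
    cudaMalloc(&d_temp_storage, temp_storage_bytes);
    cub::DeviceReduce::Sum(d_temp_storage, temp_storage_bytes, itr, d_sum, num_items);

    cudaFree(d_temp_storage);
    return itr.UnbindTexture();
}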