OpenFPM 5.2.0
Project that contains the implementation of distributed structures
cuda_grid_gpu_funcs.cuh
/*
 * cuda_grid_gpu_funcs.cuh
 *
 *  Created on: Aug 20, 2018
 *      Author: i-bird
 */

#ifndef CUDA_GRID_GPU_FUNCS_CUH_
#define CUDA_GRID_GPU_FUNCS_CUH_

#include "config.h"
#include "util/cuda_util.hpp"
#include "map_grid_cuda_ker.cuh"

#if defined(CUDA_GPU) && defined(__NVCC__)

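//! \brief Copy the grid src into dst using one CUDA block per grid element
//!
//! The linear element index is taken from blockIdx.x, so the kernel must be
//! launched with at least one block per grid point; out-of-range blocks return.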
template<unsigned int dim, typename grid_type>
__global__ void copy_ndim_grid_block_device(grid_type src, grid_type dst)
{
    unsigned int i = blockIdx.x;

    if (i >= src.getGrid().size() || i >= dst.getGrid().size())
    {return;}

    auto key_src = src.getGrid().InvLinId(i);

    dst.get_o(key_src) = src.get_o(key_src);
}

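//! \brief Generic n-dimensional copy: one CUDA thread per grid element,
//! addressed by its linear index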
template<unsigned int dim, typename grid_type>
struct copy_ndim_grid_impl
{
    static __device__ void copy(grid_type & src, grid_type & dst)
    {
        unsigned int i = threadIdx.x + blockIdx.x * blockDim.x;

        if (i >= src.getGrid().size() || i >= dst.getGrid().size())
        {return;}

        auto key_src = src.getGrid().InvLinId(i);

        dst.get_o(key_src) = src.get_o(key_src);
    }
};

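//! \brief 2D specialization: one thread per grid point, addressed by a 2D
//! thread/block layout instead of a linear index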
template<typename grid_type>
struct copy_ndim_grid_impl<2,grid_type>
{
    static __device__ void copy(grid_type & src, grid_type & dst)
    {
        grid_key_dx<2> key_src;
        key_src.set_d(0,threadIdx.x + blockIdx.x * blockDim.x);
        key_src.set_d(1,threadIdx.y + blockIdx.y * blockDim.y);

        if (key_src.get(0) >= src.getGrid().size(0)) {return;}
        if (key_src.get(1) >= src.getGrid().size(1)) {return;}

        if (key_src.get(0) >= dst.getGrid().size(0)) {return;}
        if (key_src.get(1) >= dst.getGrid().size(1)) {return;}

        dst.get_o(key_src) = src.get_o(key_src);
    }
};

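//! \brief 3D specialization: one thread per grid point, addressed by a 3D
//! thread/block layout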
template<typename grid_type>
struct copy_ndim_grid_impl<3,grid_type>
{
    static __device__ void copy(grid_type & src, grid_type & dst)
    {
        grid_key_dx<3> key_src;
        key_src.set_d(0,threadIdx.x + blockIdx.x * blockDim.x);
        key_src.set_d(1,threadIdx.y + blockIdx.y * blockDim.y);
        // the third coordinate must come from the z thread/block indices
        key_src.set_d(2,threadIdx.z + blockIdx.z * blockDim.z);

        if (key_src.get(0) >= src.getGrid().size(0)) {return;}
        if (key_src.get(1) >= src.getGrid().size(1)) {return;}
        if (key_src.get(2) >= src.getGrid().size(2)) {return;}

        if (key_src.get(0) >= dst.getGrid().size(0)) {return;}
        if (key_src.get(1) >= dst.getGrid().size(1)) {return;}
        if (key_src.get(2) >= dst.getGrid().size(2)) {return;}

        dst.get_o(key_src) = src.get_o(key_src);
    }
};

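//! \brief Kernel entry point: dispatch to the dimension-specific copy
//! implementation above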
template<unsigned int dim, typename grid_type>
__global__ void copy_ndim_grid_device(grid_type src, grid_type dst)
{
    copy_ndim_grid_impl<dim,grid_type>::copy(src,dst);
}

#endif

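//! \brief Build a device (kernel-usable) view of a host-side grid
//!
//! Primary template, selected for the memory_traits_lin layout, where a single
//! memory buffer holds all properties: the returned base_grid aliases the
//! device pointer of the source grid's buffer; it does not copy the data and
//! does not take ownership of the memory.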
template<bool inte_or_lin, typename base_grid, unsigned int dim, typename T, typename S>
struct grid_toKernelImpl
{
    template<typename grid_type> static base_grid toKernel(grid_type & gc)
    {
        /*grid_gpu_ker<dim,T,memory_traits_lin,typename grid_type::linearizer_type>*/base_grid g(gc.getGrid());
        auto & grid_layout = g.get_data_();

        grid_layout.disable_manage_memory();
        grid_layout.mem = gc.get_internal_data_().mem;
        // Increment the reference of mem
        //grid_layout.mem->incRef();
        grid_layout.mem_r.bind_ref(gc.get_internal_data_().mem_r);
        if (grid_layout.mem)
        {grid_layout.mem_r.set_pointer(((S*)grid_layout.mem)->getDevicePointer());}

        return g;
    }
};

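//! \brief Specialization for the memory_traits_inte layout, where each
//! property has its own memory buffer: the functor below rebinds every
//! property's device memory into the returned base_grid without copying data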
template<typename base_grid, unsigned int dim, typename T, typename S>
struct grid_toKernelImpl<true,base_grid,dim,T,S>
{
    template<typename grid_type> static base_grid toKernel(grid_type & gc)
    {
        /*grid_gpu_ker<dim,T,memory_traits_inte, typename grid_type::linearizer_type>*/ base_grid g(gc.getGrid());
        copy_switch_memory_c_no_cpy<typename std::remove_reference<decltype(gc.get_internal_data_())>::type,
                                    typename std::remove_reference<decltype(g.get_data_())>::type> cp_mc(gc.get_internal_data_(),g.get_data_());

        boost::mpl::for_each_ref< boost::mpl::range_c<int,0,T::max_prop> >(cp_mc);

        return g;
    }
};

#endif /* CUDA_GRID_GPU_FUNCS_CUH_ */
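
As a rough, hypothetical sketch of how these helpers fit together (the fragment below is not part of the header): it copies one 2D grid into another on the GPU with copy_ndim_grid_device. The grid_gpu container, the aggregate property list and the setMemory()/hostToDevice()/toKernel() calls are assumptions drawn from the wider OpenFPM grid API rather than from this file; toKernel() is the point where grid_toKernelImpl builds the device view passed to the kernel.

// Hypothetical usage sketch (assumed OpenFPM grid API, not part of this header)
#include "Grid/map_grid.hpp"

void copy_ndim_grid_example()
{
    size_t sz[2] = {128,128};

    grid_gpu<2,aggregate<float>> src(sz);   // assumed device-backed grid container
    grid_gpu<2,aggregate<float>> dst(sz);
    src.setMemory();
    dst.setMemory();

    // ... fill property 0 of src on the host, then move it to the device
    src.hostToDevice<0>();

    // one thread per grid point; a 2D launch matches the 2D specialization above
    dim3 thr(16,16);
    dim3 blk((sz[0] + thr.x - 1) / thr.x,(sz[1] + thr.y - 1) / thr.y);

    copy_ndim_grid_device<2><<<blk,thr>>>(src.toKernel(),dst.toKernel());
    cudaDeviceSynchronize();
}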