doxygen/openfpm/Domain__icells__cart_8hpp_source.html

/*

 * Domain_icells_cart.hpp

 *

 *  Created on: Apr 27, 2019

 *      Author: i-bird

 */


#ifndef DOMAIN_ICELLS_CART_HPP_

#define DOMAIN_ICELLS_CART_HPP_


#include "Vector/map_vector.hpp"

#include "Space/Ghost.hpp"

#include "NN/CellList/CellList.hpp"

#include "NN/CellList/cuda/CellDecomposer_gpu_ker.cuh"

#include "Vector/map_vector_sparse.hpp"

#include <iomanip>


#ifdef __NVCC__


/*! \brief Insert into a sparse vector the linearized id of the cells in the range [start,stop]
 *
 * Every thread obtains a grid point from grid_p<dim>::get_grid_point(), shifts it
 * by start and, if the shifted point does not exceed stop in any dimension,
 * linearizes it with cld.LinId() and passes the id to vs.insert_b() together with
 * the linear index of its block.
 *
 * The block index is linearized over the x, y and z dimensions of the launch grid.
 * NOTE(review): presumably the host has to size the insert buffer of vs for the
 * number of blocks of the launch before calling this kernel - confirm against caller.
 *
 * \tparam dim dimensionality of the grid key
 * \tparam vector_sparse_type kernel-side sparse vector (uses init, insert_b, flush_block_insert)
 * \tparam CellDecomposer_type cell decomposer (uses get_div_c and LinId)
 *
 * \param vs sparse vector that receives the cell ids
 * \param cld cell decomposer used to get the grid point and to linearize it
 * \param start offset added to the grid point of each thread
 * \param stop last grid point (inclusive) that is inserted
 *
 */
template<unsigned int dim, typename vector_sparse_type, typename CellDecomposer_type>
__global__ void insert_icell(vector_sparse_type vs, CellDecomposer_type cld, grid_key_dx<dim,int> start,grid_key_dx<dim,int> stop)
{
    vs.init();

    auto gk = grid_p<dim>::get_grid_point(cld.get_div_c());

    // Linear index of this block inside the launch grid
    unsigned int b = blockIdx.x + blockIdx.y * gridDim.x + blockIdx.z * gridDim.x * gridDim.y;

    // Shift the point by start and check that it does not go past stop
    bool out = false;
    for (unsigned int i = 0 ; i < dim ; i++)
    {
        gk.set_d(i,gk.get(i) + start.get(i));
        if (gk.get(i) > stop.get(i))
        {out = true;}
    }

    if (out == false)
    {
        auto id = cld.LinId(gk);

        vs.insert_b(id,b);
    }

    // Logical && (not bitwise &) to combine the three comparisons: only the
    // thread (0,0,0) of the block passes true as flush flag.
    const bool is_first_thread = threadIdx.x == 0 && threadIdx.y == 0 && threadIdx.z == 0;

    // Called by every thread of the block, including the ones that are out of range
    vs.flush_block_insert(b, is_first_thread);
}


/*! \brief Insert the cells in the range [start,stop] into one sparse vector and remove them from another
 *
 * Every thread obtains a grid point from grid_p<dim>::get_grid_point(), shifts it
 * by start and, if the shifted point does not exceed stop in any dimension,
 * linearizes it with cld.LinId(). The id is passed to vs.insert_b() and to
 * vsi.remove_b() together with the linear index of the block.
 *
 * The block index is linearized over the x, y and z dimensions of the launch grid.
 * NOTE(review): presumably the host has to size the insert buffer of vs and the
 * remove buffer of vsi for the number of blocks of the launch - confirm against caller.
 *
 * \tparam dim dimensionality of the grid key
 * \tparam vector_sparse_type kernel-side sparse vector (uses init, insert_b, remove_b,
 *         flush_block_insert, flush_block_remove)
 * \tparam CellDecomposer_type cell decomposer (uses get_div_c and LinId)
 *
 * \param vs sparse vector that receives the cell ids
 * \param vsi sparse vector from which the same cell ids are removed
 * \param cld cell decomposer used to get the grid point and to linearize it
 * \param start offset added to the grid point of each thread
 * \param stop last grid point (inclusive) that is processed
 *
 */
template<unsigned int dim, typename vector_sparse_type, typename CellDecomposer_type>
__global__ void insert_remove_icell(vector_sparse_type vs, vector_sparse_type vsi, CellDecomposer_type cld, grid_key_dx<dim,int> start,grid_key_dx<dim,int> stop)
{
    vs.init();
    vsi.init();

    auto gk = grid_p<dim>::get_grid_point(cld.get_div_c());

    // Linear index of this block inside the launch grid
    unsigned int b = blockIdx.x + blockIdx.y * gridDim.x + blockIdx.z * gridDim.x * gridDim.y;

    // Shift the point by start and check that it does not go past stop
    bool out = false;
    for (unsigned int i = 0 ; i < dim ; i++)
    {
        gk.set_d(i,gk.get(i) + start.get(i));
        if (gk.get(i) > stop.get(i))
        {out = true;}
    }

    if (out == false)
    {
        auto id = cld.LinId(gk);

        vs.insert_b(id,b);
        vsi.remove_b(id,b);
    }

    // Logical && (not bitwise &) to combine the three comparisons, evaluated once
    // and shared by both flushes: only the thread (0,0,0) of the block passes true.
    const bool is_first_thread = threadIdx.x == 0 && threadIdx.y == 0 && threadIdx.z == 0;

    // Both flushes are called by every thread of the block, including the ones out of range
    vs.flush_block_insert(b, is_first_thread);
    vsi.flush_block_remove(b, is_first_thread);
}


/*! \brief Primary template of the internal cells calculation: it does nothing
 *
 * This is the implementation selected for any value of is_gpu that does not have
 * a dedicated specialization. CalculateInternalCells() has an empty body, so none
 * of its arguments is read or modified.
 *
 * \tparam dim dimensionality of the space
 * \tparam T type of the space coordinates
 * \tparam layout_base memory layout of the vectors
 * \tparam Memory memory type of the vectors
 * \tparam cnt_type counter type (unused here)
 * \tparam ids_type type of the cell ids stored in icells and dcells
 * \tparam is_gpu selector used to pick a specialization
 *
 */
template<unsigned int dim,
         typename T,
         template<typename> class layout_base,
         typename Memory,
         typename cnt_type,
         typename ids_type,
         bool is_gpu>
struct CalculateInternalCells_impl
{
    /*! \brief No-op version of the calculation
     *
     * All the parameters are accepted only to keep the same signature of the
     * specializations; the function returns immediately.
     *
     */
    template<typename VCluster_type>
    static void CalculateInternalCells(
            VCluster_type & v_cl,
            openfpm::vector<Box<dim,T>,Memory,layout_base> & ig_box,
            openfpm::vector<SpaceBox<dim,T>,Memory,layout_base> & domain,
            Box<dim,T> & pbox,
            T r_cut,
            const Ghost<dim,T> & enlarge,
            CellDecomposer_sm<dim,T,shift<dim,T>> & cd,
            openfpm::vector<aggregate<ids_type>,Memory,layout_base> & icells,
            openfpm::vector<aggregate<ids_type>,Memory,layout_base> & dcells)
    {
        // nothing to do
    }
};


/*! \brief Specialization of the internal cells calculation for is_gpu = true
 *
 * NOTE: the whole body of CalculateInternalCells() is enclosed in #if 0 / #endif,
 * so it is removed by the preprocessor: at the moment this specialization does
 * nothing and leaves icells and dcells untouched.
 *
 * The disabled code builds a cell decomposition of pbox, inserts the cells covered
 * by the boxes in domain into a sparse vector (vsi), then for each box in ig_box
 * inserts the covered cells into a second sparse vector (vs) and removes them from
 * vsi. Finally the index vector of vs is swapped into icells and the one of vsi
 * into dcells.
 *
 */
template<unsigned int dim, typename T, template<typename> class layout_base , typename Memory, typename cnt_type, typename ids_type>

struct CalculateInternalCells_impl<dim,T,layout_base,Memory,cnt_type,ids_type,true>

{

    /*! \brief Calculate the cell lists icells and dcells (currently disabled, see the note on the struct)
     *
     * \param v_cl object that provides the gpu context (getgpuContext())
     * \param ig_box boxes whose cells are inserted into icells and removed from dcells
     * \param domain boxes whose cells are inserted into dcells
     * \param pbox box used to construct the cell decomposition
     * \param r_cut passed to cl_param_calculate to compute the number of divisions
     * \param enlarge passed to cl_param_calculate to compute the number of divisions
     * \param cd cell decomposer, its dimensions are set from pbox and the calculated divisions
     * \param icells output, swapped with the index vector of vs
     * \param dcells output, swapped with the index vector of vsi
     *
     */
    template<typename VCluster_type>

    static void CalculateInternalCells(VCluster_type & v_cl,

            openfpm::vector<Box<dim,T>,Memory,layout_base> & ig_box,

            openfpm::vector<SpaceBox<dim,T>,Memory,layout_base> & domain,

            Box<dim,T> & pbox,

            T r_cut,

            const Ghost<dim,T> & enlarge,

            CellDecomposer_sm<dim,T,shift<dim,T>> & cd,

            openfpm::vector<aggregate<ids_type>,Memory,layout_base> & icells,

            openfpm::vector<aggregate<ids_type>,Memory,layout_base> & dcells)

    {

// Everything up to the matching #endif is compiled out
#if 0


        // Division array

        size_t div[dim];


        // Calculate the parameters of the cell-list


        cl_param_calculate(pbox, div, r_cut, enlarge);


        openfpm::array<T,dim,cnt_type> spacing_c;

        openfpm::array<ids_type,dim,cnt_type> div_c;

        openfpm::array<ids_type,dim,cnt_type> off;


        for (size_t i = 0 ; i < dim ; i++)

        {

            spacing_c[i] = (pbox.getHigh(i) - pbox.getLow(i)) / div[i];

            off[i] = 1;

            // div_c must include offset

            div_c[i] = div[i] + 2*off[i];


        }


        shift_only<dim,T> t(Matrix<dim,T>::identity(),pbox.getP1());


        CellDecomposer_gpu_ker<dim,T,cnt_type,ids_type,shift_only<dim,T>> cld(spacing_c,div_c,off,t);

        grid_sm<dim,void> g = cld.getGrid();

        cd.setDimensions(pbox,div,off[0]);


        // vs collects the cells of the ig_box boxes, vsi the cells of the domain boxes
        openfpm::vector_sparse_gpu<aggregate<unsigned int>> vs;

        openfpm::vector_sparse_gpu<aggregate<unsigned int>> vsi;


        vs.template setBackground<0>(0);


        // insert Domain cells


        for (size_t i = 0 ; i < domain.size() ; i++)

        {

            Box<dim,T> bx = SpaceBox<dim,T>(domain.get(i));


            auto pp2 = bx.getP2();


            // move every coordinate of P2 to the previous representable value
            for (size_t j = 0 ; j < dim ; j++)

            {pp2.get(j) = std::nextafter(pp2.get(j),pp2.get(j) - static_cast<T>(1.0));}


            auto p1 = cld.getCell(bx.getP1());

            auto p2 = cld.getCell(pp2);


            auto ite = g.getGPUIterator(p1,p2,256);


            // skip the launch when the iterator has no blocks along x
            if (ite.wthr.x == 0)

            {continue;}


            vsi.setGPUInsertBuffer(ite.nblocks(),256);


            CUDA_LAUNCH((insert_icell<dim>),ite,vsi.toKernel(),cld,ite.start,p2);


            vsi.template flush<>(v_cl.getgpuContext(),flush_type::FLUSH_ON_DEVICE);

        }


        // for each box in ig_box insert its cells into vs and remove them from vsi


        for (size_t i = 0 ; i < ig_box.size() ; i++)

        {

            Box<dim,T> bx = ig_box.get(i);


            auto pp2 = bx.getP2();


            // move every coordinate of P2 to the previous representable value
            for (size_t j = 0 ; j < dim ; j++)

            {pp2.get(j) = std::nextafter(pp2.get(j),pp2.get(j) - static_cast<T>(1.0));}


            auto p1 = cld.getCell(bx.getP1());

            auto p2 = cld.getCell(pp2);


            auto ite = g.getGPUIterator(p1,p2,256);


            // skip the launch when the iterator has no blocks along x
            if (ite.wthr.x == 0)

            {continue;}


            vs.setGPUInsertBuffer(ite.nblocks(),256);

            vsi.setGPURemoveBuffer(ite.nblocks(),256);


            CUDA_LAUNCH(insert_remove_icell<dim>,ite,vs.toKernel(),vsi.toKernel(),cld,ite.start,p2);


            vs.template flush<>(v_cl.getgpuContext(),flush_type::FLUSH_ON_DEVICE);

            vsi.flush_remove(v_cl.getgpuContext(),flush_type::FLUSH_ON_DEVICE);

        }


        // hand the collected cell ids over to the output vectors
        vs.swapIndexVector(icells);

        vsi.swapIndexVector(dcells);


#endif

    }

};


#endif


/*! \brief Holds two lists of cell ids (icells and dcells) and the cell decomposition they refer to
 *
 * The lists are filled by CalculateInternalCells(), which forwards to
 * CalculateInternalCells_impl, and can be read back with getIcells() and getDcells().
 *
 * \tparam dim dimensionality of the space
 * \tparam T type of the space coordinates
 * \tparam layout_base memory layout of the vectors
 * \tparam Memory memory type of the vectors
 *
 */
template<unsigned int dim, typename T, template<typename> class layout_base , typename Memory>
class domain_icell_calculator
{
    //! counter type forwarded to the implementation
    typedef unsigned int cnt_type;

    //! type of the cell ids
    typedef int ids_type;

    //! list of cell ids returned by getIcells()
    openfpm::vector<aggregate<ids_type>,Memory,layout_base> icells;

    //! list of cell ids returned by getDcells()
    openfpm::vector<aggregate<ids_type>,Memory,layout_base> dcells;

    //! cell decomposition used by getBoxCell() and getGrid()
    CellDecomposer_sm<dim,T,shift<dim,T>> cd;

    public:

    /*! \brief Calculate the subdomains that are in the skin part of the domain
     *
     * The call is forwarded to CalculateInternalCells_impl, selecting the GPU
     * specialization when Memory is CudaMemory.
     *
     * NOTE: when the file is not compiled with NVCC (__NVCC__ not defined) this
     * function does nothing.
     *
     * \param v_cl forwarded to the implementation
     * \param ig_box forwarded to the implementation
     * \param domain forwarded to the implementation
     * \param pbox forwarded to the implementation
     * \param r_cut forwarded to the implementation
     * \param enlarge forwarded to the implementation
     *
     */
    template<typename VCluster_type>
    void CalculateInternalCells(VCluster_type & v_cl,
                                openfpm::vector<Box<dim,T>,Memory,layout_base> & ig_box,
                                openfpm::vector<SpaceBox<dim,T>,Memory,layout_base> & domain,
                                Box<dim,T> & pbox,
                                T r_cut,
                                const Ghost<dim,T> & enlarge)
    {
#ifdef __NVCC__
        CalculateInternalCells_impl<dim,T,layout_base,Memory,cnt_type,ids_type,std::is_same<Memory,CudaMemory>::value>::CalculateInternalCells(v_cl,ig_box,domain,pbox,r_cut,enlarge,cd,icells,dcells);
#endif
    }

    /*! \brief Return the icells list
     *
     * \return a reference to the internal icells vector
     *
     */
    openfpm::vector<aggregate<ids_type>,Memory,layout_base> & getIcells()
    {
        return icells;
    }

    /*! \brief Return the dcells list
     *
     * \return a reference to the internal dcells vector
     *
     */
    openfpm::vector<aggregate<ids_type>,Memory,layout_base> & getDcells()
    {
        return dcells;
    }

    /*! \brief Given a cell index return the cell box
     *
     * Along each dimension i the box starts at
     * origin(i) - padding(i)*cell_size(i) + key(i)*cell_size(i)
     * and is one cell_size(i) long, where key is the multi-index obtained from
     * ci with InvLinId and cell_size(i) is getCellBox().getHigh(i).
     *
     * \param ci linearized cell index
     *
     * \return the box of the cell
     *
     */
    Box<dim,T> getBoxCell(unsigned int ci)
    {
        Box<dim,T> b;

        // The multi-index of the cell is the same for every dimension: compute it once
        const auto key = cd.getGrid().InvLinId(ci);

        for (size_t i = 0 ; i < dim ; i++)
        {
            const auto cell_len = cd.getCellBox().getHigh(i);

            // Start of the padded grid along i (a scalar is enough, no need for a full Point)
            const T low_i = cd.getOrig().get(i) - cd.getPadding(i)*cell_len;

            b.setLow(i,low_i + key.get(i)*cell_len);
            b.setHigh(i,low_i + ((key.get(i) + 1)*cell_len));
        }

        return b;
    }

    /*! \brief Get the grid base information about this cell decomposition
     *
     * \return the grid of the internal cell decomposer
     *
     */
    const grid_sm<dim,void> & getGrid()
    {
        return cd.getGrid();
    }
};


#endif /* DOMAIN_ICELLS_CART_HPP_ */

Box
This class represents an N-dimensional box.
Definition Box.hpp:61

Box::getP2
Point< dim, T > getP2() const
Get the point p2.
Definition Box.hpp:722

Box::getLow
__device__ __host__ T getLow(int i) const
Get the i-th coordinate of the lower bound of the box.
Definition Box.hpp:556

Box::getHigh
__device__ __host__ T getHigh(int i) const
get the high interval of the box
Definition Box.hpp:567

Box::getP1
Point< dim, T > getP1() const
Get the point p1.
Definition Box.hpp:708

CellDecomposer_gpu_ker
Definition CellDecomposer_gpu_ker.cuh:19

Ghost
Definition Ghost.hpp:40

Matrix
This class implements an NxN (dense) matrix.
Definition Matrix.hpp:33

Point
This class implements the point shape in an N-dimensional space.
Definition Point.hpp:28

Point::get
__device__ __host__ const T & get(unsigned int i) const
Get coordinate.
Definition Point.hpp:172

SpaceBox
This class represents an N-dimensional box.
Definition SpaceBox.hpp:27

domain_icell_calculator
Definition Domain_icells_cart.hpp:209

domain_icell_calculator::getIcells
openfpm::vector< aggregate< ids_type >, Memory, layout_base > & getIcells()
Return the list of the internal cells.
Definition Domain_icells_cart.hpp:274

domain_icell_calculator::CalculateInternalCells
void CalculateInternalCells(VCluster_type &v_cl, openfpm::vector< Box< dim, T >, Memory, layout_base > &ig_box, openfpm::vector< SpaceBox< dim, T >, Memory, layout_base > &domain, Box< dim, T > &pbox, T r_cut, const Ghost< dim, T > &enlarge)
Calculate the subdomains that are in the skin part of the domain.
Definition Domain_icells_cart.hpp:257

domain_icell_calculator::getBoxCell
Box< dim, T > getBoxCell(unsigned int ci)
Given a cell index return the cell box.
Definition Domain_icells_cart.hpp:295

domain_icell_calculator::getDcells
openfpm::vector< aggregate< ids_type >, Memory, layout_base > & getDcells()
Return the list of the domain cells (the dcells vector).
Definition Domain_icells_cart.hpp:284

domain_icell_calculator::getGrid
const grid_sm< dim, void > & getGrid()
Get the grid base information about this cell decomposition.
Definition Domain_icells_cart.hpp:317

grid_key_dx
grid_key_dx is the key to access any element in the grid
Definition grid_key.hpp:19

grid_key_dx::get
__device__ __host__ index_type get(index_type i) const
Get the i index.
Definition grid_key.hpp:503

grid_sm
Declaration grid_sm.
Definition grid_sm.hpp:167

grid_sm::setDimensions
void setDimensions(const size_t(&dims)[N])
Reset the dimension of the grid.
Definition grid_sm.hpp:326

openfpm::array
Definition array_openfpm.hpp:38

openfpm::vector_sparse
Definition map_vector_sparse.hpp:789

openfpm::vector_sparse::flush_remove
void flush_remove(gpu::ofp_context_t &context, flush_type opt=FLUSH_ON_HOST)
merge the added element to the main data array
Definition map_vector_sparse.hpp:1811

openfpm::vector_sparse::setGPURemoveBuffer
void setGPURemoveBuffer(int nblock, int nslot)
set the gpu remove buffer for every block
Definition map_vector_sparse.hpp:1935

openfpm::vector_sparse::toKernel
vector_sparse_gpu_ker< T, Ti, layout_base > toKernel()
toKernel function transform this structure into one that can be used on GPU
Definition map_vector_sparse.hpp:1873

openfpm::vector_sparse::setGPUInsertBuffer
void setGPUInsertBuffer(int nblock, int nslot)
set the gpu insert buffer for every block
Definition map_vector_sparse.hpp:1892

openfpm::vector_sparse::swapIndexVector
void swapIndexVector(vector< aggregate< Ti >, Memory, layout_base, grow_p > &iv)
Definition map_vector_sparse.hpp:1613

openfpm::vector
Implementation of 1-D std::vector like structure.
Definition map_vector.hpp:203

shift_only
Definition CellDecomposer.hpp:150

shift
Definition CellDecomposer.hpp:27

aggregate
Aggregate of properties: from a list of objects it creates a struct that follows the OPENFPM native stru...
Definition aggregate.hpp:215