doxygen/openfpm/SparseGrid_26__gray__scott__3d__sparse__gpu__opt__weak__scal_2main_8cu_source.html

#include "Decomposition/Distribution/BoxDistribution.hpp"

#include "Grid/grid_dist_id.hpp"

#include "data_type/aggregate.hpp"

#include "timer.hpp"


#ifdef __NVCC__


// Property index of the U field inside the grid aggregate
constexpr int U = 0;

// Property index of the V field inside the grid aggregate
constexpr int V = 1;


// Property index of the second U slot (used together with U by the conv2 calls in main)
constexpr int U_next = 2;

// Property index of the second V slot (used together with V by the conv2 calls in main)
constexpr int V_next = 3;


// Axis indices (main uses them to index its spacing[] array)
constexpr int x = 0;

constexpr int y = 1;

constexpr int z = 2;


// 3D, float-coordinate Cartesian decomposition on CudaMemory that uses BoxDistribution as distribution
typedef CartDecomposition<3,float, CudaMemory, memory_traits_inte, BoxDistribution<3,float> > Dec;


// 3D distributed sparse GPU grid carrying four float properties per point (U, V, U_next, V_next)
typedef sgrid_dist_id_gpu<3,float,aggregate<float,float,float,float>,CudaMemory, Dec> SparseGridType;


/*! \brief Insert the initial configuration into the sparse grid
 *
 * Three kinds of structures are inserted, in this order:
 *
 * 1. one sphere of radius 0.3 centred at (0.5+i, 0.5+j, 0.5+k) for every
 *    (i,j,k) in [0,div[0]) x [0,div[1]) x [0,div[2])
 * 2. tubes of radius 0.1 running along z, then along y, then along x, one
 *    for every pair of indices of the two transverse axes
 * 3. a seed cube spanning 0.4 .. 0.6 of the per-unit point count on every axis
 *
 * Points of 1. and 2. get U = 1.0, V = 0.0; points of 3. get U = 0.5, V = 0.24.
 *
 * \param grid sparse grid to fill (points are inserted on device and flushed)
 * \param domain simulation domain; only getHigh() is read, to place the seed cube
 * \param div number of spheres/tubes to generate along each axis
 *
 */
void init(SparseGridType & grid, Box<3,float> & domain, size_t (& div)[3])
{
    // Scalars (not an array) because they are captured by value in the device lambdas
    const double spacing_x = grid.spacing(0);
    const double spacing_y = grid.spacing(1);
    const double spacing_z = grid.spacing(2);

    // Host-side view of the same values, indexable by axis
    const double spacing[3] = {spacing_x,spacing_y,spacing_z};

    typedef typename GetAddBlockType<SparseGridType>::type InsertBlockT;

    // Value written into every point inserted by the sphere and tube passes
    auto fill_background = [] __device__ (InsertBlockT & data, int i, int j, int k)
    {
        data.template get<U>() = 1.0;
        data.template get<V>() = 0.0;
    };

    //
    // 1. Spheres
    //
    // NOTE(review): this addPoints overload takes no start/stop keys, so every
    // sphere is tested against the whole grid. The original code computed a
    // bounding box (centre +/- 0.31) here but never passed it to addPoints;
    // restricting the insertion to that box looks like the intent -- confirm
    // the start/stop semantics of addPoints before doing so.
    for (size_t i = 0 ; i < div[0] ; i++)
    {
        for (size_t j = 0 ; j < div[1] ; j++)
        {
            for (size_t k = 0 ; k < div[2] ; k++)
            {
                Point<3,double> p({0.5+i*1.0,0.5+j*1.0,0.5+k*1.0});
                Sphere<3,double> sph(p,0.3);

                grid.addPoints([spacing_x,spacing_y,spacing_z,sph] __device__ (int gi, int gj, int gk)
                        {
                            Point<3,double> pc({gi*spacing_x,gj*spacing_y,gk*spacing_z});

                            // Keep the grid point only if it lies inside the sphere
                            if (sph.isInside(pc) )
                            {return true;}

                            return false;
                        },
                        fill_background
                    );

                grid.template flush<smax_<U>,smax_<V>>(flush_type::FLUSH_ON_DEVICE);
                grid.removeUnusedBuffers();
            }
        }
    }

    //
    // 2. Tubes
    //
    // One pass per tube direction. The passes run for axis = 2, 1, 0 and the
    // lower transverse axis is the outer loop, which reproduces the insertion
    // order of the three hand-written loops this replaces.
    for (int pass = 0 ; pass < 3 ; pass++)
    {
        const int axis = 2 - pass;

        // The two axes orthogonal to the tube direction, in increasing order
        const int a = (axis == 0) ? 1 : 0;
        const int b = (axis == 2) ? 1 : 2;

        for (size_t ia = 0 ; ia < div[a] ; ia++)
        {
            for (size_t ib = 0 ; ib < div[b] ; ib++)
            {
                // u: unit vector along the tube, c: a point on the tube axis
                Point<3,double> u;
                Point<3,double> c;

                for (int s = 0 ; s < 3 ; s++)
                {
                    u.get(s) = (s == axis) ? 1.0 : 0.0;
                    c.get(s) = 0.0;
                }

                c.get(a) = 0.5 + ia;
                c.get(b) = 0.5 + ib;

                // Index box around the tube: 0.4 .. 0.6 (plus cell offset) on
                // the transverse axes, the full grid extent along the tube
                Box<3,size_t> bx;

                bx.setLow(a,(0.4+ia)/spacing[a]);
                bx.setHigh(a,(0.6+ia)/spacing[a]);

                bx.setLow(b,(0.4+ib)/spacing[b]);
                bx.setHigh(b,(0.6+ib)/spacing[b]);

                bx.setLow(axis,0);
                bx.setHigh(axis,(size_t)grid.size(axis));

                grid.addPoints(bx.getKP1(),bx.getKP2(),[spacing_x,spacing_y,spacing_z,u,c] __device__ (int gi, int gj, int gk)
                        {
                            Point<3,double> pc({gi*spacing_x,gj*spacing_y,gk*spacing_z});
                            Point<3,double> vp;

                            // shift so that c becomes the origin
                            pc -= c;

                            // |pc x u| is the distance of the point from the tube axis
                            vp.get(0) = pc.get(1)*u.get(2) - pc.get(2)*u.get(1);
                            vp.get(1) = pc.get(2)*u.get(0) - pc.get(0)*u.get(2);
                            vp.get(2) = pc.get(0)*u.get(1) - pc.get(1)*u.get(0);

                            double distance = vp.norm();

                            // Keep the grid point only if it lies inside the tube
                            if (distance < 0.1 )
                            {return true;}

                            return false;
                        },
                        fill_background
                    );

                grid.template flush<smax_<U>,smax_<V>>(flush_type::FLUSH_ON_DEVICE);
                grid.removeUnusedBuffers();
            }
        }
    }

    //
    // 3. Seed cube
    //
    // Every axis uses its own grid size and its own domain extent. (The z
    // bounds previously used grid.size(1), which misplaced the cube whenever
    // the y and z extents differ.)
    long int x_start = grid.size(0)*0.4f/domain.getHigh(0);
    long int y_start = grid.size(1)*0.4f/domain.getHigh(1);
    long int z_start = grid.size(2)*0.4f/domain.getHigh(2);

    long int x_stop = grid.size(0)*0.6f/domain.getHigh(0);
    long int y_stop = grid.size(1)*0.6f/domain.getHigh(1);
    long int z_stop = grid.size(2)*0.6f/domain.getHigh(2);

    grid_key_dx<3> start({x_start,y_start,z_start});
    grid_key_dx<3> stop ({x_stop,y_stop,z_stop});

    grid.addPoints(start,stop,[] __device__ (int i, int j, int k)
            {
                return true;
            },
            [] __device__ (InsertBlockT & data, int i, int j, int k)
            {
                data.template get<U>() = 0.5;
                data.template get<V>() = 0.24;
            }
        );

    // smin_ on U here, unlike the smax_ used by the sphere and tube flushes
    grid.template flush<smin_<U>,smax_<V>>(flush_type::FLUSH_ON_DEVICE);
}


/*! \brief Entry point of the NVCC build: set up the sparse grid, initialize it and write it out
 *
 * NOTE(review): the function returns right after writing the initial
 * configuration (see the early "return 0" below), so the time-stepping
 * section that follows it is currently unreachable.
 *
 * \param argc number of command line arguments, forwarded to openfpm_init
 * \param argv command line arguments, forwarded to openfpm_init
 *
 * \return 0
 *
 */
int main(int argc, char* argv[])

{

    openfpm_init(&argc,&argv);


    // First we check which type of decomposition BoxDistribution produces

    auto & v_cl = create_vcluster();


    // Prime factors of the number of processors

    openfpm::vector<int> facts;

    getPrimeFactors(v_cl.size(),facts);


    size_t div[3];


    for (int i = 0 ; i < 3 ; i++)

    {div[i] = 1;}


    // Distribute the prime factors round-robin over the three axes, so that
    // div[0]*div[1]*div[2] equals the product of all factors

    for (int i = 0 ; i < facts.size() ; i++)

    {div[i % 3] *= facts.get(i);}


    grid_sm<3,void> gdist(div);


    // domain: div[i] units long on axis i

    Box<3,float> domain({0.0,0.0,0.0},{div[0]*1.0f,div[1]*1.0f,div[2]*1.0f});


    // grid size: 64 points per domain unit on every axis

    size_t sz[3] = {64*div[0],64*div[1],64*div[2]};


    // Define periodicity of the grid

    periodicity<3> bc = {PERIODIC,PERIODIC,PERIODIC};


    // Ghost in grid unit

    Ghost<3,long int> g(1);


    // deltaT

    float deltaT = 0.25;


    // Diffusion constant for specie U

    float du = 2*1e-5;


    // Diffusion constant for specie V

    float dv = 1*1e-5;


    // Number of timesteps

#ifdef TEST_RUN

    size_t timeSteps = 300;

#else

        size_t timeSteps = 15000;

#endif


    // K and F (Physical constant in the equation)

    float K = 0.053;

    float F = 0.014;


    SparseGridType grid(sz,domain,g,bc,0,gdist);


    // spacing of the grid on x, y and z

    float spacing[3] = {grid.spacing(0),grid.spacing(1),grid.spacing(2)};


    init(grid,domain,div);


        // Copy all four properties to the host and write the initial configuration

        grid.deviceToHost<U,V,U_next,V_next>();

        grid.write("final");


    // NOTE(review): early exit. Every statement from here to the end of the
    // function is unreachable; confirm whether this is a debugging leftover.

    openfpm_finalize();

    return 0;


    // sync the ghost

    grid.template ghost_get<U,V>(RUN_ON_DEVICE);


    // because we assume that spacing[x] == spacing[y] we use formula 2

    // and we calculate the prefactor of Eq 2

    float uFactor = deltaT * du/(spacing[x]*spacing[x]);

    float vFactor = deltaT * dv/(spacing[x]*spacing[x]);


    timer tot_sim;

    tot_sim.start();


    for (size_t i = 0; i < timeSteps ; ++i)

    {

        if (v_cl.rank() == 0)

        {std::cout << "STEP: " << i << std::endl;}

/*      if (i % 300 == 0)

        {

            std::cout << "STEP: " << i << std::endl;

            grid.write_frame("out",i,VTK_WRITER);

        }*/


        typedef typename GetCpBlockType<decltype(grid),0,1>::type CpBlockType;


        // Per-point update: the six axis neighbours minus 6 times the centre
        // value scaled by uFactor/vFactor, plus the uc*vc*vc, F and (F+K) terms

        auto func = [uFactor,vFactor,deltaT,F,K] __device__ (float & u_out, float & v_out,

                                                   CpBlockType & u, CpBlockType & v,

                                                   int i, int j, int k){


                float uc = u(i,j,k);

                float vc = v(i,j,k);


                u_out = uc + uFactor *(u(i-1,j,k) + u(i+1,j,k) +

                                                       u(i,j-1,k) + u(i,j+1,k) +

                                                       u(i,j,k-1) + u(i,j,k+1) - 6.0f*uc) - deltaT * uc*vc*vc

                                                       - deltaT * F * (uc - 1.0f);


                v_out = vc + vFactor *(v(i-1,j,k) + v(i+1,j,k) +

                                                       v(i,j+1,k) + v(i,j-1,k) +

                                                       v(i,j,k-1) + v(i,j,k+1) - 6.0f*vc) + deltaT * uc*vc*vc

                                   - deltaT * (F+K) * vc;

                };


        // Even and odd steps swap the roles of (U,V) and (U_next,V_next)
        // NOTE(review): presumably the first two template arguments of conv2 are
        // the inputs and the next two the outputs -- confirm against conv2

        if (i % 2 == 0)

        {

            grid.conv2<U,V,U_next,V_next,1>({0,0,0},{(long int)sz[0]-1,(long int)sz[1]-1,(long int)sz[2]-1},func);


            // After the update we synchronize the ghost part of U_next and V_next


            grid.ghost_get<U_next,V_next>(RUN_ON_DEVICE | SKIP_LABELLING);

        }

        else

        {

            grid.conv2<U_next,V_next,U,V,1>({0,0,0},{(long int)sz[0]-1,(long int)sz[1]-1,(long int)sz[2]-1},func);


            // After the update we synchronize the ghost part of U and V

            grid.ghost_get<U,V>(RUN_ON_DEVICE | SKIP_LABELLING);

        }


        // Every 500 time step we output the configuration for

        // visualization

//      if (i % 500 == 0)

//      {

//          grid.save("output_" + std::to_string(count));

//          count++;

//      }

    }


    tot_sim.stop();

    std::cout << "Total simulation: " << tot_sim.getwct() << std::endl;


    grid.deviceToHost<U,V,U_next,V_next>();

    grid.write("final");


    openfpm_finalize();


}


#else


// Stub entry point used when the file is not compiled with NVCC
// (__NVCC__ undefined): does nothing and returns 0.
int main(int argc, char* argv[])

{

        return 0;

}


#endif


Box
This class represents an N-dimensional box.
Definition Box.hpp:61

Box::setHigh
__device__ __host__ void setHigh(int i, T val)
set the high interval of the box
Definition Box.hpp:544

Box::setLow
__device__ __host__ void setLow(int i, T val)
set the low interval of the box
Definition Box.hpp:533

CartDecomposition
This class decomposes a space into sub-sub-domains and distributes them across processors.
Definition CartDecomposition.hpp:145

CudaMemory
Definition CudaMemory.cuh:59

Ghost
Definition Ghost.hpp:40

Point
This class implements the point shape in an N-dimensional space.
Definition Point.hpp:28

Point::get
__device__ __host__ const T & get(unsigned int i) const
Get coordinate.
Definition Point.hpp:172

Point::norm
__device__ __host__ T norm() const
norm of the vector
Definition Point.hpp:231

Sphere
This class implements the Sphere concept in an N-dimensional space.
Definition Sphere.hpp:24

grid_key_dx
grid_key_dx is the key to access any element in the grid
Definition grid_key.hpp:19

grid_sm
Declaration grid_sm.
Definition grid_sm.hpp:167

grid
Definition grid_test.hpp:219

openfpm::vector
Implementation of 1-D std::vector like structure.
Definition map_vector.hpp:203

openfpm::vector::size
size_t size()
Stub size.
Definition map_vector.hpp:211

timer
Class for cpu time benchmarking.
Definition timer.hpp:28

timer::stop
void stop()
Stop the timer.
Definition timer.hpp:119

timer::start
void start()
Start the timer.
Definition timer.hpp:90

timer::getwct
double getwct()
Return the elapsed real time.
Definition timer.hpp:130

cub::int
KeyT const ValueT ValueT OffsetIteratorT OffsetIteratorT int
[in] The number of segments that comprise the sorting data
Definition dispatch_radix_sort.cuh:336

cub::init
OutputIteratorT OffsetT ReductionOpT OuputT init
< [in] The initial value of the reduction
Definition dispatch_reduce.cuh:119

F
[v_transform metafunction]
Definition variadic_to_vmpl_unit_test.hpp:18

GetCpBlockType
get the type of the block
Definition SparseGridGpu.hpp:162

enc_num
Definition encap_num.hpp:13

periodicity
Boundary conditions.
Definition common.hpp:22

smax_
Definition map_vector_sparse_cuda_kernels.cuh:192