doxygen/openfpm_pdata/main__float128_8cpp_source.html

 /*

  * ### WIKI 1 ###

  *

  * ## Simple example

  *

  * In this example we show a 1D PSE approximation of the second derivative

  * of a function, computed in 128-bit floating point (float128), which carries roughly twice the significand precision of double

  *

  * ### WIKI END ###

  *

  */


 #include "config/config.h"

 #include "Vector/vector_dist.hpp"

 #include "Decomposition/CartDecomposition.hpp"

 #include "PSE/Kernels.hpp"

 #include "data_type/aggregate.hpp"

 #include <cmath>


 // This example only works when HAVE_LIBQUADMATH is defined (libquadmath is available)

 #ifdef HAVE_LIBQUADMATH


 #include <boost/multiprecision/float128.hpp>


 // Short alias for the Boost.Multiprecision 128-bit floating point type used throughout this example
 using float128 = boost::multiprecision::float128;


 /*

  * ### WIKI 2 ###

  *

  * Here we define the function x*e^(-x*x) and its

  * second derivative in analytic form

  *

  * 2x*(2*x^2-3)*e^(-x^2)

  *

  */


 // Test function f(x) = x * e^(-x*x), evaluated at a scalar abscissa.
 //
 // \param x point where the function is evaluated
 // \return x * exp(-x*x)
 float128 f_xex2(float128 x)
 {
     // argument of the exponential, -x^2
     const float128 minus_x_squared = -x*x;

     return x*exp(minus_x_squared);
 }


 // Test function f(x) = x * e^(-x*x), evaluated at a 1D point.
 //
 // \param x 1D point; only coordinate 0 is read
 // \return x0 * exp(-x0*x0), where x0 is the coordinate of the point
 float128 f_xex2(Point<1,float128> & x)
 {
     // the single coordinate of the 1D point
     const float128 x0 = x.get(0);

     return x0*exp(-x0*x0);
 }


 // Analytic second derivative of f(x) = x * e^(-x*x), that is
 // f''(x) = 2x * (2x^2 - 3) * e^(-x^2), evaluated at a 1D point.
 //
 // \param x 1D point; only coordinate 0 is read
 // \return the value of f'' at the coordinate of the point
 float128 Lapf_xex2(Point<1,float128> & x)
 {
     // the single coordinate of the 1D point
     const float128 x0 = x.get(0);

     return 2.0*x0*(2.0*x0*x0 - 3.0)*exp(-x0*x0);
 }


 /*

  *

  * ### WIKI END ###

  *

  */


 // Entry point of the float128 PSE example (built only when HAVE_LIBQUADMATH is defined).
 //
 // Places Npart+1 particles on [0.0,4.0], stores f(x) = x*e^(-x*x) on each of them,
 // adds padding particles beyond both ends of the domain, approximates f'' with a
 // second order PSE Laplacian kernel and prints the infinity norm of the error
 // with respect to the analytic second derivative.
 //
 // \param argc number of command line arguments, forwarded to openfpm_init
 // \param argv command line arguments, forwarded to openfpm_init
 int main(int argc, char* argv[])

 {

     //

     // ### WIKI 3 ###

     //

     // Some useful parameters, namely:

     //

     // * Number of particles

     // * Minimum number of padding particles

     // * The computational domain

     // * The spacing

     // * The mollification length

     // * Second order Laplacian kernel in 1D

     //


     // Number of particles (Npart+1 particles are created below, so that both

     // ends of the domain are covered)

     const size_t Npart = 125;


     // Minimum number of padding particles; Npad*spacing is used below as the

     // width of the regions whose particles are replicated outside the domain

     const size_t Npad = 40;


     // The domain

     Box<1,float128> box({0.0},{4.0});


     // Particle spacing: upper bound of the domain divided by Npart

     // (this relies on the domain starting at 0.0)

     float128 spacing = box.getHigh(0) / Npart;


     // Epsilon (mollification length) of the particle kernel: twice the spacing

     const float128 eps = 2*spacing;


     // Laplacian PSE kernel 1 dimension, on float128, second order

     Lap_PSE<1,float128,2> lker(eps);


     //

     // ### WIKI 2 ###

     //

     // Here we initialize the library and we define the ghost size (12*eps)

     // and non-periodic boundary conditions

     //

     openfpm_init(&argc,&argv);

     Vcluster & v_cl = create_vcluster();


     size_t bc[1]={NON_PERIODIC};

     Ghost<1,float128> g(12*eps);


     //

     // ### WIKI 3 ###

     //

     // Here we create a distributed vector defined by the following parameters

     //

     // We create a set of N+1 particles to have a domain fully covered by particles between 0.0 and 4.0.

     // For example, with a spacing of 1.0 you need 4+1 particles to cover the domain

     //

     vector_dist<1,float128, aggregate<float128>, CartDecomposition<1,float128> > vd(Npart+1,box,bc,g);


     //

     // ### WIKI 4 ###

     //

     // We assign the position to the particles, the scalar property is set to

     // the value of the function x*e^(-x*x).

     // Each processor holds part of the particles and fills part of the space, the

     // position is assigned independently from the decomposition.

     //

     // As an illustration, with 1001 particles and 3 processors on the

     // domain from 0.0 to 4.0

     //

     // * processor 0 places particles from 0.0 to 1.332 (334 particles)

     // * processor 1 places particles from 1.336 to 2.668 (334 particles)

     // * processor 2 places particles from 2.672 to 4.0 (333 particles)

     //


     // Returns how many particles the processors with id < rank hold in total;

     // it is used below as the global offset of the local particle index

     size_t base = vd.init_size_accum(Npart+1);

     auto it2 = vd.getIterator();


     while (it2.isNext())

     {

         auto key = it2.get();


         // set the position of the particle: (global index) * spacing

         vd.getPos(key)[0] = (key.getKey() + base) * spacing;

         // set the property of the particle to f evaluated at that same position

         vd.template getProp<0>(key) = f_xex2((key.getKey() + base) * spacing);


         ++it2;

     }


     //

     // ### WIKI 5 ###

     //

     // Once the positions are defined, we distribute the particles across the processors

     // following the decomposition, finally we get the ghost part

     //

     vd.map();

     vd.ghost_get<0>();


     //

     // ### WIKI 6 ###

     //

     // Near the boundary we have two options: either we use one-sided kernels,

     // or we add additional particles. It is required that such particles

     // produce a twice differentiable function. In order to obtain such a

     // result we extend for x < 0.0 and x > 4.0 with the test function x*e^(-x*x).

     //

     // Note that for x < 0.0 such an extension is equivalent to mirroring the

     // particles and changing the sign of the strength (the test function is odd)

     //

     // \verbatim

     //

     // -0.6 -0.5      0.5  0.6   Strength

     //  +----+----*----*----*-

     //          0.0              Position

     //

     //  with * = real particle

     //       + = mirror particle

     //

     // \endverbatim

     //

     //

     Box<1,float128> m_pad({0.0},{0.1});

     Box<1,float128> m_pad2({3.9},{4.0});

     float128 enlarge = 0.1;


     // Widen both padding boxes (and the ghost enlargement) to Npad*spacing

     // when that is larger than the default width of 0.1

     if (Npad * spacing > 0.1)

     {

         m_pad.setHigh(0,Npad * spacing);

         m_pad2.setLow(0,4.0 - Npad*spacing);

         enlarge = Npad * spacing;

     }


     auto it = vd.getDomainIterator();


     // NOTE(review): particles are added to vd while this iterator is in use;

     // presumably the iterator only spans the particles present when it was

     // created - confirm against vector_dist before restructuring this loop

     while (it.isNext())

     {

         auto key = it.get();


         // Particle inside the left padding box: add a particle at -x carrying

         // the property with opposite sign

         // (isInsideNB presumably excludes the border of the box - TODO confirm)

         if (m_pad.isInsideNB(vd.getPos(key)) == true)

         {

             vd.add();

             vd.getLastPos()[0] = - vd.getPos(key)[0];

             vd.template getLastProp<0>() = - vd.template getProp<0>(key);

         }


         // Particle inside the right padding box: add a particle reflected

         // across the upper bound of the domain (2*high - x) and evaluate the

         // test function at the new position

         if (m_pad2.isInsideNB(vd.getPos(key)) == true)

         {

             vd.add();

             vd.getLastPos()[0] = 2.0 * box.getHigh(0) - vd.getPos(key)[0];

             vd.template getLastProp<0>() = f_xex2(vd.getLastPos()[0]);

         }


         ++it;

     }


     //

     // ### WIKI 7 ###

     //

     // We create a CellList with cell spacing 12*eps

     //


     // get and construct the Cell list; the ghost passed here is sized by the

     // width of the padding regions


     Ghost<1,float128> gp(enlarge);

     auto cl = vd.getCellList(12*eps,gp);


     // Maximum of the infinity norm of the error (kept in double)

     double linf = 0.0;


     //

     // ### WIKI 8 ###

     //

     // For each particle we visit its neighborhood

     //

     // This loop is literally the formula of the PSE operator approximation

     //

     // \$ \frac{1}{\epsilon^{2}} h (u_{q} - u_{p}) \eta_{\epsilon}(x_q - x_p) \$

     //

     //


     auto it_p = vd.getDomainIterator();

     while (it_p.isNext())

     {

         // float128 PSE integration accumulator

         float128 pse = 0;


         // key

         vect_dist_key_dx key = it_p.get();


         // Get the position of the particle

         Point<1,float128> p = vd.getPos(key);


         // We are not interested in calculating outside the domain;

         // note that the added padding particles are considered domain particles

         if (p.get(0) < 0.0 || p.get(0) >= 4.0)

         {

             ++it_p;

             continue;

         }


         // Get f(x) at the position of the particle

         float128 prp_x = vd.template getProp<0>(key);


         // Get the neighborhood of the particle

         auto NN = cl.template getNNIterator<NO_CHECK>(cl.getCell(p));

         while(NN.isNext())

         {

             auto nnp = NN.get();


             // Calculate the contribution given by the kernel value at position p,

             // given by the near particle (the particle itself is skipped)

             if (nnp != key.getKey())

             {

                 // W(x-y)

                 float128 ker = lker.value(p,vd.getPos(nnp));


                 // f(y)

                 float128 prp_y = vd.template getProp<0>(nnp);


                 // 1.0/(eps)^2 [f(y)-f(x)]*W(x,y)*V_q, with the spacing as volume V_q

                 float128 prp = 1.0/eps/eps * (prp_y - prp_x) * spacing;

                 pse += prp * ker;

             }


             // Next particle

             ++NN;

         }


         // Here we calculate the L_infinity norm, or the maximum difference

         // between the analytic solution and the value calculated with PSE


         float128 sol = Lapf_xex2(p);


         // keep the largest absolute error seen so far, narrowed to double

         if (fabs(pse - sol) > linf)

             linf = static_cast<double>(fabs(pse - sol));


         ++it_p;

     }


     //

     // ### WIKI 9 ###

     //

     // Calculate the maximum infinity norm across processors and

     // print it

     //


     v_cl.max(linf);

     v_cl.execute();


     // only the processing unit with id 0 prints the result

     if (v_cl.getProcessUnitID() == 0)

         std::cout << "Norm infinity: " << linf << "\n";


     //

     // ### WIKI 10 ###

     //

     // Deinitialize the library

     //

     openfpm_finalize();

 }


 #else


 // Fallback entry point used when HAVE_LIBQUADMATH is not defined:
 // the example cannot run without float128 support, so it does nothing.
 int main(int argc, char* argv[])
 {
     return 0;
 }


 #endif

Vcluster_base::getProcessUnitID
size_t getProcessUnitID()
Get the process unit id.
Definition: VCluster_base.hpp:356

Vcluster_base::execute
void execute()
Execute all the requests.
Definition: VCluster_base.hpp:1054

Box::getHigh
T getHigh(int i) const
get the high interval of the box
Definition: Box.hpp:490

Box::setHigh
void setHigh(int i, T val)
set the high interval of the box
Definition: Box.hpp:467

Point
This class implements the point shape in an N-dimensional space.
Definition: Point.hpp:22

vect_dist_key_dx
Grid key for a distributed grid.
Definition: vector_dist_key.hpp:19

Vcluster_base::max
void max(T &num)
Get the maximum number across all processors (or reduction with infinity norm)
Definition: VCluster_base.hpp:402

Ghost
Definition: Ghost.hpp:39

Lap_PSE
Implementation of the Laplacian kernels for PSE.
Definition: Kernels.hpp:25

Vcluster
Implementation of VCluster class.
Definition: VCluster.hpp:36

CartDecomposition
This class decomposes a space into sub-sub-domains and distributes them across processors.
Definition: CartDecomposition.hpp:132

Point::get
const T & get(size_t i) const
Get coordinate.
Definition: Point.hpp:142

vect_dist_key_dx::getKey
size_t getKey() const
Get the key.
Definition: vector_dist_key.hpp:42

Box
This class represents an N-dimensional box.
Definition: Box.hpp:56

key
This class is a trick to indicate a specific specialization pattern to the compiler. ...
Definition: memory_c.hpp:201

vector_dist
Distributed vector.
Definition: vector_dist.hpp:202