html/dox/dp3m_8cpp_source.html

/*

 * Copyright (C) 2010-2022 The ESPResSo project

 * Copyright (C) 2002,2003,2004,2005,2006,2007,2008,2009,2010

 *   Max-Planck-Institute for Polymer Research, Theory Group

 *

 * This file is part of ESPResSo.

 *

 * ESPResSo is free software: you can redistribute it and/or modify

 * it under the terms of the GNU General Public License as published by

 * the Free Software Foundation, either version 3 of the License, or

 * (at your option) any later version.

 *

 * ESPResSo is distributed in the hope that it will be useful,

 * but WITHOUT ANY WARRANTY; without even the implied warranty of

 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

 * GNU General Public License for more details.

 *

 * You should have received a copy of the GNU General Public License

 * along with this program.  If not, see <http://www.gnu.org/licenses/>.

 */


/** @file

 *  P3M algorithm for long-range magnetic dipole-dipole interaction.

 *

 *  By default the magnetic epsilon is metallic = 0.

 */


#include "config/config.hpp"


#ifdef DP3M


#include "magnetostatics/dp3m.hpp"


#include "p3m/TuningAlgorithm.hpp"

#include "p3m/TuningLogger.hpp"

#include "p3m/common.hpp"

#include "p3m/fft.hpp"

#include "p3m/influence_function_dipolar.hpp"

#include "p3m/interpolation.hpp"

#include "p3m/send_mesh.hpp"


#include "BoxGeometry.hpp"

#include "LocalBox.hpp"

#include "Particle.hpp"

#include "ParticleRange.hpp"

#include "PropagationMode.hpp"

#include "cell_system/CellStructure.hpp"

#include "cell_system/CellStructureType.hpp"

#include "communication.hpp"

#include "errorhandling.hpp"

#include "integrators/Propagation.hpp"

#include "npt.hpp"

#include "system/System.hpp"

#include "tuning.hpp"


#include <utils/Vector.hpp>

#include <utils/constants.hpp>

#include <utils/integral_parameter.hpp>

#include <utils/math/int_pow.hpp>

#include <utils/math/sinc.hpp>

#include <utils/math/sqr.hpp>


#include <boost/mpi/collectives/all_reduce.hpp>

#include <boost/mpi/collectives/reduce.hpp>


#include <algorithm>
#include <array>
#include <cmath>
#include <cstddef>
#include <cstdio>
#include <functional>
#include <optional>
#include <sstream>
#include <stdexcept>
#include <vector>


/**
 * Count the magnetic particles and accumulate their squared dipole moments.
 *
 * Particles with a vanishing dipole moment are ignored. The local sums are
 * added up over all ranks of @c comm_cart and stored in
 * @c dp3m.sum_mu2 and @c dp3m.sum_dip_part on every rank.
 */
void DipolarP3M::count_magnetic_particles() {
  auto n_magnetic = 0;
  auto mu2_acc = 0.;

  for (auto const &particle : get_system().cell_structure->local_particles()) {
    if (particle.dipm() == 0.) {
      continue; // non-magnetic particle
    }
    mu2_acc += particle.calc_dip().norm2();
    ++n_magnetic;
  }

  boost::mpi::all_reduce(comm_cart, mu2_acc, dp3m.sum_mu2, std::plus<>());
  boost::mpi::all_reduce(comm_cart, n_magnetic, dp3m.sum_dip_part,
                         std::plus<>());
}


/* Forward declaration of the k-space error estimate used during tuning;
 * the definition is further down in this file. */
static double dp3m_k_space_error(double box_size, int mesh, int cao,
                                 int n_c_part, double sum_q2, double alpha_L);

/* Forward declaration of the real-space error estimate used during tuning;
 * the definition is further down in this file. */
static double dp3m_real_space_error(double box_size, double r_cut_iL,
                                    int n_c_part, double sum_q2,
                                    double alpha_L);

/** Compute the value of alpha through a bisection method.
 *  Based on eq. (33) @cite wang01a.
 *
 *  The search interval is [@p x1, @p x2], the interval is halved until it is
 *  narrower than @p xacc, and the target value of the real-space error is
 *  @p tuned_accuracy divided by sqrt(2). The remaining arguments are
 *  forwarded to the real-space error estimate.
 */
double dp3m_rtbisection(double box_size, double r_cut_iL, int n_c_part,
                        double sum_q2, double x1, double x2, double xacc,
                        double tuned_accuracy);


/**
 * Evaluate the self-energy influence-function sum on the local part of the
 * k-space mesh, add the contributions of all ranks onto rank 0 and normalise
 * the result by 3 * box length * mesh^3, times pi.
 *
 * The reduction targets rank 0 only, hence the returned value is only
 * meaningful there.
 */
double DipolarP3M::calc_average_self_energy_k_space() const {
  auto const &plan = dp3m.fft.plan[3];
  auto const mesh_begin = Utils::Vector3i{plan.start};
  auto const mesh_end = mesh_begin + Utils::Vector3i{plan.new_mesh};
  auto const box_l = get_system().box_geo->length()[0];

  auto const local_phi = grid_influence_function_self_energy(
      dp3m.params, mesh_begin, mesh_end, dp3m.g_energy);

  auto global_phi = 0.;
  boost::mpi::reduce(comm_cart, local_phi, global_phi, std::plus<>(), 0);

  auto const norm = 3. * box_l * Utils::int_pow<3>(dp3m.params.mesh[0]);
  return (global_phi / norm) * Utils::pi();
}


/**
 * (Re-)initialise all data structures that depend on the P3M parameters:
 * derived parameters, local mesh layout, halo communication, FFT plans,
 * mesh buffers, differential operator, box-length dependent constants and
 * the magnetic particle statistics.
 */
void DipolarP3M::init() {
  assert(dp3m.params.mesh >= Utils::Vector3i::broadcast(1));
  assert(dp3m.params.cao >= 1 and dp3m.params.cao <= 7);
  assert(dp3m.params.alpha > 0.);

  auto const &system = get_system();
  auto const skin = system.cell_structure->get_verlet_skin();

  /* derived parameters and local mesh geometry */
  dp3m.params.cao3 = Utils::int_pow<3>(dp3m.params.cao);
  dp3m.params.recalc_a_ai_cao_cut(system.box_geo->length());
  dp3m.local_mesh.calc_local_ca_mesh(dp3m.params, *system.local_geo, skin, 0.);

  dp3m.sm.resize(comm_cart, dp3m.local_mesh);

  /* set up the FFT; the return value is the required mesh buffer size */
  int const n_mesh_points =
      fft_init(dp3m.local_mesh.dim, dp3m.local_mesh.margin, dp3m.params.mesh,
               dp3m.params.mesh_off, dp3m.ks_pnum, dp3m.fft,
               ::communicator.node_grid, comm_cart);
  dp3m.rs_mesh.resize(n_mesh_points);
  dp3m.ks_mesh.resize(n_mesh_points);
  for (auto &component_mesh : dp3m.rs_mesh_dip) {
    component_mesh.resize(n_mesh_points);
  }

  dp3m.calc_differential_operator();

  /* box length dependent constants */
  scaleby_box_l();

  count_magnetic_particles();
}


/**
 * Construct the solver from a set of P3M parameters.
 *
 * @param parameters    P3M parameters, moved into the solver
 * @param prefactor     interaction prefactor, forwarded to set_prefactor()
 * @param tune_timings  number of timings used by the tuning; must be > 0
 * @param tune_verbose  verbosity flag handed to the tuning logger
 * @throws std::domain_error if @p tune_timings is not positive or if the
 *         mesh is not cubic
 */
DipolarP3M::DipolarP3M(P3MParameters &&parameters, double prefactor,
                       int tune_timings, bool tune_verbose)
    : dp3m{std::move(parameters)}, tune_timings{tune_timings},
      tune_verbose{tune_verbose} {

  set_prefactor(prefactor);

  // parameters not flagged for tuning are considered to be tuned already
  m_is_tuned = not dp3m.params.tuning;
  dp3m.params.tuning = false;

  if (tune_timings < 1) {
    throw std::domain_error("Parameter 'timings' must be > 0");
  }

  auto const &mesh = dp3m.params.mesh;
  if (mesh[1] != mesh[0] or mesh[2] != mesh[0]) {
    throw std::domain_error("DipolarP3M requires a cubic mesh");
  }
}


namespace {

/**
 * Functor that spreads the dipole moment of a single particle onto the three
 * real-space dipole meshes for a compile-time charge assignment order
 * @c cao, and stores the interpolation weights in @c dp3m.inter_weights.
 */
template <int cao> struct AssignDipole {
  void operator()(dp3m_data_struct &dp3m, Utils::Vector3d const &real_pos,
                  Utils::Vector3d const &dip) const {
    auto const weights = p3m_calculate_interpolation_weights<cao>(
        real_pos, dp3m.params.ai, dp3m.local_mesh);

    /* add the weighted dipole components to mesh point `ind` */
    auto const deposit = [&dip, &dp3m](int ind, double w) {
      for (int k = 0; k < 3; ++k) {
        dp3m.rs_mesh_dip[k][ind] += w * dip[k];
      }
    };
    p3m_interpolate<cao>(dp3m.local_mesh, weights, deposit);

    dp3m.inter_weights.store<cao>(weights);
  }
};

} // namespace


/**
 * Assign the dipole moments of all magnetic particles in @p particles to the
 * real-space dipole meshes.
 *
 * The cached interpolation weights are reset and the first
 * @c dp3m.local_mesh.size entries of every dipole mesh are zeroed beforehand.
 */
void DipolarP3M::dipole_assign(ParticleRange const &particles) {
  dp3m.inter_weights.reset(dp3m.params.cao);

  /* clear the local FFT meshes */
  for (auto &component_mesh : dp3m.rs_mesh_dip) {
    std::fill_n(component_mesh.data(), dp3m.local_mesh.size, 0.);
  }

  for (auto const &particle : particles) {
    if (particle.dipm() == 0.) {
      continue; // nothing to assign for non-magnetic particles
    }
    Utils::integral_parameter<int, AssignDipole, 1, 7>(
        dp3m.params.cao, dp3m, particle.pos(), particle.calc_dip());
  }
}


namespace {


template <int cao> struct AssignTorques {


  void operator()(dp3m_data_struct const &dp3m, double prefac, int d_rs,

                  ParticleRange const &particles) const {


    /* magnetic particle index */

    auto p_index = std::size_t{0ul};


    for (auto &p : particles) {

      if (p.dipm() != 0.) {

        auto const w = dp3m.inter_weights.load<cao>(p_index);


        Utils::Vector3d E{};

        p3m_interpolate(dp3m.local_mesh, w,

                        [&E, &dp3m, d_rs](int ind, double w) {

                          E[d_rs] += w * dp3m.rs_mesh[ind];

                        });


        p.torque() -= vector_product(p.calc_dip(), prefac * E);

        ++p_index;

      }

    }

  }


};


template <int cao> struct AssignForces {


  void operator()(dp3m_data_struct const &dp3m, double prefac, int d_rs,

                  ParticleRange const &particles) const {


    /* magnetic particle index */

    auto p_index = std::size_t{0ul};


    for (auto &p : particles) {

      if (p.dipm() != 0.) {

        auto const w = dp3m.inter_weights.load<cao>(p_index);


        Utils::Vector3d E{};

        p3m_interpolate(dp3m.local_mesh, w, [&E, &dp3m](int ind, double w) {

          E[0] += w * dp3m.rs_mesh_dip[0][ind];

          E[1] += w * dp3m.rs_mesh_dip[1][ind];

          E[2] += w * dp3m.rs_mesh_dip[2][ind];

        });


        p.force()[d_rs] += p.calc_dip() * prefac * E;

        ++p_index;

      }

    }

  }


};


} // namespace


/**
 * Compute the k-space (long-range) part of the dipolar P3M interaction.
 *
 * If the system carries a non-zero total squared dipole moment, the dipoles
 * are assigned to the mesh and transformed to k-space. Depending on the
 * flags, the k-space energy and/or the k-space torques and forces are then
 * evaluated; torques and forces are added directly to the particles. When
 * the dielectric constant is not metallic, the surface term is added too.
 *
 * @param force_flag   compute torques and forces
 * @param energy_flag  compute the energy
 * @param particles    particles to interact
 * @return the energy if @p energy_flag is set, otherwise 0. The mesh energy
 *         is reduced onto rank 0 and the corrections are only applied there,
 *         so the value is only complete on rank 0.
 */
double DipolarP3M::long_range_kernel(bool force_flag, bool energy_flag,
                                     ParticleRange const &particles) {
  /* k-space energy */
  double energy = 0.;
  auto const &system = get_system();
  auto const &box_geo = *system.box_geo;
  /* common normalisation by the number of mesh points (cubic mesh) */
  auto const dipole_prefac = prefactor / Utils::int_pow<3>(dp3m.params.mesh[0]);
#ifdef NPT
  /* with the NpT integrator the energy is needed whenever forces are */
  auto const npt_flag =
      force_flag and (system.propagation->integ_switch == INTEG_METHOD_NPT_ISO);
#else
  auto constexpr npt_flag = false;
#endif

  if (dp3m.sum_mu2 > 0.) {
    dipole_assign(particles);
    /* Gather information for FFT grid inside the nodes domain (inner local
     * mesh) and perform forward 3D FFT (Charge Assignment Mesh). */
    std::array<double *, 3> meshes = {{dp3m.rs_mesh_dip[0].data(),
                                       dp3m.rs_mesh_dip[1].data(),
                                       dp3m.rs_mesh_dip[2].data()}};

    dp3m.sm.gather_grid(Utils::make_span(meshes), comm_cart,
                        dp3m.local_mesh.dim);

    fft_perform_forw(dp3m.rs_mesh_dip[0].data(), dp3m.fft, comm_cart);
    fft_perform_forw(dp3m.rs_mesh_dip[1].data(), dp3m.fft, comm_cart);
    fft_perform_forw(dp3m.rs_mesh_dip[2].data(), dp3m.fft, comm_cart);
    // Note: after these calls, the grids are in the order yzx and not xyz
    // anymore!!!
  }

  /* === k-space energy calculation  === */
  if (energy_flag or npt_flag) {
    /*********************
       Dipolar energy
    **********************/
    if (dp3m.sum_mu2 > 0.) {
      /* i*k differentiation for dipolar gradients:
       * |(\Fourier{\vect{mu}}(k)\cdot \vect{k})|^2 */
      /* `ind` walks the interleaved (real, imaginary) mesh entries,
       * `i` walks the influence function */
      int ind = 0;
      int i = 0;
      int j[3];
      double node_energy = 0.0;
      for (j[0] = 0; j[0] < dp3m.fft.plan[3].new_mesh[0]; j[0]++) {
        for (j[1] = 0; j[1] < dp3m.fft.plan[3].new_mesh[1]; j[1]++) {
          for (j[2] = 0; j[2] < dp3m.fft.plan[3].new_mesh[2]; j[2]++) {
            node_energy +=
                dp3m.g_energy[i] *
                (Utils::sqr(
                     dp3m.rs_mesh_dip[0][ind] *
                         dp3m.d_op[0][j[2] + dp3m.fft.plan[3].start[2]] +
                     dp3m.rs_mesh_dip[1][ind] *
                         dp3m.d_op[0][j[0] + dp3m.fft.plan[3].start[0]] +
                     dp3m.rs_mesh_dip[2][ind] *
                         dp3m.d_op[0][j[1] + dp3m.fft.plan[3].start[1]]) +
                 Utils::sqr(
                     dp3m.rs_mesh_dip[0][ind + 1] *
                         dp3m.d_op[0][j[2] + dp3m.fft.plan[3].start[2]] +
                     dp3m.rs_mesh_dip[1][ind + 1] *
                         dp3m.d_op[0][j[0] + dp3m.fft.plan[3].start[0]] +
                     dp3m.rs_mesh_dip[2][ind + 1] *
                         dp3m.d_op[0][j[1] + dp3m.fft.plan[3].start[1]]));
            ind += 2;
            i++;
          }
        }
      }
      node_energy *= dipole_prefac * Utils::pi() * box_geo.length_inv()[0];
      /* sum of all per-rank contributions, available on rank 0 only */
      boost::mpi::reduce(comm_cart, node_energy, energy, std::plus<>(), 0);

      /* a value of exactly zero marks a correction that was not yet
       * computed */
      if (dp3m.energy_correction == 0.)
        calc_energy_correction();

      if (this_node == 0) {
        /* self energy correction */
        energy -= prefactor * dp3m.sum_mu2 * Utils::sqrt_pi_i() * (2. / 3.) *
                  Utils::int_pow<3>(dp3m.params.alpha);

        /* dipolar energy correction due to systematic Madelung-self effects */
        energy += prefactor * dp3m.energy_correction / box_geo.volume();
      }
    }
  } // if (energy_flag or npt_flag)

  /* === k-space force calculation  === */
  if (force_flag) {
    /****************************
     * DIPOLAR TORQUES (k-space)
     ****************************/
    if (dp3m.sum_mu2 > 0.) {
      auto const two_pi_L_i = 2. * Utils::pi() * box_geo.length_inv()[0];
      /* fill in ks_mesh array for torque calculation */
      int ind = 0;
      int i = 0;
      int j[3];
      double tmp0, tmp1;

      for (j[0] = 0; j[0] < dp3m.fft.plan[3].new_mesh[0]; j[0]++) { // j[0]=n_y
        for (j[1] = 0; j[1] < dp3m.fft.plan[3].new_mesh[1];
             j[1]++) { // j[1]=n_z
          for (j[2] = 0; j[2] < dp3m.fft.plan[3].new_mesh[2];
               j[2]++) { // j[2]=n_x
            // tmp0 = Re(mu)*k,   tmp1 = Im(mu)*k

            tmp0 = dp3m.rs_mesh_dip[0][ind] *
                       dp3m.d_op[0][j[2] + dp3m.fft.plan[3].start[2]] +
                   dp3m.rs_mesh_dip[1][ind] *
                       dp3m.d_op[0][j[0] + dp3m.fft.plan[3].start[0]] +
                   dp3m.rs_mesh_dip[2][ind] *
                       dp3m.d_op[0][j[1] + dp3m.fft.plan[3].start[1]];

            tmp1 = dp3m.rs_mesh_dip[0][ind + 1] *
                       dp3m.d_op[0][j[2] + dp3m.fft.plan[3].start[2]] +
                   dp3m.rs_mesh_dip[1][ind + 1] *
                       dp3m.d_op[0][j[0] + dp3m.fft.plan[3].start[0]] +
                   dp3m.rs_mesh_dip[2][ind + 1] *
                       dp3m.d_op[0][j[1] + dp3m.fft.plan[3].start[1]];

            /* the optimal influence function is the same for torques
               and energy */
            dp3m.ks_mesh[ind] = tmp0 * dp3m.g_energy[i];
            dp3m.ks_mesh[ind + 1] = tmp1 * dp3m.g_energy[i];
            ind += 2;
            i++;
          }
        }
      }

      /* Force component loop */
      for (int d = 0; d < 3; d++) {
        /* real-space direction that corresponds to k-space direction d */
        auto const d_rs = (d + dp3m.ks_pnum) % 3;
        ind = 0;
        for (j[0] = 0; j[0] < dp3m.fft.plan[3].new_mesh[0]; j[0]++) {
          for (j[1] = 0; j[1] < dp3m.fft.plan[3].new_mesh[1]; j[1]++) {
            for (j[2] = 0; j[2] < dp3m.fft.plan[3].new_mesh[2]; j[2]++) {
              /* real part, then imaginary part of the same mesh point */
              dp3m.rs_mesh[ind] =
                  dp3m.d_op[0][j[d] + dp3m.fft.plan[3].start[d]] *
                  dp3m.ks_mesh[ind];
              ind++;
              dp3m.rs_mesh[ind] =
                  dp3m.d_op[0][j[d] + dp3m.fft.plan[3].start[d]] *
                  dp3m.ks_mesh[ind];
              ind++;
            }
          }
        }

        /* Back FFT force component mesh */
        fft_perform_back(dp3m.rs_mesh.data(), false, dp3m.fft, comm_cart);
        /* redistribute force component mesh */
        dp3m.sm.spread_grid(dp3m.rs_mesh.data(), comm_cart,
                            dp3m.local_mesh.dim);
        /* Assign force component from mesh to particle */
        Utils::integral_parameter<int, AssignTorques, 1, 7>(
            dp3m.params.cao, dp3m, dipole_prefac * two_pi_L_i, d_rs, particles);
      }

      /***************************
         DIPOLAR FORCES (k-space)
      ****************************/

      // Compute forces after torques because the algorithm below overwrites the
      // grids dp3m.rs_mesh_dip !
      // Note: I'll do here 9 inverse FFTs. By symmetry, we can reduce this
      // number to 6 !
      /* fill in ks_mesh array for force calculation */
      ind = 0;
      i = 0;
      for (j[0] = 0; j[0] < dp3m.fft.plan[3].new_mesh[0]; j[0]++) { // j[0]=n_y
        for (j[1] = 0; j[1] < dp3m.fft.plan[3].new_mesh[1];
             j[1]++) { // j[1]=n_z
          for (j[2] = 0; j[2] < dp3m.fft.plan[3].new_mesh[2];
               j[2]++) { // j[2]=n_x
            // tmp0 = Im(mu)*k,   tmp1 = -Re(mu)*k
            tmp0 = dp3m.rs_mesh_dip[0][ind + 1] *
                       dp3m.d_op[0][j[2] + dp3m.fft.plan[3].start[2]] +
                   dp3m.rs_mesh_dip[1][ind + 1] *
                       dp3m.d_op[0][j[0] + dp3m.fft.plan[3].start[0]] +
                   dp3m.rs_mesh_dip[2][ind + 1] *
                       dp3m.d_op[0][j[1] + dp3m.fft.plan[3].start[1]];
            tmp1 = dp3m.rs_mesh_dip[0][ind] *
                       dp3m.d_op[0][j[2] + dp3m.fft.plan[3].start[2]] +
                   dp3m.rs_mesh_dip[1][ind] *
                       dp3m.d_op[0][j[0] + dp3m.fft.plan[3].start[0]] +
                   dp3m.rs_mesh_dip[2][ind] *
                       dp3m.d_op[0][j[1] + dp3m.fft.plan[3].start[1]];
            /* the sign of tmp1 is applied when storing the value */
            dp3m.ks_mesh[ind] = tmp0 * dp3m.g_force[i];
            dp3m.ks_mesh[ind + 1] = -tmp1 * dp3m.g_force[i];
            ind += 2;
            i++;
          }
        }
      }

      /* Force component loop */
      for (int d = 0; d < 3; d++) { /* direction in k-space: */
        auto const d_rs = (d + dp3m.ks_pnum) % 3;
        ind = 0;
        for (j[0] = 0; j[0] < dp3m.fft.plan[3].new_mesh[0];
             j[0]++) { // j[0]=n_y
          for (j[1] = 0; j[1] < dp3m.fft.plan[3].new_mesh[1];
               j[1]++) { // j[1]=n_z
            for (j[2] = 0; j[2] < dp3m.fft.plan[3].new_mesh[2];
                 j[2]++) { // j[2]=n_x
              /* first entry of the interleaved pair */
              tmp0 = dp3m.d_op[0][j[d] + dp3m.fft.plan[3].start[d]] *
                     dp3m.ks_mesh[ind];
              dp3m.rs_mesh_dip[0][ind] =
                  dp3m.d_op[0][j[2] + dp3m.fft.plan[3].start[2]] * tmp0;
              dp3m.rs_mesh_dip[1][ind] =
                  dp3m.d_op[0][j[0] + dp3m.fft.plan[3].start[0]] * tmp0;
              dp3m.rs_mesh_dip[2][ind] =
                  dp3m.d_op[0][j[1] + dp3m.fft.plan[3].start[1]] * tmp0;
              ind++;
              /* second entry of the interleaved pair */
              tmp0 = dp3m.d_op[0][j[d] + dp3m.fft.plan[3].start[d]] *
                     dp3m.ks_mesh[ind];
              dp3m.rs_mesh_dip[0][ind] =
                  dp3m.d_op[0][j[2] + dp3m.fft.plan[3].start[2]] * tmp0;
              dp3m.rs_mesh_dip[1][ind] =
                  dp3m.d_op[0][j[0] + dp3m.fft.plan[3].start[0]] * tmp0;
              dp3m.rs_mesh_dip[2][ind] =
                  dp3m.d_op[0][j[1] + dp3m.fft.plan[3].start[1]] * tmp0;
              ind++;
            }
          }
        }
        /* Back FFT force component mesh */
        fft_perform_back(dp3m.rs_mesh_dip[0].data(), false, dp3m.fft,
                         comm_cart);
        fft_perform_back(dp3m.rs_mesh_dip[1].data(), false, dp3m.fft,
                         comm_cart);
        fft_perform_back(dp3m.rs_mesh_dip[2].data(), false, dp3m.fft,
                         comm_cart);
        /* redistribute force component mesh */
        std::array<double *, 3> meshes = {{dp3m.rs_mesh_dip[0].data(),
                                           dp3m.rs_mesh_dip[1].data(),
                                           dp3m.rs_mesh_dip[2].data()}};

        dp3m.sm.spread_grid(Utils::make_span(meshes), comm_cart,
                            dp3m.local_mesh.dim);
        /* Assign force component from mesh to particle */
        Utils::integral_parameter<int, AssignForces, 1, 7>(
            dp3m.params.cao, dp3m, dipole_prefac * Utils::sqr(two_pi_L_i), d_rs,
            particles);
      }
    } /* if (dp3m.sum_mu2 > 0) */
  } /* if (force_flag) */

  /* surface term, only for non-metallic boundary conditions */
  if (dp3m.params.epsilon != P3M_EPSILON_METALLIC) {
    auto const surface_term =
        calc_surface_term(force_flag, energy_flag or npt_flag, particles);
    if (this_node == 0) {
      energy += surface_term;
    }
  }
  if (npt_flag) {
    npt_add_virial_contribution(energy);
    fprintf(stderr, "dipolar_P3M at this moment is added to p_vir[0]\n");
  }
  /* the energy may have been computed for NpT only: do not report it */
  if (not energy_flag) {
    energy = 0.;
  }

  return energy;
}


double DipolarP3M::calc_surface_term(bool force_flag, bool energy_flag,

                                     ParticleRange const &particles) {

  auto const &box_geo = *get_system().box_geo;

  auto const pref = prefactor * 4. * Utils::pi() / box_geo.volume() /

                    (2. * dp3m.params.epsilon + 1.);

  auto const n_local_part = particles.size();


  // We put all the dipolar momenta in a the arrays mx,my,mz according to the

  // id-number of the particles

  std::vector<double> mx(n_local_part);

  std::vector<double> my(n_local_part);

  std::vector<double> mz(n_local_part);


  std::size_t ip = 0u;

  for (auto const &p : particles) {

    auto const dip = p.calc_dip();

    mx[ip] = dip[0];

    my[ip] = dip[1];

    mz[ip] = dip[2];

    ip++;

  }


  // we will need the sum of all dipolar momenta vectors

  auto local_dip = Utils::Vector3d{};

  for (std::size_t i = 0u; i < n_local_part; i++) {

    local_dip[0] += mx[i];

    local_dip[1] += my[i];

    local_dip[2] += mz[i];

  }

  auto const box_dip =

      boost::mpi::all_reduce(comm_cart, local_dip, std::plus<>());


  double energy = 0.;

  if (energy_flag) {

    double sum_e = 0.;

    for (std::size_t i = 0u; i < n_local_part; i++) {

      sum_e += mx[i] * box_dip[0] + my[i] * box_dip[1] + mz[i] * box_dip[2];

    }

    energy =

        0.5 * pref * boost::mpi::all_reduce(comm_cart, sum_e, std::plus<>());

  }


  if (force_flag) {


    std::vector<double> sumix(n_local_part);

    std::vector<double> sumiy(n_local_part);

    std::vector<double> sumiz(n_local_part);


    for (std::size_t i = 0u; i < n_local_part; i++) {

      sumix[i] = my[i] * box_dip[2] - mz[i] * box_dip[1];

      sumiy[i] = mz[i] * box_dip[0] - mx[i] * box_dip[2];

      sumiz[i] = mx[i] * box_dip[1] - my[i] * box_dip[0];

    }


    ip = 0u;

    for (auto &p : particles) {

      auto &torque = p.torque();

      torque[0] -= pref * sumix[ip];

      torque[1] -= pref * sumiy[ip];

      torque[2] -= pref * sumiz[ip];

      ip++;

    }

  }


  return energy;

}


/**
 * Tabulate the influence function used for the forces (template argument 3)
 * on the local part of the k-space mesh and store it in @c dp3m.g_force.
 */
void DipolarP3M::calc_influence_function_force() {
  auto const &plan = dp3m.fft.plan[3];
  auto const mesh_begin = Utils::Vector3i{plan.start};
  auto const mesh_end = mesh_begin + Utils::Vector3i{plan.new_mesh};
  auto const &box_l = get_system().box_geo->length();

  dp3m.g_force =
      grid_influence_function<3>(dp3m.params, mesh_begin, mesh_end, box_l);
}


/**
 * Tabulate the influence function used for the energy and the torques
 * (template argument 2) on the local part of the k-space mesh and store it
 * in @c dp3m.g_energy.
 */
void DipolarP3M::calc_influence_function_energy() {
  auto const &plan = dp3m.fft.plan[3];
  auto const mesh_begin = Utils::Vector3i{plan.start};
  auto const mesh_end = mesh_begin + Utils::Vector3i{plan.new_mesh};
  auto const &box_l = get_system().box_geo->length();

  dp3m.g_energy =
      grid_influence_function<2>(dp3m.params, mesh_begin, mesh_end, box_l);
}


class DipolarTuningAlgorithm : public TuningAlgorithm {

  dp3m_data_struct &dp3m;

  int m_mesh_max = -1, m_mesh_min = -1;


public:


  DipolarTuningAlgorithm(System::System &system, dp3m_data_struct &input_dp3m,

                         double prefactor, int timings)

      : TuningAlgorithm(system, prefactor, timings), dp3m{input_dp3m} {}


  P3MParameters &get_params() override { return dp3m.params; }


  void on_solver_change() const override { m_system.on_dipoles_change(); }


  std::optional<std::string>


  layer_correction_veto_r_cut(double) const override {

    return {};

  }


  void setup_logger(bool verbose) override {

    auto const &box_geo = *m_system.box_geo;

    m_logger = std::make_unique<TuningLogger>(

        verbose and this_node == 0, "DipolarP3M", TuningLogger::Mode::Dipolar);

    m_logger->tuning_goals(dp3m.params.accuracy, m_prefactor,

                           box_geo.length()[0], dp3m.sum_dip_part,

                           dp3m.sum_mu2);

    m_logger->log_tuning_start();

  }


  std::tuple<double, double, double, double>


  calculate_accuracy(Utils::Vector3i const &mesh, int cao,

                     double r_cut_iL) const override {


    double alpha_L, rs_err, ks_err;

    auto const &box_geo = *m_system.box_geo;


    /* calc maximal real space error for setting */

    rs_err = dp3m_real_space_error(box_geo.length()[0], r_cut_iL,

                                   dp3m.sum_dip_part, dp3m.sum_mu2, 0.001);

    // alpha cannot be zero for dipoles because real-space formula breaks down


    if (Utils::sqrt_2() * rs_err > dp3m.params.accuracy) {

      /* assume rs_err = ks_err -> rs_err = accuracy/sqrt(2.0) -> alpha_L */

      alpha_L = dp3m_rtbisection(

          box_geo.length()[0], r_cut_iL, dp3m.sum_dip_part, dp3m.sum_mu2,

          0.0001 * box_geo.length()[0], 5. * box_geo.length()[0], 0.0001,

          dp3m.params.accuracy);

    } else {

      /* even alpha=0 is ok, however, we cannot choose it since it kills the

         k-space error formula.

         Anyways, this very likely NOT the optimal solution */

      alpha_L = 0.1;

    }


    /* calculate real-space and k-space error for this alpha_L */

    rs_err = dp3m_real_space_error(box_geo.length()[0], r_cut_iL,

                                   dp3m.sum_dip_part, dp3m.sum_mu2, alpha_L);

    ks_err = dp3m_k_space_error(box_geo.length()[0], mesh[0], cao,

                                dp3m.sum_dip_part, dp3m.sum_mu2, alpha_L);


    return {Utils::Vector2d{rs_err, ks_err}.norm(), rs_err, ks_err, alpha_L};

  }


  void determine_mesh_limits() override {

    if (dp3m.params.mesh[0] == -1) {

      /* simple heuristic to limit the tried meshes if the accuracy cannot

         be obtained with smaller meshes, but normally not all these

         meshes have to be tested */

      auto const expo = std::log(std::cbrt(dp3m.sum_dip_part)) / std::log(2.);

      /* Medium-educated guess for the minimal mesh */

      m_mesh_min = static_cast<int>(std::round(std::pow(2., std::floor(expo))));

      /* avoid using more than 1 GB of FFT arrays */

      m_mesh_max = 128;

    } else {

      m_mesh_min = m_mesh_max = dp3m.params.mesh[0];

      m_logger->report_fixed_mesh(dp3m.params.mesh);

    }

  }


  TuningAlgorithm::Parameters get_time() override {

    auto tuned_params = TuningAlgorithm::Parameters{};

    auto time_best = time_sentinel;

    for (auto tmp_mesh = m_mesh_min; tmp_mesh <= m_mesh_max; tmp_mesh += 2) {

      auto trial_params = TuningAlgorithm::Parameters{};

      trial_params.mesh = Utils::Vector3i::broadcast(tmp_mesh);

      trial_params.cao = cao_best;


      auto const trial_time =

          get_m_time(trial_params.mesh, trial_params.cao, trial_params.r_cut_iL,

                     trial_params.alpha_L, trial_params.accuracy);


      /* this mesh does not work at all */

      if (trial_time < 0.)

        continue;


      /* the optimum r_cut for this mesh is the upper limit for higher meshes,

         everything else is slower */

      m_r_cut_iL_max = trial_params.r_cut_iL;


      if (trial_time < time_best) {

        /* new optimum */

        reset_n_trials();

        tuned_params = trial_params;

        time_best = tuned_params.time = trial_time;

      } else if (trial_time > time_best + time_granularity or

                 get_n_trials() > max_n_consecutive_trials) {

        /* no hope of further optimisation */

        break;

      }

    }

    return tuned_params;

  }


};


void DipolarP3M::tune() {

  auto &system = get_system();

  auto const &box_geo = *system.box_geo;

  if (dp3m.params.alpha_L == 0. and dp3m.params.alpha != 0.) {

    dp3m.params.alpha_L = dp3m.params.alpha * box_geo.length()[0];

  }

  if (dp3m.params.r_cut_iL == 0. and dp3m.params.r_cut != 0.) {

    dp3m.params.r_cut_iL = dp3m.params.r_cut * box_geo.length_inv()[0];

  }

  if (not is_tuned()) {

    count_magnetic_particles();

    if (dp3m.sum_dip_part == 0) {

      throw std::runtime_error(

          "DipolarP3M: no dipolar particles in the system");

    }

    try {

      DipolarTuningAlgorithm parameters(system, dp3m, prefactor, tune_timings);

      parameters.setup_logger(tune_verbose);

      // parameter ranges

      parameters.determine_mesh_limits();

      parameters.determine_r_cut_limits();

      parameters.determine_cao_limits(3);

      // run tuning algorithm

      parameters.tune();

      m_is_tuned = true;

      system.on_dipoles_change();

    } catch (...) {

      dp3m.params.tuning = false;

      throw;

    }

  }

  init();

}


/**
 * Aliasing sums needed by the dipolar P3M k-space error estimate.
 *
 * The sums run over the shifted wave vectors <tt>n + m * mesh</tt> with every
 * component of @c m in <tt>[-P3M_BRILLOUIN, P3M_BRILLOUIN]</tt>.
 *
 * @param nx,ny,nz   integer wave vector; must not be the zero vector, since
 *                   the term with <tt>m = 0</tt> would then divide by zero
 * @param mesh       number of mesh points per direction
 * @param mesh_i     inverse of @p mesh
 * @param cao        charge assignment order
 * @param alpha_L_i  inverse of the box-scaled Ewald parameter
 * @return pair (alias1, alias2) of the two accumulated sums
 */
static auto dp3m_tune_aliasing_sums(int nx, int ny, int nz, int mesh,
                                    double mesh_i, int cao, double alpha_L_i) {
  using Utils::sinc;

  auto const factor1 = Utils::sqr(Utils::pi() * alpha_L_i);
  auto const two_cao = 2. * cao;

  auto alias1 = 0.;
  auto alias2 = 0.;
  for (int mx = -P3M_BRILLOUIN; mx <= P3M_BRILLOUIN; mx++) {
    auto const nmx = nx + mx * mesh;
    auto const fnmx = mesh_i * nmx;
    // loop-invariant factors are hoisted out of the inner loops; the order
    // of the multiplications is the one of the full product
    auto const sinc_x = sinc(fnmx);
    for (int my = -P3M_BRILLOUIN; my <= P3M_BRILLOUIN; my++) {
      auto const nmy = ny + my * mesh;
      auto const fnmy = mesh_i * nmy;
      auto const sinc_xy = sinc_x * sinc(fnmy);
      for (int mz = -P3M_BRILLOUIN; mz <= P3M_BRILLOUIN; mz++) {
        auto const nmz = nz + mz * mesh;
        auto const fnmz = mesh_i * nmz;

        auto const nm2 = Utils::sqr(nmx) + Utils::sqr(nmy) + Utils::sqr(nmz);
        auto const ex = std::exp(-factor1 * nm2);

        auto const U2 = std::pow(sinc_xy * sinc(fnmz), two_cao);

        // cube of the integer dot product n . (n + m * mesh), computed by
        // plain multiplication rather than through a call to pow()
        auto const n_dot_nm =
            static_cast<double>(nx * nmx + ny * nmy + nz * nmz);
        auto const n_dot_nm3 = n_dot_nm * n_dot_nm * n_dot_nm;

        alias1 += Utils::sqr(ex) * nm2;
        alias2 += U2 * ex * n_dot_nm3 / nm2;
      }
    }
  }
  return std::make_pair(alias1, alias2);
}


/**
 * Calculate the k-space error of dipolar-P3M.
 *
 * The estimate sums a per-wave-vector contribution over all integer wave
 * vectors with components in <tt>[-mesh/2, mesh/2)</tt>, excluding the zero
 * vector.
 *
 * @param box_size  box length
 * @param mesh      number of mesh points per direction
 * @param cao       charge assignment order
 * @param n_c_part  number of dipolar particles
 * @param sum_q2    sum of the squared dipole moments
 * @param alpha_L   box-scaled Ewald parameter
 * @return the estimated k-space error
 */
static double dp3m_k_space_error(double box_size, int mesh, int cao,
                                 int n_c_part, double sum_q2, double alpha_L) {
  auto const mesh_i = 1. / mesh;
  auto const alpha_L_i = 1. / alpha_L;
  auto const half_mesh = mesh / 2;

  auto he_q = 0.;
  for (int nx = -half_mesh; nx < half_mesh; nx++) {
    for (int ny = -half_mesh; ny < half_mesh; ny++) {
      for (int nz = -half_mesh; nz < half_mesh; nz++) {
        if (nx == 0 and ny == 0 and nz == 0) {
          continue; // the zero wave vector does not contribute
        }
        auto const n2 = Utils::sqr(nx) + Utils::sqr(ny) + Utils::sqr(nz);
        auto const cs = p3m_analytic_cotangent_sum(nx, mesh_i, cao) *
                        p3m_analytic_cotangent_sum(ny, mesh_i, cao) *
                        p3m_analytic_cotangent_sum(nz, mesh_i, cao);
        auto const [alias1, alias2] =
            dp3m_tune_aliasing_sums(nx, ny, nz, mesh, mesh_i, cao, alpha_L_i);
        auto const d =
            alias1 - Utils::sqr(alias2 / cs) /
                         Utils::int_pow<3>(static_cast<double>(n2));
        /* at high precision, d can become negative due to extinction;
           also, don't take values that have no significant digits left */
        if (d > 0 && (std::fabs(d / alias1) > ROUND_ERROR_PREC)) {
          he_q += d;
        }
      }
    }
  }

  return 8. * Utils::sqr(Utils::pi()) / 3. * sum_q2 *
         std::sqrt(he_q / n_c_part) / Utils::int_pow<4>(box_size);
}


/** Calculate the value of the errors for the REAL part of the force in terms
 *  of the splitting parameter alpha of Ewald. Based on eq. (33) @cite wang01a.
 *
 *  Please note that in this more refined approach we don't use
 *  eq. (37), but eq. (33) which maintains all the powers in alpha.
 *
 *  @param box_size  box length
 *  @param r_cut_iL  real-space cutoff in units of the box length
 *  @param n_c_part  number of dipolar particles
 *  @param sum_q2    sum of the squared dipole moments
 *  @param alpha_L   box-scaled Ewald parameter
 *  @return the estimated real-space error
 */
static double dp3m_real_space_error(double box_size, double r_cut_iL,
                                    int n_c_part, double sum_q2,
                                    double alpha_L) {
  /* cutoff in absolute units and its powers */
  auto const d_rcut = r_cut_iL * box_size;
  auto const d_rcut2 = Utils::sqr(d_rcut);
  auto const d_rcut4 = Utils::sqr(d_rcut2);

  /* squared Ewald parameter in absolute units */
  auto const d_a2 = Utils::sqr(alpha_L) / Utils::sqr(box_size);

  auto const d_c = sum_q2 * std::exp(-d_a2 * d_rcut2);

  auto const d_cc =
      4. * Utils::sqr(d_a2) * Utils::sqr(d_rcut2) + 6. * d_a2 * d_rcut2 + 3.;

  auto const d_dc =
      8. * Utils::int_pow<3>(d_a2) * Utils::int_pow<3>(d_rcut2) +
      20. * Utils::sqr(d_a2) * d_rcut4 + 30. * d_a2 * d_rcut2 + 15.;

  auto const d_con =
      1. / std::sqrt(Utils::int_pow<3>(box_size) * Utils::sqr(d_a2) * d_rcut *
                     Utils::sqr(d_rcut4) * static_cast<double>(n_c_part));

  return d_c * d_con *
         std::sqrt((13. / 6.) * Utils::sqr(d_cc) +
                   (2. / 15.) * Utils::sqr(d_dc) - (13. / 15.) * d_cc * d_dc);
}


/** Using bisection, find the root of the function
 *  "real-space error - tuned_accuracy/sqrt(2.)" known to lie between @p x1
 *  and @p x2. The returned root is refined until its accuracy is
 *  \f$\pm\f$ @p xacc.
 *
 *  @param box_size        box length
 *  @param r_cut_iL        real-space cutoff in units of the box length
 *  @param n_c_part        number of dipolar particles
 *  @param sum_q2          sum of the squared dipole moments
 *  @param x1,x2           bounds of the search interval
 *  @param xacc            requested accuracy of the root
 *  @param tuned_accuracy  target accuracy of the tuning
 *  @return the value of alpha_L at the root
 *  @throws std::runtime_error if the root is not bracketed by @p x1 and
 *          @p x2, or if the requested accuracy is not reached within the
 *          maximal number of bisections
 */
double dp3m_rtbisection(double box_size, double r_cut_iL, int n_c_part,
                        double sum_q2, double x1, double x2, double xacc,
                        double tuned_accuracy) {
  constexpr int JJ_RTBIS_MAX = 40;

  auto const constant = tuned_accuracy / Utils::sqrt_2();
  /* function whose root is searched for */
  auto const shifted_error = [&](double alpha_L) {
    return dp3m_real_space_error(box_size, r_cut_iL, n_c_part, sum_q2,
                                 alpha_L) -
           constant;
  };

  auto const f1 = shifted_error(x1);
  auto const f2 = shifted_error(x2);
  if (f1 * f2 >= 0.0) {
    throw std::runtime_error(
        "Root must be bracketed for bisection in dp3m_rtbisection");
  }

  // Orient the search: rtb starts at the bound where the function is
  // negative and dx points towards the other bound
  auto const start_at_x1 = f1 < 0.0;
  auto rtb = start_at_x1 ? x1 : x2;
  auto dx = start_at_x1 ? x2 - x1 : x1 - x2;

  for (int j = 1; j <= JJ_RTBIS_MAX; j++) {
    dx *= 0.5;
    auto const xmid = rtb + dx;
    auto const fmid = shifted_error(xmid);
    if (fmid <= 0.0) {
      rtb = xmid;
    }
    if (std::fabs(dx) < xacc || fmid == 0.0) {
      return rtb;
    }
  }
  throw std::runtime_error("Too many bisections in dp3m_rtbisection");
}


/** Check the box geometry against the current P3M parameters.
 *
 *  For every direction the charge-assignment cutoff must be smaller than
 *  both half the box length and the local box length; in addition all three
 *  box lengths must be equal.
 *
 *  @throw std::runtime_error on the first violated condition
 */
void DipolarP3M::sanity_checks_boxl() const {
  auto const &system = get_system();
  auto const &box_geo = *system.box_geo;
  auto const &local_geo = *system.local_geo;
  auto const &cao_cut = dp3m.params.cao_cut;

  // compose the message for an oversized cutoff and raise it
  auto const reject_cutoff = [](double cutoff, char const *reason,
                                double limit) {
    std::stringstream msg;
    msg << "dipolar P3M_init: k-space cutoff " << cutoff << reason << limit;
    throw std::runtime_error(msg.str());
  };

  for (auto dir = 0u; dir < 3u; ++dir) {
    /* check k-space cutoff */
    if (cao_cut[dir] >= box_geo.length_half()[dir]) {
      reject_cutoff(cao_cut[dir], " is larger than half of box dimension ",
                    box_geo.length()[dir]);
    }
    if (cao_cut[dir] >= local_geo.length()[dir]) {
      reject_cutoff(cao_cut[dir], " is larger than local box dimension ",
                    local_geo.length()[dir]);
    }
  }

  auto const is_cubic = (box_geo.length()[0] == box_geo.length()[1]) and
                        (box_geo.length()[1] == box_geo.length()[2]);
  if (not is_cubic) {
    throw std::runtime_error("DipolarP3M: requires a cubic box");
  }
}


/** Require the box to be periodic in all three directions.
 *
 *  @throw std::runtime_error if any direction is not periodic
 */
void DipolarP3M::sanity_checks_periodicity() const {
  auto const &box_geo = *get_system().box_geo;
  auto const fully_periodic =
      box_geo.periodic(0) and box_geo.periodic(1) and box_geo.periodic(2);
  if (not fully_periodic) {
    throw std::runtime_error(
        "DipolarP3M: requires periodicity (True, True, True)");
  }
}


/** Check that the cell system is compatible with dipolar P3M.
 *
 *  Only the regular and hybrid decompositions are accepted, and the hybrid
 *  decomposition only when the communicator size is at most one.
 *
 *  @throw std::runtime_error if the cell system is not supported
 */
void DipolarP3M::sanity_checks_cell_structure() const {
  auto const &local_geo = *get_system().local_geo;
  auto const cs_type = local_geo.cell_structure_type();
  auto const is_regular = cs_type == CellStructureType::REGULAR;
  auto const is_hybrid = cs_type == CellStructureType::HYBRID;

  if (not(is_regular or is_hybrid)) {
    throw std::runtime_error(
        "DipolarP3M: requires the regular or hybrid decomposition cell system");
  }
  if (is_hybrid and ::communicator.size > 1) {
    throw std::runtime_error(
        "DipolarP3M: does not work with the hybrid decomposition cell system, "
        "if using more than one MPI node");
  }
}


/** Require the node grid to be sorted in non-increasing order.
 *
 *  @throw std::runtime_error if a later entry is larger than an earlier one
 */
void DipolarP3M::sanity_checks_node_grid() const {
  auto const &grid = ::communicator.node_grid;
  auto const largest_first = grid[0] >= grid[1] and grid[1] >= grid[2];
  if (not largest_first) {
    throw std::runtime_error(
        "DipolarP3M: node grid must be sorted, largest first");
  }
}


/** Refresh every quantity that depends on the box length.
 *
 *  The statements below are order-dependent: the unscaled parameters are
 *  derived first, then the mesh-related quantities, then the box-length
 *  sanity checks run (they throw std::runtime_error on failure), and only
 *  afterwards are the influence functions recalculated.
 */
void DipolarP3M::scaleby_box_l() {

  auto const &box_geo = *get_system().box_geo;

  // unscaled cutoff and splitting parameter, using the box length along
  // the first axis (sanity_checks_boxl() enforces a cubic box)
  dp3m.params.r_cut = dp3m.params.r_cut_iL * box_geo.length()[0];

  dp3m.params.alpha = dp3m.params.alpha_L * box_geo.length_inv()[0];

  // quantities derived from the mesh and the box length
  dp3m.params.recalc_a_ai_cao_cut(box_geo.length());

  dp3m.local_mesh.recalc_ld_pos(dp3m.params);

  sanity_checks_boxl();

  calc_influence_function_force();

  calc_influence_function_energy();

  // reset the cached energy correction
  dp3m.energy_correction = 0.0;

}


/** Recompute and cache the energy correction.
 *
 *  The stored value is minus the sum of squared dipole moments times the sum
 *  of three terms: the average k-space self-energy multiplied by the box
 *  volume, the term <tt>-2 alpha_L^3 / (3 sqrt(pi))</tt>, and
 *  <tt>2 pi / 3</tt>.
 */
void DipolarP3M::calc_energy_correction() {
  auto const &box = *get_system().box_geo;
  auto const k_space_term = calc_average_self_energy_k_space() * box.volume();
  auto const alpha_L_cubed = Utils::int_pow<3>(dp3m.params.alpha_L);
  auto const self_term = -2. * alpha_L_cubed * Utils::sqrt_pi_i() / 3.;
  auto const correction_per_mu2 =
      k_space_term + self_term + 2. * Utils::pi() / 3.;
  dp3m.energy_correction = -dp3m.sum_mu2 * correction_per_mu2;
}


#ifdef NPT


/** Update the NpT virial.
 *
 *  Forwards @p energy unchanged to npt_add_virial_contribution().
 */
void npt_add_virial_magnetic_contribution(double energy) {

  npt_add_virial_contribution(energy);

}


#endif // NPT

#endif // DP3M

BoxGeometry.hpp

CellStructureType.hpp

CellStructureType::HYBRID
@ HYBRID
Hybrid decomposition.

CellStructureType::REGULAR
@ REGULAR
Regular decomposition.

CellStructure.hpp

LocalBox.hpp

ParticleRange.hpp

Particle.hpp

PropagationMode.hpp

INTEG_METHOD_NPT_ISO
@ INTEG_METHOD_NPT_ISO
Definition PropagationMode.hpp:45

Propagation.hpp

TuningAlgorithm.hpp

TuningLogger.hpp

Vector.hpp
Vector implementation and trait types for boost qvm interoperability.

torque
__global__ float float * torque
Definition barnes_hut_gpu_cuda.cu:685

u
float u[3]
Definition barnes_hut_gpu_cuda.cu:690

DipolarTuningAlgorithm
Definition dp3m.cpp:606

DipolarTuningAlgorithm::layer_correction_veto_r_cut
std::optional< std::string > layer_correction_veto_r_cut(double) const override
Definition dp3m.cpp:620

DipolarTuningAlgorithm::get_time
TuningAlgorithm::Parameters get_time() override
Definition dp3m.cpp:684

DipolarTuningAlgorithm::setup_logger
void setup_logger(bool verbose) override
Definition dp3m.cpp:624

DipolarTuningAlgorithm::calculate_accuracy
std::tuple< double, double, double, double > calculate_accuracy(Utils::Vector3i const &mesh, int cao, double r_cut_iL) const override
Definition dp3m.cpp:635

DipolarTuningAlgorithm::get_params
P3MParameters & get_params() override
Definition dp3m.cpp:615

DipolarTuningAlgorithm::DipolarTuningAlgorithm
DipolarTuningAlgorithm(System::System &system, dp3m_data_struct &input_dp3m, double prefactor, int timings)
Definition dp3m.cpp:611

DipolarTuningAlgorithm::determine_mesh_limits
void determine_mesh_limits() override
Definition dp3m.cpp:668

DipolarTuningAlgorithm::on_solver_change
void on_solver_change() const override
Definition dp3m.cpp:617

Dipoles::Actor< DipolarP3M >::set_prefactor
void set_prefactor(double new_prefactor)
Definition magnetostatics/actor.hpp:39

Dipoles::Actor< DipolarP3M >::prefactor
double prefactor
Magnetostatics prefactor.
Definition magnetostatics/actor.hpp:37

ParticleRange
A range of particles.
Definition ParticleRange.hpp:38

ParticleRange::size
base_type::size_type size() const
Definition ParticleRange.hpp:44

System::Leaf::get_system
auto & get_system()
Definition core/system/Leaf.hpp:38

System::System
Main system class.
Definition core/system/System.hpp:65

System::System::on_dipoles_change
void on_dipoles_change()
Definition core/system/System.cpp:277

System::System::box_geo
std::shared_ptr< BoxGeometry > box_geo
Definition core/system/System.hpp:265

TuningAlgorithm
Tuning algorithm for P3M.
Definition TuningAlgorithm.hpp:64

TuningAlgorithm::get_m_time
double get_m_time(Utils::Vector3i const &mesh, int &tuned_cao, double &tuned_r_cut_iL, double &tuned_alpha_L, double &tuned_accuracy)
Get the optimal alpha and the corresponding computation time for a fixed mesh.
Definition TuningAlgorithm.cpp:215

TuningAlgorithm::time_sentinel
static auto constexpr time_sentinel
Value for invalid time measurements.
Definition TuningAlgorithm.hpp:91

TuningAlgorithm::cao_best
int cao_best
Definition TuningAlgorithm.hpp:75

TuningAlgorithm::max_n_consecutive_trials
static auto constexpr max_n_consecutive_trials
Maximal number of consecutive trials that don't improve runtime.
Definition TuningAlgorithm.hpp:88

TuningAlgorithm::reset_n_trials
void reset_n_trials()
Definition TuningAlgorithm.hpp:180

TuningAlgorithm::m_system
System::System & m_system
Definition TuningAlgorithm.hpp:66

TuningAlgorithm::m_prefactor
double m_prefactor
Definition TuningAlgorithm.hpp:73

TuningAlgorithm::m_r_cut_iL_max
double m_r_cut_iL_max
Definition TuningAlgorithm.hpp:76

TuningAlgorithm::tune
void tune()
Definition TuningAlgorithm.hpp:154

TuningAlgorithm::determine_cao_limits
void determine_cao_limits(int initial_cao)
Determine a sensible range for the charge assignment order.
Definition TuningAlgorithm.cpp:77

TuningAlgorithm::determine_r_cut_limits
void determine_r_cut_limits()
Determine a sensible range for the real-space cutoff.
Definition TuningAlgorithm.cpp:59

TuningAlgorithm::m_logger
std::unique_ptr< TuningLogger > m_logger
Definition TuningAlgorithm.hpp:74

TuningAlgorithm::time_granularity
static auto constexpr time_granularity
Granularity of the time measurement (milliseconds).
Definition TuningAlgorithm.hpp:82

TuningAlgorithm::get_n_trials
auto get_n_trials()
Definition TuningAlgorithm.hpp:178

TuningLogger::Mode::Dipolar
@ Dipolar

Utils::Vector
Definition Vector.hpp:47

Utils::Vector::broadcast
static Vector< T, N > broadcast(T const &s)
Create a vector that has all entries set to one value.
Definition Vector.hpp:110

Utils::Vector::norm
T norm() const
Definition Vector.hpp:131

p3m_interpolation_cache::store
void store(const InterpolationWeights< cao > &w)
Push back weights for one point.
Definition interpolation.hpp:82

p3m_interpolation_cache::load
InterpolationWeights< cao > load(std::size_t i) const
Load entry from the cache.
Definition interpolation.hpp:103

p3m_interpolation_cache::reset
void reset(int cao)
Reset the cache.
Definition interpolation.hpp:125

p3m_send_mesh::spread_grid
void spread_grid(Utils::Span< double * > meshes, const boost::mpi::communicator &comm, const Utils::Vector3i &dim)
Definition send_mesh.cpp:186

p3m_send_mesh::resize
void resize(const boost::mpi::communicator &comm, const P3MLocalMesh &local_mesh)
Definition send_mesh.cpp:73

p3m_send_mesh::gather_grid
void gather_grid(Utils::Span< double * > meshes, const boost::mpi::communicator &comm, const Utils::Vector3i &dim)
Definition send_mesh.cpp:148

common.hpp
Common functions for dipolar and charge P3M.

P3M_EPSILON_METALLIC
auto constexpr P3M_EPSILON_METALLIC
This value indicates metallic boundary conditions.
Definition common.hpp:45

communicator
Communicator communicator
Definition communication.cpp:48

comm_cart
boost::mpi::communicator comm_cart
The communicator.
Definition communication.cpp:47

this_node
int this_node
The number of this node.
Definition communication.cpp:69

config.hpp
This file contains the defaults for ESPResSo.

ROUND_ERROR_PREC
#define ROUND_ERROR_PREC
Precision for capture of round off errors.
Definition config.hpp:66

P3M_BRILLOUIN
#define P3M_BRILLOUIN
P3M: Number of Brillouin zones taken into account in the calculation of the optimal influence functio...
Definition config.hpp:53

constants.hpp

vector_product
__device__ void vector_product(float const *a, float const *b, float *out)
Definition dipolar_direct_sum_gpu_cuda.cu:41

dp3m_k_space_error
static double dp3m_k_space_error(double box_size, int mesh, int cao, int n_c_part, double sum_q2, double alpha_L)
Calculate the k-space error of dipolar-P3M.
Definition dp3m.cpp:786

npt_add_virial_magnetic_contribution
void npt_add_virial_magnetic_contribution(double energy)
Update the NpT virial.
Definition dp3m.cpp:965

dp3m_rtbisection
double dp3m_rtbisection(double box_size, double r_cut_iL, int n_c_part, double sum_q2, double x1, double x2, double xacc, double tuned_accuracy)
Compute the value of alpha through a bisection method.
Definition dp3m.cpp:853

dp3m_tune_aliasing_sums
static auto dp3m_tune_aliasing_sums(int nx, int ny, int nz, int mesh, double mesh_i, int cao, double alpha_L_i)
Tuning dipolar-P3M.
Definition dp3m.cpp:754

dp3m_real_space_error
static double dp3m_real_space_error(double box_size, double r_cut_iL, int n_c_part, double sum_q2, double alpha_L)
Calculate the value of the errors for the REAL part of the force in terms of the splitting parameter ...
Definition dp3m.cpp:821

dp3m.hpp
P3M algorithm for long-range magnetic dipole-dipole interaction.

errorhandling.hpp
This file contains the errorhandling code for severe errors, like a broken bond or illegal parameter ...

fft_perform_forw
void fft_perform_forw(double *data, fft_data_struct &fft, const boost::mpi::communicator &comm)
Perform an in-place forward 3D FFT.
Definition fft.cpp:683

fft_perform_back
void fft_perform_back(double *data, bool check_complex, fft_data_struct &fft, const boost::mpi::communicator &comm)
Perform an in-place backward 3D FFT.
Definition fft.cpp:714

fft_init
int fft_init(Utils::Vector3i const &ca_mesh_dim, int const *ca_mesh_margin, Utils::Vector3i const &global_mesh_dim, Utils::Vector3d const &global_mesh_off, int &ks_pnum, fft_data_struct &fft, Utils::Vector3i const &grid, boost::mpi::communicator const &comm)
Initialize everything connected to the 3D-FFT.
Definition fft.cpp:484

fft.hpp
Routines, row decomposition, data structures and communication for the 3D-FFT.

influence_function_dipolar.hpp

grid_influence_function_self_energy
double grid_influence_function_self_energy(P3MParameters const &params, Utils::Vector3i const &n_start, Utils::Vector3i const &n_end, std::vector< double > const &g)
Calculate self-energy of the influence function.
Definition influence_function_dipolar.hpp:193

int_pow.hpp

integral_parameter.hpp

interpolation.hpp

p3m_interpolate
void p3m_interpolate(P3MLocalMesh const &local_mesh, InterpolationWeights< cao > const &weights, Kernel kernel)
P3M grid interpolation.
Definition interpolation.hpp:192

Cells::particles
ParticleRange particles(Utils::Span< Cell *const > cells)
Definition CellStructure.hpp:87

Utils::pi
DEVICE_QUALIFIER constexpr T pi()
Ratio of circumference to diameter of a circle.
Definition constants.hpp:36

Utils::sinc
DEVICE_QUALIFIER T sinc(T d)
Calculates the sinc-function as sin(PI*x)/(PI*x).
Definition sinc.hpp:45

Utils::sqr
DEVICE_QUALIFIER constexpr T sqr(T x)
Calculates the SQuaRe of x.
Definition sqr.hpp:26

Utils::make_span
DEVICE_QUALIFIER constexpr Span< T > make_span(T *p, std::size_t N)
Definition Span.hpp:112

Utils::sqrt_2
DEVICE_QUALIFIER constexpr T sqrt_2()
Square root of 2.
Definition constants.hpp:64

Utils::sqrt_pi_i
DEVICE_QUALIFIER constexpr T sqrt_pi_i()
One over square root of pi.
Definition constants.hpp:43

npt_add_virial_contribution
void npt_add_virial_contribution(double energy)
Definition npt.cpp:141

npt.hpp
Exports for the NpT code.

p3m_analytic_cotangent_sum
static __device__ double p3m_analytic_cotangent_sum(int n, double mesh_i)
Definition p3m_gpu_error_cuda.cu:54

send_mesh.hpp

sinc.hpp

sqr.hpp

Communicator::node_grid
Utils::Vector3i node_grid
Definition core/communication.hpp:64

DipolarP3M::init
void init()
Recalculate all derived parameters.
Definition dp3m.cpp:119

DipolarP3M::tune_timings
int tune_timings
Magnetostatics prefactor.
Definition dp3m.hpp:100

DipolarP3M::dipole_assign
void dipole_assign(ParticleRange const &particles)
Assign the physical dipoles using the tabulated assignment function.
Definition dp3m.cpp:190

DipolarP3M::dp3m
dp3m_data_struct dp3m
Dipolar P3M parameters.
Definition dp3m.hpp:97

DipolarP3M::DipolarP3M
DipolarP3M(P3MParameters &&parameters, double prefactor, int tune_timings, bool tune_verbose)
Definition dp3m.cpp:154

DipolarP3M::long_range_kernel
double long_range_kernel(bool force_flag, bool energy_flag, ParticleRange const &particles)
Compute the k-space part of forces and energies.
Definition dp3m.cpp:257

DipolarP3M::count_magnetic_particles
void count_magnetic_particles()
Count the number of magnetic particles and calculate the sum of the squared dipole moments.
Definition dp3m.cpp:76

DipolarP3M::tune
void tune()
Tune dipolar P3M parameters to desired accuracy.
Definition dp3m.cpp:719

DipolarP3M::is_tuned
bool is_tuned() const
Definition dp3m.hpp:170

DipolarP3M::tune_verbose
bool tune_verbose
Definition dp3m.hpp:101

P3MLocalMesh::dim
Utils::Vector3i dim
dimension (size) of local mesh.
Definition common.hpp:186

P3MLocalMesh::size
int size
number of local mesh points.
Definition common.hpp:188

P3MLocalMesh::recalc_ld_pos
void recalc_ld_pos(P3MParameters const &params)
Recalculate quantities derived from the mesh and box length: ld_pos (position of the left down mesh).
Definition common.hpp:213

P3MLocalMesh::calc_local_ca_mesh
void calc_local_ca_mesh(P3MParameters const &params, LocalBox const &local_geo, double skin, double space_layer)
Calculate properties of the local FFT mesh for the charge assignment process.
Definition common.cpp:78

P3MLocalMesh::margin
int margin[6]
number of margin mesh points.
Definition common.hpp:201

P3MParameters
Structure to hold P3M parameters and some dependent variables.
Definition common.hpp:67

P3MParameters::cao_cut
Utils::Vector3d cao_cut
cutoff for charge assignment.
Definition common.hpp:89

P3MParameters::alpha
double alpha
unscaled alpha_L for use with fast inline functions only
Definition common.hpp:96

P3MParameters::r_cut_iL
double r_cut_iL
cutoff radius for real space electrostatics (>0), rescaled to r_cut_iL = r_cut * box_l_i.
Definition common.hpp:75

P3MParameters::cao
int cao
charge assignment order ([0,7]).
Definition common.hpp:82

P3MParameters::accuracy
double accuracy
accuracy of the actual parameter set.
Definition common.hpp:84

P3MParameters::alpha_L
double alpha_L
Ewald splitting parameter (0 < alpha < 1), rescaled to alpha_L = alpha * box_l.
Definition common.hpp:72

P3MParameters::cao3
int cao3
number of points onto which a single charge is interpolated, i.e. cao^3.
Definition common.hpp:102

P3MParameters::mesh_off
Utils::Vector3d mesh_off
offset of the first mesh point (lower left corner) from the coordinate origin ([0,...
Definition common.hpp:80

P3MParameters::ai
Utils::Vector3d ai
inverse mesh constant.
Definition common.hpp:93

P3MParameters::r_cut
double r_cut
unscaled r_cut_iL for use with fast inline functions only
Definition common.hpp:99

P3MParameters::recalc_a_ai_cao_cut
void recalc_a_ai_cao_cut(Utils::Vector3d const &box_l)
Recalculate quantities derived from the mesh and box length: a, ai and cao_cut.
Definition common.hpp:167

P3MParameters::tuning
bool tuning
tuning or production?
Definition common.hpp:69

P3MParameters::mesh
Utils::Vector3i mesh
number of mesh points per coordinate direction (>0).
Definition common.hpp:77

P3MParameters::epsilon
double epsilon
epsilon of the "surrounding dielectric".
Definition common.hpp:87

TuningAlgorithm::Parameters
Definition TuningAlgorithm.hpp:100

TuningAlgorithm::Parameters::mesh
Utils::Vector3i mesh
Definition TuningAlgorithm.hpp:101

anonymous_namespace{dp3m.cpp}::AssignDipole
Definition dp3m.cpp:173

anonymous_namespace{dp3m.cpp}::AssignDipole::operator()
void operator()(dp3m_data_struct &dp3m, Utils::Vector3d const &real_pos, Utils::Vector3d const &dip) const
Definition dp3m.cpp:174

anonymous_namespace{dp3m.cpp}::AssignForces
Definition dp3m.cpp:231

anonymous_namespace{dp3m.cpp}::AssignForces::operator()
void operator()(dp3m_data_struct const &dp3m, double prefac, int d_rs, ParticleRange const &particles) const
Definition dp3m.cpp:232

anonymous_namespace{dp3m.cpp}::AssignTorques
Definition dp3m.cpp:207

anonymous_namespace{dp3m.cpp}::AssignTorques::operator()
void operator()(dp3m_data_struct const &dp3m, double prefac, int d_rs, ParticleRange const &particles) const
Definition dp3m.cpp:208

dp3m_data_struct
Definition dp3m.hpp:62

dp3m_data_struct::sm
p3m_send_mesh sm
send/recv mesh sizes
Definition dp3m.hpp:86

dp3m_data_struct::local_mesh
P3MLocalMesh local_mesh
local mesh.
Definition dp3m.hpp:67

dp3m_data_struct::fft
fft_data_struct fft
Definition dp3m.hpp:91

dp3m_data_struct::rs_mesh
fft_vector< double > rs_mesh
real space mesh (local) for CA/FFT.
Definition dp3m.hpp:69

dp3m_data_struct::sum_mu2
double sum_mu2
Sum of square of magnetic dipoles (only on head node).
Definition dp3m.hpp:78

dp3m_data_struct::rs_mesh_dip
std::array< fft_vector< double >, 3 > rs_mesh_dip
real space mesh (local) for CA/FFT of the dipolar field.
Definition dp3m.hpp:71

dp3m_data_struct::sum_dip_part
int sum_dip_part
number of dipolar particles (only on head node).
Definition dp3m.hpp:76

dp3m_data_struct::inter_weights
p3m_interpolation_cache inter_weights
Definition dp3m.hpp:83

dp3m_data_struct::ks_mesh
std::vector< double > ks_mesh
k-space mesh (local) for k-space calculation and FFT.
Definition dp3m.hpp:73

dp3m_data_struct::energy_correction
double energy_correction
cached k-space self-energy correction
Definition dp3m.hpp:89

fft_data_struct::plan
fft_forw_plan plan[4]
Information for forward FFTs.
Definition fft.hpp:154

fft_forw_plan::start
int start[3]
lower left point of local FFT mesh in global FFT mesh coordinates.
Definition fft.hpp:111

fft_forw_plan::new_mesh
int new_mesh[3]
size of local mesh after communication, also used for actual FFT.
Definition fft.hpp:109

p3m_data_struct_base::g_energy
std::vector< double > g_energy
Energy optimised influence function (k-space)
Definition data_struct.hpp:45

p3m_data_struct_base::params
P3MParameters params
Definition data_struct.hpp:37

p3m_data_struct_base::calc_differential_operator
void calc_differential_operator()
Calculate the Fourier transformed differential operator.
Definition data_struct.hpp:54

p3m_data_struct_base::d_op
std::array< std::vector< int >, 3 > d_op
Spatial differential operator in k-space.
Definition data_struct.hpp:41

p3m_data_struct_base::g_force
std::vector< double > g_force
Force optimised influence function (k-space)
Definition data_struct.hpp:43

p3m_data_struct_base::ks_pnum
int ks_pnum
number of permutations in k_space
Definition data_struct.hpp:48

tuning.hpp