dox/GpuParticleData_8cpp_source.html

/*

 * Copyright (C) 2014-2022 The ESPResSo project

 *

 * This file is part of ESPResSo.

 *

 * ESPResSo is free software: you can redistribute it and/or modify

 * it under the terms of the GNU General Public License as published by

 * the Free Software Foundation, either version 3 of the License, or

 * (at your option) any later version.

 *

 * ESPResSo is distributed in the hope that it will be useful,

 * but WITHOUT ANY WARRANTY; without even the implied warranty of

 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

 * GNU General Public License for more details.

 *

 * You should have received a copy of the GNU General Public License

 * along with this program.  If not, see <http://www.gnu.org/licenses/>.

 */


#include "config/config.hpp"


#ifdef CUDA


#include "GpuParticleData.hpp"


#include "cell_system/CellStructure.hpp"

#include "communication.hpp"

#include "cuda/CudaHostAllocator.hpp"

#include "system/System.hpp"


#include <utils/Vector.hpp>

#include <utils/mpi/gather_buffer.hpp>

#include <utils/mpi/scatter_buffer.hpp>


#include <boost/serialization/array.hpp>

#include <boost/serialization/is_bitwise_serializable.hpp>

#include <boost/serialization/split_free.hpp>


#include <cstddef>

#include <span>

#include <vector>


/**
 * @brief Turn on particle communication if it was requested and is still off.
 *
 * Does nothing unless @c m_need_particles_update is set and
 * @c m_communication_enabled is still unset. Otherwise the rank with
 * <tt>this_node == 0</tt> calls @c gpu_init_particle_comm(), and every rank
 * records that communication is enabled.
 */
void GpuParticleData::enable_particle_transfer() {
  // Bail out when no update is needed or the transfer is already enabled.
  if (not m_need_particles_update or m_communication_enabled) {
    return;
  }
  // The initialization routine is only invoked on rank 0.
  if (::this_node == 0) {
    gpu_init_particle_comm();
  }
  m_communication_enabled = true;
}


/**
 * @brief Copy the local particles of the current system to the device.
 *
 * Forwards the local particle range of the system's cell structure, together
 * with the rank of this node, to the two-argument overload.
 */
void GpuParticleData::copy_particles_to_device() {
  auto const &espresso_system = System::get_system();
  auto const &local_cells = *espresso_system.cell_structure;
  copy_particles_to_device(local_cells.local_particles(), ::this_node);
}


/**
 * @brief Check for a compatible device and share the answer with all ranks.
 *
 * Only rank 0 evaluates @c has_compatible_device_impl(); all other ranks
 * start from @c false. The value of rank 0 is then broadcast over
 * @c comm_cart, so every rank returns the same result.
 *
 * @return The result obtained on rank 0.
 */
bool GpuParticleData::has_compatible_device() const {
  // Short-circuit: the implementation is only queried on rank 0.
  bool compatible = (::this_node == 0) and has_compatible_device_impl();
  boost::mpi::broadcast(::comm_cart, compatible, 0);
  return compatible;
}

bool GpuParticleData::has_compatible_device() const  {…}


/* Mark GpuParticle as bitwise serializable for Boost.Serialization. */
BOOST_IS_BITWISE_SERIALIZABLE(GpuParticleData::GpuParticle)


namespace boost {

namespace serialization {

/**
 * @brief Read a @c GpuParticle from an archive as a raw block of bytes.
 *
 * @param ar Archive to read from.
 * @param p  Particle whose storage is overwritten with
 *           <tt>sizeof(GpuParticleData::GpuParticle)</tt> bytes.
 */
template <typename Archive>
void load(Archive &ar, GpuParticleData::GpuParticle &p, unsigned const) {
  constexpr auto n_bytes = sizeof(GpuParticleData::GpuParticle);
  auto *const raw_bytes = reinterpret_cast<char *>(&p);
  ar >> make_array(raw_bytes, n_bytes);
}

void load(Archive &ar, GpuParticleData::GpuParticle &p, unsigned const) {…}

/**
 * @brief Write a @c GpuParticle to an archive as a raw block of bytes.
 *
 * @param ar Archive to write to.
 * @param p  Particle whose storage is written out as
 *           <tt>sizeof(GpuParticleData::GpuParticle)</tt> bytes.
 */
template <typename Archive>
void save(Archive &ar, GpuParticleData::GpuParticle const &p, unsigned const) {
  constexpr auto n_bytes = sizeof(GpuParticleData::GpuParticle);
  auto const *const raw_bytes = reinterpret_cast<char const *>(&p);
  ar << make_array(raw_bytes, n_bytes);
}

void save(Archive &ar, GpuParticleData::GpuParticle const &p, unsigned const) {…}

} // namespace serialization

} // namespace boost


/* Serialize GpuParticle through the separate free load() and save()
 * functions in namespace boost::serialization. */
BOOST_SERIALIZATION_SPLIT_FREE(GpuParticleData::GpuParticle)


/**
 * @brief Fill a buffer of @c GpuParticle entries from a range of particles.
 *
 * One entry is written per particle, in iteration order: the position folded
 * by the box geometry of the current system, the particle id and, depending
 * on the compiled-in features, the dipole moment (DIPOLES) and the charge
 * (ELECTROSTATICS).
 *
 * @param particles The particles to pack.
 * @param buffer    Destination array; must provide at least
 *                  <tt>particles.size()</tt> entries.
 */
static void pack_particles(ParticleRange const &particles,
                           GpuParticleData::GpuParticle *buffer) {
  auto const &box_geo = *System::get_system().box_geo;
  auto *cursor = buffer;
  for (auto const &part : particles) {
    auto &entry = *cursor;
    entry.p = static_cast<Utils::Vector3f>(box_geo.folded_position(part.pos()));
#ifdef DIPOLES
    entry.dip = static_cast<Utils::Vector3f>(part.calc_dip());
#endif
#ifdef ELECTROSTATICS
    entry.q = static_cast<float>(part.q());
#endif
    entry.identity = part.id();
    ++cursor;
  }
}

static void pack_particles(ParticleRange const &particles, {…}


/**
 * @brief Pack the local particles and gather them via @c comm_cart.
 *
 * Ranks with <tt>this_node > 0</tt> pack their particles into a function-local
 * static buffer and pass it to the gather operation. Any other rank packs
 * directly into @p particle_data_host and passes that container to the
 * gather operation.
 *
 * @param particles          The local particles to pack.
 * @param particle_data_host Host container, resized and used when
 *                           @p this_node is not positive.
 * @param this_node          Rank of the calling node.
 */
void GpuParticleData::gather_particle_data(
    ParticleRange const &particles,
    pinned_vector<GpuParticle> &particle_data_host, int this_node) {
  auto const n_local = particles.size();

  if (this_node <= 0) {
    /* pack own particles straight into the host container */
    particle_data_host.resize(n_local);
    pack_particles(particles, particle_data_host.data());
    Utils::Mpi::gather_buffer(particle_data_host, comm_cart);
    return;
  }

  /* pack local particles into a reusable send buffer */
  static std::vector<GpuParticle> send_buffer;
  send_buffer.resize(n_local);
  pack_particles(particles, send_buffer.data());
  Utils::Mpi::gather_buffer(send_buffer, comm_cart);
}


/**
 * @brief Accumulate flat force (and torque) arrays onto a range of particles.
 *
 * The three components belonging to the n-th particle of the range are read
 * from positions <tt>3 * n</tt> to <tt>3 * n + 2</tt> of each array.
 *
 * @param particles The particles receiving the forces (and torques).
 * @param forces    Flat force array with 3 * particles.size() elements.
 * @param torques   Flat torque array with 3 * particles.size() elements;
 *                  only read when ROTATION is active.
 */
static void add_forces_and_torques(ParticleRange const &particles,
                                   std::span<const float> forces,
                                   std::span<const float> torques) {
  // Index of the first component of the current particle in the flat arrays.
  std::size_t offset = 0ul;
  for (auto &p : particles) {
    for (std::size_t axis = 0ul; axis < 3ul; ++axis) {
      p.force()[axis] += static_cast<double>(forces[offset + axis]);
#ifdef ROTATION
      p.torque()[axis] += static_cast<double>(torques[offset + axis]);
#endif
    }
    offset += 3ul;
  }
}

static void add_forces_and_torques(ParticleRange const &particles, {…}


/**
 * @brief Scatter forces (and torques) over @c comm_cart and add them to the
 *        local particles.
 *
 * Ranks with <tt>this_node > 0</tt> receive their share into function-local
 * static buffers; any other rank passes the host arrays to the scatter
 * operation. In both cases the forces are scattered first, followed by the
 * torques when ROTATION is active, and the received values are then added
 * to @p particles.
 *
 * @param particles    The particles to which the forces (and torques) are
 *                     added.
 * @param host_forces  The forces as flat array of size 3 * particles.size(),
 *                     only used when <tt>this_node</tt> is not positive.
 * @param host_torques The torques as flat array of size 3 * particles.size(),
 *                     only touched if ROTATION is active and
 *                     <tt>this_node</tt> is not positive.
 */
void GpuParticleData::particles_scatter_forces(
    ParticleRange const &particles, std::span<float> host_forces,
    std::span<float> host_torques) const {

  auto const n_floats = 3ul * particles.size();
  auto const n_elements = static_cast<int>(n_floats);

  if (not(::this_node > 0)) {
    Utils::Mpi::scatter_buffer(host_forces.data(), n_elements, ::comm_cart);
#ifdef ROTATION
    Utils::Mpi::scatter_buffer(host_torques.data(), n_elements, ::comm_cart);
#endif
    add_forces_and_torques(particles, host_forces, host_torques);
    return;
  }

  /* receive buffers, kept between calls */
  static std::vector<float> recv_forces;
  static std::vector<float> recv_torques;

  recv_forces.resize(n_floats);
  Utils::Mpi::scatter_buffer(recv_forces.data(), n_elements, ::comm_cart);
#ifdef ROTATION
  recv_torques.resize(n_floats);
  Utils::Mpi::scatter_buffer(recv_torques.data(), n_elements, ::comm_cart);
#endif
  add_forces_and_torques(particles, recv_forces, recv_torques);
}


#endif

CellStructure.hpp

CudaHostAllocator.hpp

pinned_vector
std::vector< T, CudaHostAllocator< T > > pinned_vector
Definition CudaHostAllocator.hpp:64

add_forces_and_torques
static void add_forces_and_torques(ParticleRange const &particles, std::span< const float > forces, std::span< const float > torques)
Add a flat force (and torque) array to a range of particles.
Definition GpuParticleData.cpp:132

pack_particles
static void pack_particles(ParticleRange const &particles, GpuParticleData::GpuParticle *buffer)
Definition GpuParticleData.cpp:85

GpuParticleData.hpp

Vector.hpp
Vector implementation and trait types for boost qvm interoperability.

GpuParticleData
Particle data communication manager for the GPU.
Definition GpuParticleData.hpp:51

GpuParticleData::has_compatible_device
bool has_compatible_device() const
Definition GpuParticleData.cpp:57

ParticleRange
A range of particles.
Definition ParticleRange.hpp:38

ParticleRange::size
base_type::size_type size() const
Definition ParticleRange.hpp:44

System::System::cell_structure
std::shared_ptr< CellStructure > cell_structure
Definition core/system/System.hpp:314

System::System::box_geo
std::shared_ptr< BoxGeometry > box_geo
Definition core/system/System.hpp:312

Utils::Vector
Definition Vector.hpp:49

comm_cart
boost::mpi::communicator comm_cart
The communicator.
Definition communication.cpp:52

this_node
int this_node
The number of this node.
Definition communication.cpp:74

config.hpp
This file contains the defaults for ESPResSo.

gather_buffer.hpp

Cells::particles
ParticleRange particles(std::span< Cell *const > cells)
Definition CellStructure.hpp:95

System::get_system
System & get_system()
Definition core/system/System.cpp:126

Utils::Mpi::gather_buffer
void gather_buffer(std::vector< T, Allocator > &buffer, boost::mpi::communicator const &comm, int root=0)
Gather buffer with different size on each node.
Definition gather_buffer.hpp:54

Utils::Mpi::scatter_buffer
void scatter_buffer(T *buffer, int n_elem, boost::mpi::communicator comm, int root=0)
Scatter buffer with different size on each node.
Definition scatter_buffer.hpp:44

boost::serialization::load
void load(Archive &ar, GpuParticleData::GpuParticle &p, unsigned const)
Definition GpuParticleData.cpp:71

boost::serialization::save
void save(Archive &ar, GpuParticleData::GpuParticle const &p, unsigned const)
Definition GpuParticleData.cpp:76

boost
Definition core/accumulators/AccumulatorBase.hpp:28

scatter_buffer.hpp

GpuParticleData::GpuParticle
Subset of Particle which is copied to the GPU.
Definition GpuParticleData.hpp:69