26#include "communication.hpp"
29#include "system/System.hpp"
36#include <boost/container/flat_set.hpp>
37#include <boost/mpi/collectives/all_reduce.hpp>
38#include <boost/mpi/communicator.hpp>
39#include <boost/mpi/request.hpp>
40#include <boost/range/algorithm/reverse.hpp>
41#include <boost/range/numeric.hpp>
48#include <initializer_list>
53int RegularDecomposition::position_to_cell_index(
57 for (
auto i = 0u; i < 3u; i++) {
58 cpos[i] =
static_cast<int>(std::floor(pos[i] *
inv_cell_size[i])) + 1 -
84void RegularDecomposition::move_if_local(
86 std::vector<ParticleChange> &modified_cells) {
87 for (
auto &part : src) {
88 auto target_cell = position_to_cell(part.pos());
91 target_cell->particles().insert(std::move(part));
92 modified_cells.emplace_back(
ModifiedList{target_cell->particles()});
94 rest.
insert(std::move(part));
101void RegularDecomposition::move_left_or_right(
ParticleList &src,
107 auto const can_move_left =
m_box.
periodic(dir) or not is_open_boundary_left;
108 auto const can_move_right =
m_box.
periodic(dir) or not is_open_boundary_right;
111 for (
auto it = src.
begin(); it != src.
end();) {
112 auto const pos = it->pos()[dir];
114 right.
insert(std::move(*it));
117 left.
insert(std::move(*it));
125void RegularDecomposition::exchange_neighbors(
126 ParticleList &pl, std::vector<ParticleChange> &modified_cells) {
127 auto const node_neighbors = Utils::Mpi::cart_neighbors<3>(
m_comm);
128 static ParticleList send_buf_l, send_buf_r, recv_buf_l, recv_buf_r;
130 for (
int dir = 0; dir < 3; dir++) {
132 if (Utils::Mpi::cart_get<3>(
m_comm).dims[dir] == 1) {
137 if (Utils::Mpi::cart_get<3>(
m_comm).dims[dir] == 2) {
138 move_left_or_right(pl, send_buf_l, send_buf_l, dir);
141 node_neighbors[2 * dir], 0, recv_buf_l);
145 using boost::mpi::request;
148 move_left_or_right(pl, send_buf_l, send_buf_r, dir);
151 node_neighbors[2 * dir], 0, recv_buf_l);
152 auto req_r =
isendrecv(
m_comm, node_neighbors[2 * dir + 1], 0, send_buf_r,
153 node_neighbors[2 * dir + 1], 0, recv_buf_r);
155 std::array<request, 4> reqs{{req_l[0], req_l[1], req_r[0], req_r[1]}};
156 boost::mpi::wait_all(reqs.begin(), reqs.end());
162 move_if_local(recv_buf_l, pl, modified_cells);
163 move_if_local(recv_buf_r, pl, modified_cells);
177 std::vector<ParticleChange> &diff) {
181 for (
auto it = c->particles().begin(); it != c->particles().end();) {
187 if (target_cell == c) {
192 auto p = std::move(*it);
193 it = c->particles().erase(it);
197 if (target_cell ==
nullptr) {
199 displaced_parts.
insert(std::move(p));
202 else if (target_cell != c) {
203 target_cell->particles().insert(std::move(p));
204 diff.emplace_back(
ModifiedList{target_cell->particles()});
210 auto const grid = Utils::Mpi::cart_get<3>(
m_comm).dims;
214 int rounds_left = grid[0] + grid[1] + grid[2] - 3;
215 for (; rounds_left > 0; rounds_left--) {
216 exchange_neighbors(displaced_parts, diff);
218 auto left_over = boost::mpi::all_reduce(
m_comm, displaced_parts.
size(),
219 std::plus<std::size_t>());
221 if (left_over == 0) {
226 exchange_neighbors(displaced_parts, diff);
229 if (not displaced_parts.
empty()) {
232 for (
auto &part : displaced_parts) {
234 <<
"than one local box length in one timestep";
235 sort_cell->particles().insert(std::move(part));
237 diff.emplace_back(
ModifiedList{sort_cell->particles()});
242void RegularDecomposition::mark_cells() {
258void RegularDecomposition::fill_comm_cell_lists(
ParticleList **part_lists,
261 for (
int o = lc[0]; o <= hc[0]; o++)
262 for (
int n = lc[1]; n <= hc[1]; n++)
263 for (
int m = lc[2]; m <= hc[2]; m++) {
266 *part_lists++ = &(
cells.at(i).particles());
271 auto dir_max_range = [
this](
unsigned int i) {
275 return {dir_max_range(0u), dir_max_range(1u), dir_max_range(2u)};
279int RegularDecomposition::calc_processor_min_num_cells()
const {
285 return boost::accumulate(Utils::Mpi::cart_get<3>(
m_comm).dims, 1,
286 [](
int n_cells,
int grid) {
287 return (grid == 1) ? 2 * n_cells : n_cells;
291void RegularDecomposition::create_cell_grid(
double range) {
292 auto const cart_info = Utils::Mpi::cart_get<3>(
m_comm);
296 auto const min_num_cells = calc_processor_min_num_cells();
300 auto const cells_per_dir =
301 static_cast<int>(std::ceil(std::cbrt(min_num_cells)));
309 auto const scale = std::cbrt(RegularDecomposition::max_num_cells / volume);
311 for (
auto i = 0u; i < 3u; i++) {
313 cell_grid[i] =
static_cast<int>(std::ceil(local_box_l[i] * scale));
314 cell_range[i] = local_box_l[i] /
static_cast<double>(
cell_grid[i]);
316 if (cell_range[i] < range) {
318 cell_grid[i] =
static_cast<int>(std::floor(local_box_l[i] / range));
321 <<
"interaction range " << range <<
" in direction " << i
322 <<
" is larger than the local box size " << local_box_l[i];
325 cell_range[i] = local_box_l[i] /
static_cast<double>(
cell_grid[i]);
337 if (n_local_cells <= RegularDecomposition::max_num_cells)
342 auto min_size = cell_range[0];
344 for (
auto i = 1u; i < 3u; ++i) {
345 if (
cell_grid[i] > 1 and cell_range[i] < min_size) {
347 min_size = cell_range[i];
356 if (n_local_cells < min_num_cells) {
358 <<
" is smaller than minimum " << min_num_cells
359 <<
": either interaction range is too large for "
360 <<
"the current skin (range=" << range <<
", "
361 <<
"half_local_box_l=[" << local_box_l / 2. <<
"]) "
362 <<
"or min_num_cells too large";
366 if (n_local_cells > RegularDecomposition::max_num_cells) {
370 auto const node_pos = cart_info.coords;
374 for (
auto i = 0u; i < 3u; i++) {
384 cells.resize(
static_cast<unsigned int>(new_cells));
390 return boost::container::flat_set<K, std::remove_reference_t<Comparator>>(
391 std::forward<Comparator>(comp));
394void RegularDecomposition::init_cell_interactions() {
399 auto const cart_info = Utils::Mpi::cart_get<3>(
m_comm);
401 auto const &node_pos = cart_info.coords;
410 return (cell_idx[
coord] == 0 or cell_idx[
coord] == global_size[
coord] - 1);
416 auto const fcb_is_inner_connection = [&global_size,
this](
Utils::Vector3i a,
420 auto const involves_ghost_cell =
421 (a[fc_normal] == -1 or a[fc_normal] == global_size[fc_normal] or
422 b[fc_normal] == -1 or b[fc_normal] == global_size[fc_normal]);
423 if (not involves_ghost_cell) {
425 return std::abs((a - b)[fc_dir]) > 1;
435 return (global_halo_offset + local_index);
440 auto const folded_index = (global_index + global_size) % global_size;
448 return (global_index - global_halo_offset);
454 if (fc_normal == fc_dir) {
455 throw std::domain_error(
"fully_connected_boundary normal and connection "
456 "coordinates need to differ.");
458 if (node_grid[fc_dir] != 1) {
459 throw std::runtime_error(
460 "The MPI nodegrid must be 1 in the fully connected direction.");
463 throw std::runtime_error(
464 "The fully connected boundary requires periodicity in the "
465 "boundary normal direction.");
477 for (
int o = start[2]; o < end[2]; o++)
478 for (
int n = start[1]; n < end[1]; n++)
479 for (
int m = start[0]; m < end[0]; m++) {
491 if (at_boundary(fc_boundary, {m, n, o})) {
492 lower_index[fc_direction] = -1;
493 upper_index[fc_direction] = global_size[fc_direction];
499 for (
auto i = 0u; i < 3u; i++) {
501 lower_index[i] = std::max(0, lower_index[i]);
502 upper_index[i] = std::min(global_size[i] - 1, upper_index[i]);
508 auto neighbors = make_flat_set<Utils::Vector3i>(
510 return folded_linear_index(a) < folded_linear_index(b);
514 for (
int p = lower_index[2]; p <= upper_index[2]; p++)
515 for (
int q = lower_index[1]; q <= upper_index[1]; q++)
516 for (
int r = lower_index[0]; r <= upper_index[0]; r++) {
520 if (fcb_is_inner_connection({m, n, o}, {r, q, p}))
527 auto const ind1 = folded_linear_index({m, n, o});
529 std::vector<Cell *> red_neighbors;
530 std::vector<Cell *> black_neighbors;
536 for (
auto &neighbor : neighbors) {
538 for (
auto coord : {0u, 1u, 2u}) {
539 if (neighbor[
coord] == -1) {
546 auto const ind2 = folded_linear_index(neighbor);
551 auto cell = &
cells.at(
556 red_neighbors.push_back(cell);
558 black_neighbors.push_back(cell);
584 boost::reverse(c.part_lists);
595 auto next = std::next(it);
613 int dir, lr, i, cnt, n_comm_cells[3];
616 auto const comm_info = Utils::Mpi::cart_get<3>(
m_comm);
617 auto const node_neighbors = Utils::Mpi::cart_neighbors<3>(
m_comm);
621 for (dir = 0; dir < 3; dir++) {
622 for (lr = 0; lr < 2; lr++) {
624 if (comm_info.dims[dir] == 1)
641 for (dir = 0; dir < 3; dir++) {
642 lc[(dir + 1) % 3] = 1 - done[(dir + 1) % 3];
643 lc[(dir + 2) % 3] = 1 - done[(dir + 2) % 3];
644 hc[(dir + 1) % 3] =
cell_grid[(dir + 1) % 3] + done[(dir + 1) % 3];
645 hc[(dir + 2) % 3] =
cell_grid[(dir + 2) % 3] + done[(dir + 2) % 3];
650 for (lr = 0; lr < 2; lr++) {
651 if (comm_info.dims[dir] == 1) {
653 ghost_comm.communications[cnt].type =
GHOST_LOCL;
654 ghost_comm.communications[cnt].node =
m_comm.rank();
657 ghost_comm.communications[cnt].part_lists.resize(2 * n_comm_cells[dir]);
660 lc[dir] = hc[dir] = 1 + lr * (
cell_grid[dir] - 1);
662 fill_comm_cell_lists(ghost_comm.communications[cnt].part_lists.data(),
666 lc[dir] = hc[dir] = 0 + (1 - lr) * (
cell_grid[dir] + 1);
669 fill_comm_cell_lists(
670 &ghost_comm.communications[cnt].part_lists[n_comm_cells[dir]], lc,
676 for (i = 0; i < 2; i++) {
677 if ((comm_info.coords[dir] + i) % 2 == 0) {
678 ghost_comm.communications[cnt].type =
GHOST_SEND;
679 ghost_comm.communications[cnt].node = node_neighbors[2 * dir + lr];
680 ghost_comm.communications[cnt].part_lists.resize(n_comm_cells[dir]);
683 lc[dir] = hc[dir] = 1 + lr * (
cell_grid[dir] - 1);
685 fill_comm_cell_lists(
686 ghost_comm.communications[cnt].part_lists.data(), lc, hc);
689 if ((comm_info.coords[dir] + (1 - i)) % 2 == 0) {
690 ghost_comm.communications[cnt].type =
GHOST_RECV;
691 ghost_comm.communications[cnt].node =
692 node_neighbors[2 * dir + (1 - lr)];
693 ghost_comm.communications[cnt].part_lists.resize(n_comm_cells[dir]);
695 lc[dir] = hc[dir] = (1 - lr) * (
cell_grid[dir] + 1);
697 fill_comm_cell_lists(
698 ghost_comm.communications[cnt].part_lists.data(), lc, hc);
711 boost::mpi::communicator comm,
double range,
BoxGeometry const &box_geo,
713 std::optional<std::pair<int, int>> fully_connected)
714 : m_comm(
std::move(comm)), m_box(box_geo), m_local_box(local_geo),
715 m_fully_connected_boundary(
std::move(fully_connected)) {
718 create_cell_grid(range);
721 init_cell_interactions();
static int coord(std::string const &s)
auto make_flat_set(Comparator &&comp)
static void fold_and_reset(Particle &p, BoxGeometry const &box_geo)
Fold coordinates to box and reset the old position.
Vector implementation and trait types for boost qvm interoperability.
T get_mi_coord(T a, T b, unsigned coord) const
Get the minimum-image distance between two coordinates.
Utils::Vector3d const & length() const
Box length.
constexpr bool periodic(unsigned coord) const
Check periodicity in direction.
void fold_position(Utils::Vector3d &pos, Utils::Vector3i &image_box) const
Fold coordinates to primary simulation box in-place.
auto const & my_right() const
Right (top, back) corner of this node's local box.
auto const & boundary() const
Boundary information for the local box.
auto const & my_left() const
Left (bottom, front) corner of this node's local box.
auto const & length() const
Dimensions of the box a single node is responsible for.
void clear()
Remove all elements from the container.
bool empty() const
Is the container empty?
T & insert(T const &v)
Insert an element into the container.
iterator erase(iterator it)
Remove element from the list.
std::size_t size() const
Number of elements in the container.
DEVICE_QUALIFIER constexpr size_type size() const noexcept
static DEVICE_QUALIFIER constexpr Vector< T, N > broadcast(typename Base::value_type const &value) noexcept
Create a vector that has all entries set to the same value.
Communicator communicator
This file contains the error-handling code for severe errors, like a broken bond or illegal parameter ...
#define runtimeErrorMsg()
#define GHOST_RECV
recv from a single node
#define GHOST_PSTSTORE
additional flag for poststoring
#define GHOST_LOCL
transfer data from cell to cell on this node
#define GHOST_SEND
send to a single node
#define GHOST_PREFETCH
additional flag for prefetching
std::array< mpi::request, 2 > isendrecv(mpi::communicator const &comm, int dest, int stag, const T &sval, int src, int rtag, T &rval)
mpi::status sendrecv(mpi::communicator const &comm, int dest, int stag, const T &sval, int src, int rtag, T &rval)
T product(Vector< T, N > const &v)
int get_linear_index(int a, int b, int c, const Vector3i &adim)
auto hadamard_product(Vector< T, N > const &a, Vector< U, N > const &b)
void assign_prefetches(GhostCommunicator &comm)
Of every two communication rounds, set the first receivers to prefetch and poststore.
void revert_comm_order(GhostCommunicator &comm)
Revert the order of a communicator: After calling this the communicator is working in reverted order ...
Utils::Vector3i node_grid
Properties for a ghost communication.
std::vector< GhostCommunication > communications
List of ghost communications.
Struct holding all information for one particle.
auto & pos_at_last_verlet_update()
auto const & image_box() const
GhostCommunicator m_exchange_ghosts_comm
Utils::Vector3i ghost_cell_grid
linked cell grid with ghost frame.
Utils::Vector3d max_cutoff() const override
Utils::Vector3d inv_cell_size
inverse cell_size.
std::vector< Cell * > m_ghost_cells
BoxGeometry const & m_box
Cell * particle_to_cell(Particle const &p) override
auto fully_connected_boundary() const
void resort(bool global, std::vector< ParticleChange > &diff) override
std::vector< Cell > cells
RegularDecomposition(boost::mpi::communicator comm, double range, BoxGeometry const &box_geo, LocalBox const &local_geo, std::optional< std::pair< int, int > > fully_connected)
Utils::Vector3d cell_size
Cell size.
std::span< Cell *const > local_cells() const override
std::vector< Cell * > m_local_cells
Utils::Vector3d max_range() const override
GhostCommunicator m_collect_ghost_force_comm
Utils::Vector3i cell_grid
Grid dimensions per node.
Utils::Vector3i cell_offset
Offset in global grid.
boost::mpi::communicator m_comm