ESPResSo
Extensible Simulation Package for Research on Soft Matter Systems
Loading...
Searching...
No Matches
LBWalberlaImpl.hpp
Go to the documentation of this file.
1/*
2 * Copyright (C) 2019-2026 The ESPResSo project
3 *
4 * This file is part of ESPResSo.
5 *
6 * ESPResSo is free software: you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation, either version 3 of the License, or
9 * (at your option) any later version.
10 *
11 * ESPResSo is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU General Public License for more details.
15 *
16 * You should have received a copy of the GNU General Public License
17 * along with this program. If not, see <http://www.gnu.org/licenses/>.
18 */
19
20#pragma once
21
22/**
23 * @file
24 * @ref walberla::LBWalberlaImpl implements the interface of the LB
25 * waLBerla bridge using sweeps generated by lbmpy
26 * (see <tt>maintainer/walberla_kernels</tt>).
27 */
28
29#include <blockforest/Initialization.h>
30#include <blockforest/StructuredBlockForest.h>
31#include <domain_decomposition/BlockDataID.h>
32#include <domain_decomposition/IBlock.h>
33#include <field/AddToStorage.h>
34#include <field/vtk/FlagFieldCellFilter.h>
35#include <field/vtk/VTKWriter.h>
36#include <stencil/D3Q19.h>
37#include <stencil/D3Q27.h>
38#include <waLBerlaDefinitions.h>
39#if defined(__CUDACC__) and defined(WALBERLA_BUILD_WITH_CUDA)
40#include <gpu/AddGPUFieldToStorage.h>
41#endif
42
43#include "../BoundaryHandling.hpp"
44#include "../BoundaryPackInfo.hpp"
45#include "../utils/boundary.hpp"
46#include "../utils/types_conversion.hpp"
48#include "ResetForce.hpp"
49#include "lb_fields.hpp"
50#include "lb_kernels.hpp"
51#if defined(__CUDACC__) and defined(WALBERLA_BUILD_WITH_CUDA)
52#include "lb_fields.cuh"
53#include "lb_kernels.cuh"
54#endif
55
63
64#include <utils/Vector.hpp>
65
66#include <array>
67#include <bitset>
68#include <cstddef>
69#include <functional>
70#include <initializer_list>
71#include <limits>
72#include <memory>
73#include <optional>
74#include <stdexcept>
75#include <string>
76#include <type_traits>
77#include <utility>
78#include <variant>
79#include <vector>
80
81namespace walberla {
82
83/** @brief Class that runs and controls the LB on waLBerla. */
84template <typename FloatType, lbmpy::Arch Architecture>
86#if not defined(WALBERLA_BUILD_WITH_CUDA)
87 static_assert(Architecture != lbmpy::Arch::GPU,
88 "waLBerla was compiled without CUDA support");
89#endif
90protected:
91 // ---- Types & Constants ----
92
93 using Kernels = detail::KernelTrait<FloatType, Architecture>;
95 typename Kernels::DynamicUBB>;
97 std::variant<typename Kernels::StreamCollisionModelThermalized,
99
100public:
101 /** @brief Stencil for collision and streaming operations. */
102 using Stencil = stencil::D3Q19;
103 /** @brief Stencil for ghost communication (includes domain corners). */
104 using StencilFull = stencil::D3Q27;
105 /** @brief Lattice model (e.g. blockforest). */
107
108protected:
109 // "underlying" field types (`GPUField` has no f-size info at compile time)
112
113public:
117#if defined(__CUDACC__) and defined(WALBERLA_BUILD_WITH_CUDA)
118 using GPUField = gpu::GPUField<FloatType>;
119#endif
120
121 struct GhostComm {
122 /** @brief Ghost communication operations. */
123 enum GhostCommFlags : unsigned {
124 PDF, ///< PDFs communication
125 VEL, ///< velocities communication
126 LAF, ///< last applied forces communication
127 UBB, ///< boundaries communication
128 SIZE
129 };
130 };
131
132protected:
133 /**
134 * @brief Full communicator.
135 * We use the D3Q27 directions to update cells along the diagonals during
136 * a full ghost communication. This is needed to properly update the corners
137 * of the ghost layer when setting cell velocities or populations.
138 */
140 FieldTrait<FloatType, Stencil,
141 Architecture>::template RegularCommScheme<stencil::D3Q27>;
143 FieldTrait<FloatType, Stencil,
144 Architecture>::template BoundaryCommScheme<stencil::D3Q27>;
145 /**
146 * @brief Regular communicator.
147 * We use the same directions as the stencil during integration.
148 */
150 FieldTrait<FloatType, Stencil,
151 Architecture>::template RegularCommScheme<Stencil>;
152 template <class Field>
153 using PackInfo =
155
156protected:
157 // ---- Member Variables ----
158
159 // Physical parameters
160 FloatType m_viscosity; /// kinematic viscosity
161 FloatType m_density;
162 FloatType m_kT;
163 unsigned int m_seed;
164 double m_zc_to_md; // zero-centered conversion factor to MD units
165 double m_zc_to_lb; // zero-centered conversion factor to LB units
166
167 // lattice
168 std::shared_ptr<LatticeWalberla> m_lattice;
169
170 // Block data access handles
171 BlockDataID m_pdf_field_id;
173 BlockDataID m_flag_field_id;
174
177
180
181 /** Flag for boundary cells. */
182 FlagUID const Boundary_flag{"boundary"};
183 bool m_has_boundaries{false};
184
185 // boundaries
186 std::shared_ptr<BoundaryModel> m_boundary;
187
188 // communicators
189 std::shared_ptr<BoundaryFullCommunicator> m_boundary_communicator;
190 std::shared_ptr<RegularFullCommunicator> m_full_communicator;
191 std::shared_ptr<RegularFullCommunicator> m_pdf_communicator;
192 std::shared_ptr<RegularFullCommunicator> m_vel_communicator;
193 std::shared_ptr<RegularFullCommunicator> m_laf_communicator;
194 std::shared_ptr<PDFStreamingCommunicator> m_pdf_streaming_communicator;
195 std::bitset<GhostComm::SIZE> m_pending_ghost_comm;
197
198 // collision sweep
199 std::shared_ptr<CollisionModel> m_collision_model;
200
201 // force reset sweep + external force handling
202 std::shared_ptr<ResetForce<PdfField, VectorField>> m_reset_force;
203
204 // velocity update sweep
205 std::shared_ptr<typename Kernels::UpdateVelFromPDF>
207
208 // Lees-Edwards boundary interpolation
209 std::shared_ptr<LeesEdwardsPack> m_lees_edwards_callbacks;
210 std::shared_ptr<InterpolateAndShiftAtBoundary<_PdfField, FloatType>>
212 std::shared_ptr<InterpolateAndShiftAtBoundary<_VectorField, FloatType>>
214 std::shared_ptr<InterpolateAndShiftAtBoundary<_VectorField, FloatType>>
216
217public:
218 template <typename T> FloatType FloatType_c(T t) const {
219 return numeric_cast<FloatType>(t);
220 }
221
222 [[nodiscard]] std::size_t stencil_size() const noexcept override {
223 return static_cast<std::size_t>(Stencil::Size);
224 }
225
226 [[nodiscard]] bool is_double_precision() const noexcept override {
227 return std::is_same_v<FloatType, double>;
228 }
229
230 [[nodiscard]] bool is_gpu() const noexcept override {
231 return Architecture == lbmpy::Arch::GPU;
232 }
233
234public:
235 LBWalberlaImpl(std::shared_ptr<LatticeWalberla> lattice, double viscosity,
236 double density)
238 m_kT(FloatType{0}), m_seed(0u), m_zc_to_md(density),
239 m_zc_to_lb(1. / density), m_lattice(std::move(lattice)),
241
242 auto const &blocks = m_lattice->get_blocks();
243 auto const n_ghost_layers = m_lattice->get_ghost_layers();
244 if (n_ghost_layers == 0u)
245 throw std::runtime_error("At least one ghost layer must be used");
246
247 // Initialize and register fields (must use the "underlying" types)
248 m_pdf_field_id = add_to_storage<_PdfField>("pdfs");
249 m_pdf_tmp_field_id = add_to_storage<_PdfField>("pdfs_tmp");
250 m_last_applied_force_field_id = add_to_storage<_VectorField>("force last");
251 m_force_to_be_applied_id = add_to_storage<_VectorField>("force next");
252 m_velocity_field_id = add_to_storage<_VectorField>("velocity");
253 m_vel_tmp_field_id = add_to_storage<_VectorField>("velocity_tmp");
254
255 // Initialize and register pdf field with zero centered density
256 auto pdf_setter = typename Kernels::InitialPDFsSetter(
258 for (auto &block : *blocks) {
259 pdf_setter(&block);
260 }
261
262 // Initialize and register flag field (fluid/boundary)
263 m_flag_field_id = field::addFlagFieldToStorage<FlagField>(
264 blocks, "flag field", n_ghost_layers);
265 // Initialize boundary sweep
266 reset_boundary_handling(m_lattice->get_blocks());
267
268 // Set up the communication and register fields
271
273
274 // Instantiate the sweep responsible for force double buffering and
275 // external forces
276 m_reset_force = std::make_shared<ResetForce<PdfField, VectorField>>(
278
279 // Instantiate velocity update sweep
281 std::make_shared<typename Kernels::UpdateVelFromPDF>(
283 }
284
285 ~LBWalberlaImpl() override = default;
286
287 // ---- Integration (Core LB Algorithm) ----
288
289 void integrate() override {
290 integrate_pull_scheme();
292 }
293
294protected:
295 void integrate_vtk_writers() override {
296 for (auto const &it : m_vtk_auto) {
297 auto &vtk_handle = it.second;
298 if (vtk_handle->enabled) {
299 vtk::writeFiles(vtk_handle->ptr)();
300 vtk_handle->execution_count++;
301 }
302 }
303 }
304
305private:
306 /**
307 * @brief One LB time step using the pull scheme.
308 * Sequence: reset forces, stream-collide, communicate PDFs,
309 * apply Lees-Edwards interpolation (if active), handle boundaries,
310 * update velocity field from PDFs.
311 */
312 void integrate_pull_scheme() {
314 auto const &blocks = get_lattice().get_blocks();
315 // Reset force fields
316 integrate_reset_force(blocks);
317 // LB stream collide
318 integrate_stream_collide(blocks);
319 // Mark pending ghost layer updates
320 // As pdf and laf are communicated directly afterwards, they are not set
323 m_pdf_streaming_communicator->communicate();
324 if (has_lees_edwards_bc()) {
325 apply_lees_edwards_pdf_interpolation(blocks);
326 apply_lees_edwards_last_applied_force_interpolation(blocks);
327 }
328 // Handle boundaries
329 if (m_has_boundaries) {
330 integrate_boundaries(blocks);
331 }
332 // Update velocities from pdfs
333 integrate_update_velocities_from_pdf(blocks);
334
335 if (has_lees_edwards_bc()) {
336 apply_lees_edwards_vel_interpolation_and_shift(blocks);
337 }
338 }
339
340 void integrate_stream_collide(std::shared_ptr<BlockStorage> const &blocks) {
341 auto &cm_variant = *m_collision_model;
342 for (auto &block : *blocks) {
343 auto const block_variant = std::variant<IBlock *>(&block);
344 std::visit(m_run_stream_collide_sweep, cm_variant, block_variant);
345 }
346 if (auto *cm =
347 std::get_if<typename Kernels::StreamCollisionModelThermalized>(
348 &cm_variant)) {
349 cm->setTime_step(cm->getTime_step() + 1u);
350 }
351 }
352
353 void integrate_reset_force(std::shared_ptr<BlockStorage> const &blocks) {
354 for (auto &block : *blocks)
355 (*m_reset_force)(&block);
356 }
357
358 void integrate_boundaries(std::shared_ptr<BlockStorage> const &blocks) {
359 for (auto &block : *blocks)
360 (*m_boundary)(&block);
361 }
362
363 void integrate_update_velocities_from_pdf(
364 std::shared_ptr<BlockStorage> const &blocks) {
365 for (auto &block : *blocks)
367 }
368
369private:
370 // ---- Collision Model ----
371
372 /**
373 * @brief Visitor for dispatching stream-collide sweeps.
374 * Handles both thermalized and Lees-Edwards collision models
375 * via @c std::visit on the @ref CollisionModel variant.
376 */
377 class StreamCollideSweepVisitor {
378 public:
379 using StructuredBlockStorage = LatticeWalberla::Lattice_T;
380
381 void operator()(typename Kernels::StreamCollisionModelThermalized &cm,
382 IBlock *b) {
383 cm.configure(m_storage, b);
384 cm(b);
385 }
386
387 void operator()(typename Kernels::StreamCollisionModelLeesEdwards &cm,
388 IBlock *b) {
389 cm.setV_s(static_cast<decltype(cm.getV_s())>(
390 m_lees_edwards_callbacks->get_shear_velocity()));
391 cm(b);
392 }
393
394 StreamCollideSweepVisitor() = default;
395 StreamCollideSweepVisitor(std::shared_ptr<StructuredBlockStorage> storage) {
396 m_storage = std::move(storage);
397 }
398 StreamCollideSweepVisitor(std::shared_ptr<StructuredBlockStorage> storage,
399 std::shared_ptr<LeesEdwardsPack> callbacks) {
400 m_storage = std::move(storage);
401 m_lees_edwards_callbacks = std::move(callbacks);
402 }
403
404 private:
405 std::shared_ptr<StructuredBlockStorage> m_storage{};
406 std::shared_ptr<LeesEdwardsPack> m_lees_edwards_callbacks{};
407 };
408 StreamCollideSweepVisitor m_run_stream_collide_sweep{};
409
410 /** @brief Relaxation rate omega from kinematic viscosity: 2/(6*nu+1). */
411 FloatType shear_mode_relaxation_rate() const;
412 /**
413 * @brief Odd-mode relaxation rate for the magic parameter relation.
414 * Ensures optimal bounce-back wall location for the two-relaxation-time
415 * model. Default magic number is 3/16.
416 */
417 FloatType odd_mode_relaxation_rate(
418 FloatType shear_relaxation,
419 FloatType magic_number = FloatType{3} / FloatType{16}) const;
420
421public:
422 void set_collision_model(double kT, unsigned int seed) override;
424 std::unique_ptr<LeesEdwardsPack> &&lees_edwards_pack) override;
425 void check_lebc(unsigned int shear_direction,
426 unsigned int shear_plane_normal) const override;
427
428public:
429 // ---- Ghost Communication ----
430
431 /**
432 * @brief Perform all pending ghost layer updates.
433 * Uses a lazy scheme: ghost communications are only executed when
434 * they have been marked as pending by a preceding write operation.
435 */
445
446 void ghost_communication_pdf() override {
449 m_pdf_communicator->communicate();
450 if (has_lees_edwards_bc()) {
451 auto const &blocks = get_lattice().get_blocks();
452 apply_lees_edwards_pdf_interpolation(blocks);
453 }
455 }
456 }
457
458 void ghost_communication_vel() override {
461 m_vel_communicator->communicate();
462 if (has_lees_edwards_bc()) {
463 auto const &blocks = get_lattice().get_blocks();
464 apply_lees_edwards_vel_interpolation_and_shift(blocks);
465 }
467 }
468 }
469
470 void ghost_communication_laf() override {
473 m_laf_communicator->communicate();
474 if (has_lees_edwards_bc()) {
475 auto const &blocks = get_lattice().get_blocks();
476 apply_lees_edwards_last_applied_force_interpolation(blocks);
477 }
479 }
480 }
481
489
490 /** @brief Communicate all fields at once using the D3Q27 stencil. */
493 m_full_communicator->communicate();
494 if (has_lees_edwards_bc()) {
496 }
500 }
501
502private:
503 // ---- Lees-Edwards Boundary Conditions ----
504
505 auto has_lees_edwards_bc() const {
506 return std::holds_alternative<
507 typename Kernels::StreamCollisionModelLeesEdwards>(*m_collision_model);
508 }
509
510 void apply_lees_edwards_pdf_interpolation(
511 std::shared_ptr<BlockStorage> const &blocks) {
512 for (auto &block : *blocks)
514 }
515
516 void apply_lees_edwards_vel_interpolation_and_shift(
517 std::shared_ptr<BlockStorage> const &blocks) {
518 for (auto &block : *blocks)
520 }
521
522 void apply_lees_edwards_last_applied_force_interpolation(
523 std::shared_ptr<BlockStorage> const &blocks) {
524 for (auto &block : *blocks)
526 }
527
528public:
530 auto const &blocks = get_lattice().get_blocks();
531 apply_lees_edwards_pdf_interpolation(blocks);
532 apply_lees_edwards_vel_interpolation_and_shift(blocks);
533 apply_lees_edwards_last_applied_force_interpolation(blocks);
534 }
535
536public:
537 // ---- Node & Slice Accessors (by quantity) ----
538
539 // Velocity
540 std::optional<Utils::Vector3d>
542 bool consider_ghosts = false) const override;
543 bool set_node_velocity(Utils::Vector3i const &node,
544 Utils::Vector3d const &v) override;
545 std::vector<double>
546 get_slice_velocity(Utils::Vector3i const &lower_corner,
547 Utils::Vector3i const &upper_corner) const override;
548 void set_slice_velocity(Utils::Vector3i const &lower_corner,
549 Utils::Vector3i const &upper_corner,
550 std::vector<double> const &velocity) override;
551
552 // Density
553 std::optional<double>
555 bool consider_ghosts = false) const override;
556 bool set_node_density(Utils::Vector3i const &node, double density) override;
557 std::vector<double>
558 get_slice_density(Utils::Vector3i const &lower_corner,
559 Utils::Vector3i const &upper_corner) const override;
560 void set_slice_density(Utils::Vector3i const &lower_corner,
561 Utils::Vector3i const &upper_corner,
562 std::vector<double> const &density) override;
563
564 // Population
565 std::optional<std::vector<double>>
567 bool consider_ghosts = false) const override;
568 bool set_node_population(Utils::Vector3i const &node,
569 std::vector<double> const &population) override;
570 std::vector<double>
571 get_slice_population(Utils::Vector3i const &lower_corner,
572 Utils::Vector3i const &upper_corner) const override;
573 void set_slice_population(Utils::Vector3i const &lower_corner,
574 Utils::Vector3i const &upper_corner,
575 std::vector<double> const &population) override;
576
577 // Force
578 std::optional<Utils::Vector3d>
579 get_node_force_to_be_applied(Utils::Vector3i const &node) const override;
580 std::optional<Utils::Vector3d>
582 bool consider_ghosts = false) const override;
584 Utils::Vector3d const &force) override;
585 std::vector<double> get_slice_last_applied_force(
586 Utils::Vector3i const &lower_corner,
587 Utils::Vector3i const &upper_corner) const override;
588 void set_slice_last_applied_force(Utils::Vector3i const &lower_corner,
589 Utils::Vector3i const &upper_corner,
590 std::vector<double> const &force) override;
591
592 // Pressure tensor
593 std::optional<Utils::VectorXd<9>>
594 get_node_pressure_tensor(Utils::Vector3i const &node) const override;
595 std::vector<double>
596 get_slice_pressure_tensor(Utils::Vector3i const &lower_corner,
597 Utils::Vector3i const &upper_corner) const override;
598
599private:
600 // ---- Interpolation (position-based access) ----
601
602 /** @brief Return a B-spline interpolation kernel for force distribution. */
603 auto make_force_interpolation_kernel() const;
604 /** @brief Return a B-spline interpolation kernel for velocity readout. */
605 auto make_velocity_interpolation_kernel() const;
606 /** @brief Return a B-spline interpolation kernel for density readout. */
607 auto make_density_interpolation_kernel() const;
608
609public:
610 std::function<bool(Utils::Vector3d const &)>
611 make_lattice_position_checker(bool consider_points_in_halo) const override;
612 bool add_force_at_pos(Utils::Vector3d const &pos,
613 Utils::Vector3d const &force) override;
614 void add_forces_at_pos(std::vector<Utils::Vector3d> const &pos,
615 std::vector<Utils::Vector3d> const &forces) override;
616 std::optional<Utils::Vector3d>
618 bool consider_points_in_halo = false) const override;
619 std::vector<Utils::Vector3d>
620 get_velocities_at_pos(std::vector<Utils::Vector3d> const &pos) override;
621 std::optional<double>
623 bool consider_points_in_halo = false) const override;
624 std::vector<double>
625 get_densities_at_pos(std::vector<Utils::Vector3d> const &pos) override;
626
627public:
628 // ---- Boundary Handling ----
629
630 void reset_boundary_handling(std::shared_ptr<BlockStorage> const &blocks) {
631 auto const [lc, uc] = m_lattice->get_local_grid_range(true);
632 m_boundary =
633 std::make_shared<BoundaryModel>(blocks, m_pdf_field_id, m_flag_field_id,
634 CellInterval{to_cell(lc), to_cell(uc)});
635 }
636
637 void on_boundary_add();
638 void clear_boundaries() override;
639 void reallocate_ubb_field() override;
640 void
641 update_boundary_from_shape(std::vector<int> const &raster_flat,
642 std::vector<double> const &data_flat) override;
643 std::optional<Utils::Vector3d>
645 bool consider_ghosts = false) const override;
647 Utils::Vector3d const &velocity) override;
648 std::vector<std::optional<Utils::Vector3d>> get_slice_velocity_at_boundary(
649 Utils::Vector3i const &lower_corner,
650 Utils::Vector3i const &upper_corner) const override;
652 Utils::Vector3i const &lower_corner, Utils::Vector3i const &upper_corner,
653 std::vector<std::optional<Utils::Vector3d>> const &velocity) override;
654 std::optional<Utils::Vector3d>
655 get_node_boundary_force(Utils::Vector3i const &node) const override;
656 bool remove_node_from_boundary(Utils::Vector3i const &node) override;
657 std::optional<bool>
659 bool consider_ghosts = false) const override;
660 std::vector<bool>
661 get_slice_is_boundary(Utils::Vector3i const &lower_corner,
662 Utils::Vector3i const &upper_corner) const override;
664 std::vector<int> const &raster_flat) const override;
665 [[nodiscard]] Utils::Vector3d get_boundary_force() const override;
666
667private:
668 [[nodiscard]] Utils::Vector3i flat_index_to_node(int index) const;
669 [[nodiscard]] Utils::Vector3i get_neighbor_node(Utils::Vector3i const &node,
670 int dir) const;
671
672public:
673 // ---- Global Reductions & Physical Parameters ----
674
675 // Global pressure tensor
676 [[nodiscard]] Utils::VectorXd<9> get_pressure_tensor() const override {
677 Matrix3<FloatType> tensor(FloatType{0});
678 for (auto const &block : *get_lattice().get_blocks()) {
679 auto pdf_field = block.template getData<PdfField>(m_pdf_field_id);
681 }
682 auto const &grid_size = get_lattice().get_grid_dimensions();
683 auto const number_of_nodes = Utils::product(grid_size);
685 return to_vector9d(tensor) * (1. / static_cast<double>(number_of_nodes));
686 }
687
688 // Global momentum
689 [[nodiscard]] Utils::Vector3d get_momentum() const override {
690 Vector3<FloatType> mom(FloatType{0});
691 for (auto const &block : *get_lattice().get_blocks()) {
692 auto pdf_field = block.template getData<PdfField>(m_pdf_field_id);
693 auto force_field =
694 block.template getData<VectorField>(m_last_applied_force_field_id);
695 mom += lbm::accessor::MomentumDensity::reduce(pdf_field, force_field,
696 m_density);
697 }
698 return to_vector3d(mom);
699 }
700
701 // Global external force
702 void set_external_force(Utils::Vector3d const &ext_force) override {
703 m_reset_force->set_ext_force(zero_centered_to_lb(ext_force));
704 }
705
706 [[nodiscard]] Utils::Vector3d get_external_force() const noexcept override {
707 return zero_centered_to_md(m_reset_force->get_ext_force());
708 }
709
710 void set_viscosity(double viscosity) override {
711 m_viscosity = FloatType_c(viscosity);
712 }
713
714 [[nodiscard]] double get_viscosity() const noexcept override {
715 return static_cast<double>(m_viscosity);
716 }
717
718 [[nodiscard]] double get_density() const noexcept override {
719 return static_cast<double>(m_density);
720 }
721
722 [[nodiscard]] double get_kT() const noexcept override {
723 return static_cast<double>(m_kT);
724 }
725
726 [[nodiscard]] unsigned int get_seed() const noexcept override {
727 return m_seed;
728 }
729
730 [[nodiscard]] std::optional<uint64_t> get_rng_state() const override {
731 auto const cm =
732 std::get_if<typename Kernels::StreamCollisionModelThermalized>(
734 if (!cm or m_kT == 0.) {
735 return std::nullopt;
736 }
737 return {static_cast<uint64_t>(cm->getTime_step())};
738 }
739
740 void set_rng_state(uint64_t counter) override {
741 auto const cm =
742 std::get_if<typename Kernels::StreamCollisionModelThermalized>(
744 if (!cm or m_kT == 0.) {
745 throw std::runtime_error("This LB instance is unthermalized");
746 }
747 assert(counter <=
748 static_cast<uint32_t>(std::numeric_limits<uint_t>::max()));
749 cm->setTime_step(static_cast<uint32_t>(counter));
750 }
751
752 [[nodiscard]] LatticeWalberla const &get_lattice() const noexcept override {
753 return *m_lattice;
754 }
755
756 [[nodiscard]] std::size_t get_velocity_field_id() const noexcept override {
757 return m_velocity_field_id;
758 }
759
760 [[nodiscard]] std::size_t get_force_field_id() const noexcept override {
762 }
763
764 /**
765 * @brief Correction factor for off-diagonal pressure tensor elements.
766 * Compensates for the viscosity-dependent error in the non-equilibrium
767 * stress: factor = nu / (nu + 1/6).
768 */
770 return m_viscosity / (m_viscosity + FloatType{1} / FloatType{6});
771 }
772
773 void pressure_tensor_correction(Matrix3<FloatType> &tensor) const {
774 auto const revert_factor = pressure_tensor_correction_factor();
775 for (auto const i : {1u, 2u, 3u, 5u, 6u, 7u}) {
776 tensor[i] *= revert_factor;
777 }
778 }
779
780 void pressure_tensor_correction(std::span<FloatType, 9ul> tensor) const {
781 auto const revert_factor = pressure_tensor_correction_factor();
782 for (auto const i : {1u, 2u, 3u, 5u, 6u, 7u}) {
783 tensor[i] *= revert_factor;
784 }
785 }
786
787protected:
788 /**
789 * @brief Scale data by a conversion factor (in-place).
790 * Used for zero-centered density representation: LB internally stores
791 * density fluctuations around zero, while the user interface uses
792 * absolute densities. The conversion factors @ref m_zc_to_md and
793 * @ref m_zc_to_lb translate between these representations.
794 */
795 template <typename T>
796 void zero_centered_transform_impl(T &data, auto const factor) const {
797 if constexpr (std::is_arithmetic_v<T>) {
798 static_assert(std::is_floating_point_v<T>);
799 data *= static_cast<T>(factor);
800 } else {
801 auto const coef = static_cast<typename T::value_type>(factor);
802 std::transform(std::begin(data), std::end(data), std::begin(data),
803 [coef](auto value) { return value * coef; });
804 }
805 }
806
807 void zero_centered_to_lb_in_place(auto &data) const {
809 }
810
811 void zero_centered_to_md_in_place(auto &data) const {
813 }
814
815 auto zero_centered_to_lb(auto const &data) const {
816 auto transformed_data = data;
817 zero_centered_to_lb_in_place(transformed_data);
818 return transformed_data;
819 }
820
821 auto zero_centered_to_md(auto const &data) const {
822 auto transformed_data = data;
823 zero_centered_to_md_in_place(transformed_data);
824 return transformed_data;
825 }
826
827public:
828 // ---- File I/O ----
829
830 void register_vtk_field_filters(walberla::vtk::VTKOutput &vtk_obj) override {
831 field::FlagFieldCellFilter<FlagField> fluid_filter(m_flag_field_id);
832 fluid_filter.addFlag(Boundary_flag);
833 vtk_obj.addCellExclusionFilter(fluid_filter);
834 }
835
836 void register_vtk_field_writers(walberla::vtk::VTKOutput &vtk_obj,
837 LatticeModel::units_map const &units,
838 int flag_observables) override;
839
840protected:
841 // ---- Private Infrastructure Helpers ----
842
843 /**
844 * @brief Convenience function to add a field with a custom allocator.
845 *
846 * When vectorization is off, let waLBerla decide which memory allocator
847 * to use. When vectorization is on, the aligned memory allocator is
848 * required, otherwise <tt>cpu_vectorize_info["assume_aligned"]</tt> will
849 * trigger assertions. That is because for single-precision kernels the
850 * waLBerla heuristic in <tt>src/field/allocation/FieldAllocator.h</tt>
851 * will fall back to @c StdFieldAlloc, yet @c AllocateAligned is needed
852 * for intrinsics to work.
853 */
854 template <typename Field> auto add_to_storage(std::string const tag) {
855 auto const &blocks = m_lattice->get_blocks();
856 auto const n_ghost_layers = m_lattice->get_ghost_layers();
857#if defined(__CUDACC__) and defined(WALBERLA_BUILD_WITH_CUDA)
858 if constexpr (Architecture == lbmpy::Arch::GPU) {
859 auto field_id = gpu::addGPUFieldToStorage<GPUField>(
860 blocks, tag, Field::F_SIZE, field::fzyx, n_ghost_layers);
861 if constexpr (std::is_same_v<Field, _VectorField>) {
862 for (auto &block : *blocks) {
863 auto field = block.template getData<GPUField>(field_id);
864 lbm::accessor::Vector::initialize(field, Vector3<FloatType>{0});
865 }
866 } else if constexpr (std::is_same_v<Field, _PdfField>) {
867 for (auto &block : *blocks) {
868 auto field = block.template getData<GPUField>(field_id);
870 field, std::array<FloatType, Stencil::Size>{});
871 }
872 }
873 return field_id;
874 }
875#endif
876 {
877#ifdef ESPRESSO_BUILD_WITH_AVX_KERNELS
878 constexpr auto alignment = field::SIMDAlignment();
879 using value_type = Field::value_type;
880 using Allocator = field::AllocateAligned<value_type, alignment>;
881 auto const allocator = std::make_shared<Allocator>();
882 auto const empty_set = Set<SUID>::emptySet();
883 return field::addToStorage<Field>(
884 blocks, tag, field::internal::defaultSize, FloatType{0}, field::fzyx,
885 n_ghost_layers, false, {}, empty_set, empty_set, allocator);
886#else // ESPRESSO_BUILD_WITH_AVX_KERNELS
887 return field::addToStorage<Field>(blocks, tag, FloatType{0}, field::fzyx,
888 n_ghost_layers);
889#endif // ESPRESSO_BUILD_WITH_AVX_KERNELS
890 }
891 }
892
893 /**
894 * @brief Set up D3Q27 communicators for full ghost layer updates.
895 * Creates per-field communicators (PDF, velocity, last-applied force)
896 * as well as a combined communicator and the boundary communicator.
897 */
899 auto const &blocks = m_lattice->get_blocks();
900
901 m_full_communicator = std::make_shared<RegularFullCommunicator>(blocks);
902 m_full_communicator->addPackInfo(
903 std::make_shared<PackInfo<PdfField>>(m_pdf_field_id));
904 m_full_communicator->addPackInfo(
906 m_full_communicator->addPackInfo(
907 std::make_shared<PackInfo<VectorField>>(m_velocity_field_id));
908
909 m_pdf_communicator = std::make_shared<RegularFullCommunicator>(blocks);
910 m_vel_communicator = std::make_shared<RegularFullCommunicator>(blocks);
911 m_laf_communicator = std::make_shared<RegularFullCommunicator>(blocks);
912 m_pdf_communicator->addPackInfo(
913 std::make_shared<PackInfo<PdfField>>(m_pdf_field_id));
914 m_vel_communicator->addPackInfo(
915 std::make_shared<PackInfo<VectorField>>(m_velocity_field_id));
916 m_laf_communicator->addPackInfo(
918
920 std::make_shared<BoundaryFullCommunicator>(blocks);
921 m_boundary_communicator->addPackInfo(
924 auto boundary_packinfo = std::make_shared<
927 boundary_packinfo->setup_boundary_handle(m_lattice, m_boundary);
928 m_boundary_communicator->addPackInfo(boundary_packinfo);
929 }
930
931 /**
932 * @brief Set up the communicator used during integration.
933 * Uses optimized streaming pack info when neither boundaries nor
934 * Lees-Edwards boundary conditions are active; falls back to the
935 * generic pack info otherwise.
936 */
938 auto const setup = [this]<typename PackInfoPdf, typename PackInfoVec>() {
939 auto const &blocks = m_lattice->get_blocks();
941 std::make_shared<PDFStreamingCommunicator>(blocks);
942 m_pdf_streaming_communicator->addPackInfo(
943 std::make_shared<PackInfoPdf>(m_pdf_field_id));
944 m_pdf_streaming_communicator->addPackInfo(
945 std::make_shared<PackInfoVec>(m_last_applied_force_field_id));
946 };
948 using PackInfoPdf = FieldTrait::PackInfoStreamingPdf;
949 using PackInfoVec = FieldTrait::PackInfoStreamingVec;
950 if (m_has_boundaries or (m_collision_model and has_lees_edwards_bc())) {
951 setup.template operator()<PackInfo<PdfField>, PackInfoVec>();
952 } else {
953 setup.template operator()<PackInfoPdf, PackInfoVec>();
954 }
955 }
956};
957
958} // namespace walberla
959
960// Out-of-class template method definitions
964#include "LBNodeAccess.impl.hpp"
965#include "LBSliceAccess.impl.hpp"
966#include "LBVTK.impl.hpp"
Out-of-class boundary access definitions for walberla::LBWalberlaImpl.
Out-of-class collision model setup definitions for walberla::LBWalberlaImpl.
Out-of-class position-based interpolation definitions for walberla::LBWalberlaImpl.
Out-of-class node access definitions for walberla::LBWalberlaImpl.
Out-of-class slice access definitions for walberla::LBWalberlaImpl.
Out-of-class VTK writer registration definition for walberla::LBWalberlaImpl.
LBWalberlaBase provides the public interface of the LB waLBerla bridge.
Vector implementation and trait types for boost qvm interoperability.
Interface of a lattice-based fluid model.
std::map< std::string, std::shared_ptr< VTKHandle > > m_vtk_auto
VTK writers that are executed automatically.
std::unordered_map< std::string, double > units_map
Class that runs and controls the BlockForest in waLBerla.
walberla::blockforest::StructuredBlockForest Lattice_T
Boundary class optimized for sparse data.
field::FlagField< uint8_t > FlagField
Class that runs and controls the LB on waLBerla.
void add_forces_at_pos(std::vector< Utils::Vector3d > const &pos, std::vector< Utils::Vector3d > const &forces) override
Distribute forces to the lattice at given positions.
std::shared_ptr< typename Kernels::UpdateVelFromPDF > m_update_velocities_from_pdf
std::vector< double > get_slice_last_applied_force(Utils::Vector3i const &lower_corner, Utils::Vector3i const &upper_corner) const override
std::variant< typename Kernels::StreamCollisionModelThermalized, typename Kernels::StreamCollisionModelLeesEdwards > CollisionModel
void zero_centered_transform_impl(T &data, auto const factor) const
Scale data by a conversion factor (in-place).
void reset_boundary_handling(std::shared_ptr< BlockStorage > const &blocks)
std::shared_ptr< RegularFullCommunicator > m_pdf_communicator
std::vector< std::optional< Utils::Vector3d > > get_slice_velocity_at_boundary(Utils::Vector3i const &lower_corner, Utils::Vector3i const &upper_corner) const override
std::optional< Utils::Vector3d > get_node_last_applied_force(Utils::Vector3i const &node, bool consider_ghosts=false) const override
stencil::D3Q19 Stencil
Stencil for collision and streaming operations.
std::optional< Utils::Vector3d > get_node_velocity_at_boundary(Utils::Vector3i const &node, bool consider_ghosts=false) const override
void ghost_communication() override
Perform all pending ghost layer updates.
void pressure_tensor_correction(Matrix3< FloatType > &tensor) const
std::optional< Utils::Vector3d > get_node_velocity(Utils::Vector3i const &node, bool consider_ghosts=false) const override
FieldTrait< FloatType, Stencil, Architecture >::template RegularCommScheme< Stencil > PDFStreamingCommunicator
Regular communicator.
Utils::Vector3d get_boundary_force_from_shape(std::vector< int > const &raster_flat) const override
Total force exerted by the fluid on a subset of boundary nodes.
std::shared_ptr< RegularFullCommunicator > m_full_communicator
std::size_t get_force_field_id() const noexcept override
std::shared_ptr< CollisionModel > m_collision_model
void set_slice_velocity(Utils::Vector3i const &lower_corner, Utils::Vector3i const &upper_corner, std::vector< double > const &velocity) override
unsigned int get_seed() const noexcept override
void integrate_vtk_writers() override
void pressure_tensor_correction(std::span< FloatType, 9ul > tensor) const
BoundaryModel::FlagField FlagField
bool remove_node_from_boundary(Utils::Vector3i const &node) override
std::optional< Utils::Vector3d > get_node_boundary_force(Utils::Vector3i const &node) const override
std::optional< double > get_density_at_pos(Utils::Vector3d const &pos, bool consider_points_in_halo=false) const override
void zero_centered_to_md_in_place(auto &data) const
FieldTrait< FloatType, Stencil >::VectorField _VectorField
void set_slice_velocity_at_boundary(Utils::Vector3i const &lower_corner, Utils::Vector3i const &upper_corner, std::vector< std::optional< Utils::Vector3d > > const &velocity) override
std::vector< double > get_slice_population(Utils::Vector3i const &lower_corner, Utils::Vector3i const &upper_corner) const override
void set_rng_state(uint64_t counter) override
std::vector< double > get_slice_velocity(Utils::Vector3i const &lower_corner, Utils::Vector3i const &upper_corner) const override
Utils::Vector3d get_boundary_force() const override
std::shared_ptr< LatticeWalberla > m_lattice
std::shared_ptr< LeesEdwardsPack > m_lees_edwards_callbacks
LBWalberlaImpl(std::shared_ptr< LatticeWalberla > lattice, double viscosity, double density)
bool set_node_last_applied_force(Utils::Vector3i const &node, Utils::Vector3d const &force) override
std::function< bool(Utils::Vector3d const &)> make_lattice_position_checker(bool consider_points_in_halo) const override
FieldTrait< FloatType, Stencil >::PdfField _PdfField
std::shared_ptr< InterpolateAndShiftAtBoundary< _VectorField, FloatType > > m_lees_edwards_vel_interpol_sweep
std::vector< bool > get_slice_is_boundary(Utils::Vector3i const &lower_corner, Utils::Vector3i const &upper_corner) const override
std::vector< double > get_slice_density(Utils::Vector3i const &lower_corner, Utils::Vector3i const &upper_corner) const override
bool is_double_precision() const noexcept override
void update_boundary_from_shape(std::vector< int > const &raster_flat, std::vector< double > const &data_flat) override
Set boundary conditions from a rasterized shape.
std::shared_ptr< BoundaryModel > m_boundary
FieldTrait< FloatType, Stencil, Architecture >::PdfField PdfField
std::vector< double > get_slice_pressure_tensor(Utils::Vector3i const &lower_corner, Utils::Vector3i const &upper_corner) const override
FieldTrait< FloatType, Stencil, Architecture >::template PackInfo< Field > PackInfo
bool set_node_density(Utils::Vector3i const &node, double density) override
void set_collision_model(double kT, unsigned int seed) override
Set up the thermalized collision model.
std::vector< Utils::Vector3d > get_velocities_at_pos(std::vector< Utils::Vector3d > const &pos) override
Interpolate velocities at given positions (batch version).
void ghost_communication_laf() override
std::optional< bool > get_node_is_boundary(Utils::Vector3i const &node, bool consider_ghosts=false) const override
std::shared_ptr< ResetForce< PdfField, VectorField > > m_reset_force
void setup_streaming_communicator()
Set up the communicator used during integration.
FlagUID const Boundary_flag
Flag for boundary cells.
~LBWalberlaImpl() override=default
std::optional< uint64_t > get_rng_state() const override
std::optional< std::vector< double > > get_node_population(Utils::Vector3i const &node, bool consider_ghosts=false) const override
FloatType m_density
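Fluid density. (The "kinematic viscosity" brief that Doxygen shows here presumably belongs to the viscosity member declared next to it.)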
double get_viscosity() const noexcept override
double get_kT() const noexcept override
Utils::Vector3d get_momentum() const override
void set_viscosity(double viscosity) override
void on_boundary_add()
Lazily enable boundary mode on first boundary addition.
std::shared_ptr< BoundaryFullCommunicator > m_boundary_communicator
std::size_t stencil_size() const noexcept override
auto add_to_storage(std::string const tag)
Convenience function to add a field with a custom allocator.
void ghost_communication_full()
Communicate all fields at once using the D3Q27 stencil.
auto zero_centered_to_lb(auto const &data) const
FieldTrait< FloatType, Stencil, Architecture >::template BoundaryCommScheme< stencil::D3Q27 > BoundaryFullCommunicator
bool set_node_velocity_at_boundary(Utils::Vector3i const &node, Utils::Vector3d const &velocity) override
stencil::D3Q27 StencilFull
Stencil for ghost communication (includes domain corners).
void register_vtk_field_writers(walberla::vtk::VTKOutput &vtk_obj, LatticeModel::units_map const &units, int flag_observables) override
std::optional< double > get_node_density(Utils::Vector3i const &node, bool consider_ghosts=false) const override
void check_lebc(unsigned int shear_direction, unsigned int shear_plane_normal) const override
Verify that MD and LB Lees-Edwards parameters are consistent.
void set_slice_density(Utils::Vector3i const &lower_corner, Utils::Vector3i const &upper_corner, std::vector< double > const &density) override
void ghost_communication_vel() override
Utils::Vector3d get_external_force() const noexcept override
FloatType FloatType_c(T t) const
std::shared_ptr< RegularFullCommunicator > m_laf_communicator
std::size_t get_velocity_field_id() const noexcept override
Utils::VectorXd< 9 > get_pressure_tensor() const override
ResourceObserver m_mpi_cart_comm_observer
FieldTrait< FloatType, Stencil, Architecture >::template RegularCommScheme< stencil::D3Q27 > RegularFullCommunicator
Full communicator.
std::shared_ptr< InterpolateAndShiftAtBoundary< _PdfField, FloatType > > m_lees_edwards_pdf_interpol_sweep
void set_external_force(Utils::Vector3d const &ext_force) override
void setup_full_communicator()
Set up D3Q27 communicators for full ghost layer updates.
std::optional< Utils::Vector3d > get_velocity_at_pos(Utils::Vector3d const &pos, bool consider_points_in_halo=false) const override
FieldTrait< FloatType, Stencil, Architecture >::VectorField VectorField
void set_slice_last_applied_force(Utils::Vector3i const &lower_corner, Utils::Vector3i const &upper_corner, std::vector< double > const &force) override
LatticeWalberla::Lattice_T BlockStorage
Lattice model (e.g. blockforest).
std::shared_ptr< RegularFullCommunicator > m_vel_communicator
std::bitset< GhostComm::SIZE > m_pending_ghost_comm
LatticeWalberla const & get_lattice() const noexcept override
auto zero_centered_to_md(auto const &data) const
void set_slice_population(Utils::Vector3i const &lower_corner, Utils::Vector3i const &upper_corner, std::vector< double > const &population) override
double get_density() const noexcept override
void ghost_communication_pdf() override
void register_vtk_field_filters(walberla::vtk::VTKOutput &vtk_obj) override
std::optional< Utils::Vector3d > get_node_force_to_be_applied(Utils::Vector3i const &node) const override
std::vector< double > get_densities_at_pos(std::vector< Utils::Vector3d > const &pos) override
void zero_centered_to_lb_in_place(auto &data) const
bool set_node_velocity(Utils::Vector3i const &node, Utils::Vector3d const &v) override
bool set_node_population(Utils::Vector3i const &node, std::vector< double > const &population) override
bool is_gpu() const noexcept override
FloatType pressure_tensor_correction_factor() const
Correction factor for off-diagonal pressure tensor elements.
std::shared_ptr< PDFStreamingCommunicator > m_pdf_streaming_communicator
detail::KernelTrait< FloatType, Architecture > Kernels
BlockDataID m_last_applied_force_field_id
std::optional< Utils::VectorXd< 9 > > get_node_pressure_tensor(Utils::Vector3i const &node) const override
std::shared_ptr< InterpolateAndShiftAtBoundary< _VectorField, FloatType > > m_lees_edwards_last_applied_force_interpol_sweep
bool add_force_at_pos(Utils::Vector3d const &pos, Utils::Vector3d const &force) override
void setup_boundary_handle(std::shared_ptr< LatticeWalberla > lattice, std::shared_ptr< Boundary_T > boundary)
static double * block(double *p, std::size_t index, std::size_t size)
Definition elc.cpp:175
T product(Vector< T, N > const &v)
Definition Vector.hpp:372
STL namespace.
auto reduce(GhostLayerField< double, uint_t{19u}> const *pdf_field, GhostLayerField< double, uint_t{3u}> const *force_field, double const density)
void initialize(GhostLayerField< double, uint_t{19u}> *pdf_field, std::array< double, 19u > const &pop)
auto reduce(GhostLayerField< double, uint_t{19u}> const *pdf_field, double const density)
void initialize(GhostLayerField< double, uint_t{3u}> *vec_field, Vector3< double > const &vec)
File PackInfoPdfDoublePrecision.cpp (author: pystencils).
auto to_vector3d(Vector3< T > const &v) noexcept
Cell to_cell(signed_integral_vector auto const &xyz)
ResourceObserver get_mpi_cart_comm_observer()
Get an observer on waLBerla's MPI Cartesian communicator status.
auto to_vector9d(Matrix3< T > const &m) noexcept
static Utils::Vector3d velocity(Particle const &p_ref, Particle const &p_vs)
Velocity of the virtual site.
Definition relative.cpp:65
Observer to monitor the lifetime of a shared resource.
detail::KernelTrait< FT, AT >::PackInfoVec PackInfoStreamingVec
Definition lb_fields.hpp:37
field::GhostLayerField< FT, PdfStencil::Size > PdfField
Definition lb_fields.hpp:33
field::GhostLayerField< FT, uint_t{3u}> VectorField
Definition lb_fields.hpp:34
detail::KernelTrait< FT, AT >::PackInfoPdf PackInfoStreamingPdf
Definition lb_fields.hpp:36
GhostCommFlags
Ghost communication operations.
@ LAF
last applied forces communication