dox/LBInterpolation_8impl_8hpp_source.html

/*

 * Copyright (C) 2019-2026 The ESPResSo project

 *

 * This file is part of ESPResSo.

 *

 * ESPResSo is free software: you can redistribute it and/or modify

 * it under the terms of the GNU General Public License as published by

 * the Free Software Foundation, either version 3 of the License, or

 * (at your option) any later version.

 *

 * ESPResSo is distributed in the hope that it will be useful,

 * but WITHOUT ANY WARRANTY; without even the implied warranty of

 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

 * GNU General Public License for more details.

 *

 * You should have received a copy of the GNU General Public License

 * along with this program.  If not, see <http://www.gnu.org/licenses/>.

 */


#pragma once


/**

 * @file

 * Out-of-class position-based interpolation definitions for

 * @ref walberla::LBWalberlaImpl.

 */


#include <utils/Vector.hpp>

#include <utils/interpolation/bspline_3d.hpp>


#include <algorithm>

#include <array>

#include <cstddef>

#include <iostream>

#include <iterator>

#include <memory>

#include <optional>

#include <stdexcept>

#include <string>

#include <type_traits>

#include <utility>

#include <vector>


namespace walberla {


/**
 * @brief Error raised when B-spline interpolation needs a lattice node that
 *  lies outside the local domain and its ghost layers.
 *
 * The text returned by @c what() only names the field. The position, node
 * index and interpolation weight are written to @c std::cerr when the
 * exception object is constructed.
 */
class interpolation_illegal_access : public std::runtime_error {
public:
  /**
   * @param field   Name of the LB field, inserted into the error message.
   * @param pos     Position at which the interpolation was requested.
   * @param node    Index of the lattice node that could not be accessed.
   * @param weight  Interpolation weight associated with that node.
   */
  interpolation_illegal_access(std::string const &field,
                               Utils::Vector3d const &pos,
                               std::array<int, 3> const &node, double weight)
      : std::runtime_error(
            std::string{"Access to LB "}.append(field).append(
                " field failed")) {
    // diagnostics go to stderr since they are not part of what()
    auto const node_index = Utils::Vector3i(node);
    std::cerr << "pos [" << pos << "], node [" << node_index << "], weight "
              << weight << "\n";
  }
};


/**
 * @brief Run the B-spline interpolation stencil at a position.
 *
 * Thin wrapper around @c Utils::Interpolation::bspline_3d<2> that fixes the
 * grid spacing to 1 and the offset to 0.5 in every direction.
 *
 * @param pos  Position at which to interpolate.
 * @param f    Callable handed to the interpolation routine; the kernels in
 *             this file pass lambdas taking a node index and a weight.
 */
void interpolate_bspline_at_pos(Utils::Vector3d const &pos, auto const &&f) {
  auto const grid_spacing = Utils::Vector3d::broadcast(1.);
  auto const offset = Utils::Vector3d::broadcast(.5);
  Utils::Interpolation::bspline_3d<2>(pos, f, grid_spacing, offset);
}


/**
 * @brief Create a predicate that tests whether a position belongs to the
 *  local lattice.
 *
 * The returned callable holds a reference to the lattice object behind
 * @c m_lattice, so it must not be used after that lattice is destroyed.
 *
 * @param consider_points_in_halo  When true, the predicate calls
 *        @c pos_in_local_halo(); otherwise it calls @c pos_in_local_domain().
 * @return Predicate taking a position and returning the lattice's answer.
 */
template <typename FloatType, lbmpy::Arch Architecture>
std::function<bool(Utils::Vector3d const &)>
LBWalberlaImpl<FloatType, Architecture>::make_lattice_position_checker(
    bool consider_points_in_halo) const {
  auto const &lattice = *m_lattice;
  if (not consider_points_in_halo) {
    return [&lattice](Utils::Vector3d const &position) {
      return lattice.pos_in_local_domain(position);
    };
  }
  return [&lattice](Utils::Vector3d const &position) {
    return lattice.pos_in_local_halo(position);
  };
}


/**
 * @brief Spread a batch of forces onto the lattice at the given positions.
 *
 * On CPU, every (position, force) pair is passed to the kernel obtained from
 * @c make_force_interpolation_kernel(). On GPU (only compiled with CUDA), the
 * positions are shifted by the minimum corner of the first block's AABB,
 * positions and forces are flattened into contiguous buffers of
 * @c FloatType, the forces are converted in place by
 * @c zero_centered_to_lb_in_place(), and everything is handed to
 * @c lbm::accessor::Interpolation::add_force() in one call.
 *
 * @param pos     Positions; must have the same length as @p forces
 *                (checked by an assertion only).
 * @param forces  Forces to distribute, one per position.
 */
template <typename FloatType, lbmpy::Arch Architecture>
void LBWalberlaImpl<FloatType, Architecture>::add_forces_at_pos(
    std::vector<Utils::Vector3d> const &pos,
    std::vector<Utils::Vector3d> const &forces) {
  assert(pos.size() == forces.size());
  if (pos.empty()) {
    return;
  }
  if constexpr (Architecture == lbmpy::Arch::CPU) {
    auto const kernel = make_force_interpolation_kernel();
    // walk both containers in lockstep
    auto force_it = forces.begin();
    for (auto const &position : pos) {
      kernel(position, *force_it);
      ++force_it;
    }
  }
#if defined(__CUDACC__) and defined(WALBERLA_BUILD_WITH_CUDA)
  if constexpr (Architecture == lbmpy::Arch::GPU) {
    auto const &lattice = get_lattice();
    auto const &block = *(lattice.get_blocks()->begin());
    auto const origin = block.getAABB().min();
    std::vector<FloatType> host_pos;
    std::vector<FloatType> host_force;
    host_pos.reserve(3ul * pos.size());
    host_force.reserve(3ul * forces.size());
    // the GPU path only handles a single block
    assert(lattice.get_blocks()->getNumberOfBlocks() == 1u);
    // flatten positions, expressed relative to the block origin
    for (auto const &vec : pos) {
#pragma unroll
      for (std::size_t i = 0ul; i < 3ul; ++i) {
        host_pos.emplace_back(static_cast<FloatType>(vec[i] - origin[i]));
      }
    }
    // flatten forces
    for (auto const &vec : forces) {
#pragma unroll
      for (std::size_t i = 0ul; i < 3ul; ++i) {
        host_force.emplace_back(static_cast<FloatType>(vec[i]));
      }
    }
    zero_centered_to_lb_in_place(host_force);
    auto const gl = lattice.get_ghost_layers();
    auto field = block.template uncheckedFastGetData<VectorField>(
        m_force_to_be_applied_id);
    lbm::accessor::Interpolation::add_force(field, host_pos, host_force, gl);
  }
#endif
}


/**
 * @brief Create the CPU kernel that spreads one force onto the lattice.
 *
 * The returned closure captures the lattice, its block storage and this
 * object by reference, so it must not outlive them. When called with a
 * position and a force it:
 *  - does nothing if @c get_block_extended() finds no block for the position
 *    within 1 ghost layer;
 *  - otherwise visits every node of the B-spline stencil, looks up the
 *    owning block (first with 0 ghost layers, then with 1), and adds
 *    <tt>weight * m_zc_to_lb * force</tt> to the field identified by
 *    @c m_force_to_be_applied_id. Nodes without a block are skipped silently.
 *
 * An assertion checks that the lattice has exactly one ghost layer.
 */
template <typename FloatType, lbmpy::Arch Architecture>
auto LBWalberlaImpl<FloatType, Architecture>::make_force_interpolation_kernel()
    const {
  auto const &lattice = *m_lattice;
  auto const &blocks = *lattice.get_blocks();
  assert(lattice.get_ghost_layers() == 1u);
  return [&](Utils::Vector3d const &pos, Utils::Vector3d const &force) {
    if (get_block_extended(lattice, pos, 1u)) {
      interpolate_bspline_at_pos(
          pos, [&, conv = m_zc_to_lb, field_id = m_force_to_be_applied_id](
                   std::array<int, 3> const node, double weight) {
            // prefer the block that owns the node, fall back to ghost layer
            auto block = get_block_extended(lattice, node, 0u);
            if (!block) {
              block = get_block_extended(lattice, node, 1u);
            }
            if (!block) {
              return;
            }
            auto cell = to_cell(node);
            blocks.transformGlobalToBlockLocalCell(cell, *block);
            double const scaled_weight = weight * conv;
            auto const weighted_force =
                to_vector3<FloatType>(scaled_weight * force);
            auto field =
                block->template uncheckedFastGetData<VectorField>(field_id);
            lbm::accessor::Vector::add(field, weighted_force, cell);
          });
    }
  };
}


/**
 * @brief Create the CPU kernel that interpolates the velocity at a position.
 *
 * The returned closure captures the lattice, its block storage and this
 * object by reference, so it must not outlive them. When called with a
 * position it accumulates <tt>weight * velocity</tt> over all stencil nodes
 * with non-zero weight and returns the sum as a @c Utils::Vector3d.
 * For a node reported as boundary (only checked when @c m_has_boundaries is
 * set) the value comes from @c m_boundary->get_node_value_at_boundary();
 * otherwise it is read from the field identified by @c m_velocity_field_id.
 *
 * An assertion checks that the lattice has exactly one ghost layer.
 *
 * @throws interpolation_illegal_access (from the returned closure) if a node
 *         with non-zero weight has no block within 1 ghost layer.
 */
template <typename FloatType, lbmpy::Arch Architecture>
auto LBWalberlaImpl<FloatType,
                    Architecture>::make_velocity_interpolation_kernel() const {
  auto const &lattice = *m_lattice;
  auto const &blocks = *lattice.get_blocks();
  assert(lattice.get_ghost_layers() == 1u);
  return [&](Utils::Vector3d const &pos) {
    Utils::Vector3d velocity_sum{0., 0., 0.};
    interpolate_bspline_at_pos(
        pos, [&, field_id = m_velocity_field_id](std::array<int, 3> const node,
                                                 double weight) {
          // Zero-weight nodes may lie outside the ghost layers and thus be
          // inaccessible; they contribute nothing, so skip them.
          if (weight == 0.) {
            return;
          }
          auto block = get_block_extended(lattice, node, 1u);
          if (!block) {
            throw interpolation_illegal_access("velocity", pos, node, weight);
          }
          Vector3<FloatType> node_velocity;
          if (m_has_boundaries and m_boundary->node_is_boundary(node)) {
            node_velocity = m_boundary->get_node_value_at_boundary(node);
          } else {
            auto cell = to_cell(node);
            blocks.transformGlobalToBlockLocalCell(cell, *block);
            auto field =
                block->template uncheckedFastGetData<VectorField>(field_id);
            node_velocity = lbm::accessor::Vector::get(field, cell);
          }
          velocity_sum += to_vector3d(node_velocity) * weight;
        });
    return velocity_sum;
  };
}


/**
 * @brief Create the CPU kernel that interpolates the density at a position.
 *
 * The returned closure captures the lattice, its block storage and this
 * object by reference, so it must not outlive them. When called with a
 * position it accumulates <tt>weight * rho</tt> over all stencil nodes with
 * non-zero weight, where @c rho is obtained from
 * @c lbm::accessor::Density::get() on the field identified by
 * @c m_pdf_field_id with @c m_density as extra argument, and returns the sum
 * as a @c double.
 *
 * An assertion checks that the lattice has exactly one ghost layer.
 *
 * @throws interpolation_illegal_access (from the returned closure) if a node
 *         with non-zero weight has no block within 1 ghost layer.
 */
template <typename FloatType, lbmpy::Arch Architecture>
auto LBWalberlaImpl<FloatType,
                    Architecture>::make_density_interpolation_kernel() const {
  auto const &lattice = *m_lattice;
  auto const &blocks = *lattice.get_blocks();
  assert(lattice.get_ghost_layers() == 1u);
  return [&](Utils::Vector3d const &pos) {
    double density_sum = 0.;
    interpolate_bspline_at_pos(
        pos, [&, density = m_density, field_id = m_pdf_field_id](
                 std::array<int, 3> const node, double weight) {
          // Zero-weight nodes may lie outside the ghost layers and thus be
          // inaccessible; they contribute nothing, so skip them.
          if (weight == 0.) {
            return;
          }
          auto block = get_block_extended(lattice, node, 1u);
          if (!block) {
            throw interpolation_illegal_access("density", pos, node, weight);
          }
          auto cell = to_cell(node);
          blocks.transformGlobalToBlockLocalCell(cell, *block);
          auto field = block->template uncheckedFastGetData<PdfField>(field_id);
          auto const node_density =
              lbm::accessor::Density::get(field, density, cell);
          density_sum += node_density * weight;
        });
    return density_sum;
  };
}


/**
 * @brief Interpolate velocities at a batch of positions.
 *
 * On CPU, each position is passed to the kernel obtained from
 * @c make_velocity_interpolation_kernel(). On GPU (only compiled with CUDA),
 * positions are shifted by the minimum corner of the first block's AABB and
 * flattened into a buffer of @c FloatType. Because the velocity field has
 * indeterminate values inside boundary regions, the values from
 * @c m_boundary->get_flattened_map_device() are written into the field first
 * (when the index list is not empty); then
 * @c lbm::accessor::Interpolation::get_vel() is called and its flat result is
 * regrouped into 3-vectors.
 *
 * @param pos  Positions at which to interpolate.
 * @return One velocity per position; empty if @p pos is empty.
 */
template <typename FloatType, lbmpy::Arch Architecture>
std::vector<Utils::Vector3d>
LBWalberlaImpl<FloatType, Architecture>::get_velocities_at_pos(
    std::vector<Utils::Vector3d> const &pos) {
  if (pos.empty()) {
    return {};
  }
  std::vector<Utils::Vector3d> vel{};
  vel.reserve(pos.size());
  if constexpr (Architecture == lbmpy::Arch::CPU) {
    auto const kernel = make_velocity_interpolation_kernel();
    for (auto const &position : pos) {
      vel.push_back(kernel(position));
    }
  }
#if defined(__CUDACC__) and defined(WALBERLA_BUILD_WITH_CUDA)
  if constexpr (Architecture == lbmpy::Arch::GPU) {
    auto const &lattice = get_lattice();
    auto const &block = *(lattice.get_blocks()->begin());
    auto const origin = block.getAABB().min();
    std::vector<FloatType> host_pos;
    host_pos.reserve(3ul * pos.size());
    // the GPU path only handles a single block
    assert(lattice.get_blocks()->getNumberOfBlocks() == 1u);
    // flatten positions, expressed relative to the block origin
    for (auto const &vec : pos) {
#pragma unroll
      for (std::size_t i = 0ul; i < 3ul; ++i) {
        host_pos.emplace_back(static_cast<FloatType>(vec[i] - origin[i]));
      }
    }
    auto const gl = lattice.get_ghost_layers();
    auto field =
        block.template uncheckedFastGetData<VectorField>(m_velocity_field_id);
    // the velocity field has indeterminate values inside boundary regions;
    // we overwrite them with boundary slip velocities before interpolation
    auto const [dev_idx, dev_vel] = m_boundary->get_flattened_map_device();
    if (not dev_idx->empty()) {
      lbm::accessor::Vector::set_from_list(field, *dev_idx, *dev_vel, gl);
    }
    auto const res = lbm::accessor::Interpolation::get_vel(field, host_pos, gl);
    // regroup the flat result, three consecutive components per vector
    for (std::size_t i = 0ul; i < res.size(); i += 3ul) {
      vel.emplace_back(Utils::Vector3d{static_cast<double>(res[i + 0ul]),
                                       static_cast<double>(res[i + 1ul]),
                                       static_cast<double>(res[i + 2ul])});
    }
  }
#endif
  return vel;
}


/**
 * @brief Interpolate densities at a batch of positions.
 *
 * On CPU, each position is passed to the kernel obtained from
 * @c make_density_interpolation_kernel(). On GPU (only compiled with CUDA),
 * positions are shifted by the minimum corner of the first block's AABB,
 * flattened into a buffer of @c FloatType and handed to
 * @c lbm::accessor::Interpolation::get_rho(); the result is converted to
 * @c double (or taken over directly when @c FloatType is already @c double).
 *
 * @param pos  Positions at which to interpolate.
 * @return One density per position; empty if @p pos is empty.
 */
template <typename FloatType, lbmpy::Arch Architecture>
std::vector<double>
LBWalberlaImpl<FloatType, Architecture>::get_densities_at_pos(
    std::vector<Utils::Vector3d> const &pos) {
  if (pos.empty()) {
    return {};
  }
  std::vector<double> rho{};
  rho.reserve(pos.size());
  if constexpr (Architecture == lbmpy::Arch::CPU) {
    auto const kernel = make_density_interpolation_kernel();
    for (auto const &position : pos) {
      rho.push_back(kernel(position));
    }
  }
#if defined(__CUDACC__) and defined(WALBERLA_BUILD_WITH_CUDA)
  if constexpr (Architecture == lbmpy::Arch::GPU) {
    auto const &lattice = get_lattice();
    auto const &block = *(lattice.get_blocks()->begin());
    auto const origin = block.getAABB().min();
    std::vector<FloatType> host_pos;
    host_pos.reserve(3ul * pos.size());
    // the GPU path only handles a single block
    assert(lattice.get_blocks()->getNumberOfBlocks() == 1u);
    // flatten positions, expressed relative to the block origin
    for (auto const &vec : pos) {
#pragma unroll
      for (std::size_t i = 0ul; i < 3ul; ++i) {
        host_pos.emplace_back(static_cast<FloatType>(vec[i] - origin[i]));
      }
    }
    auto const gl = lattice.get_ghost_layers();
    auto field = block.template uncheckedFastGetData<PdfField>(m_pdf_field_id);
    auto res =
        lbm::accessor::Interpolation::get_rho(field, host_pos, m_density, gl);
    if constexpr (std::is_same_v<FloatType, double>) {
      // same element type: take over the result buffer without copying
      rho.swap(res);
    } else {
      std::ranges::transform(res, std::back_inserter(rho), [](auto const &v) {
        return static_cast<double>(v);
      });
    }
  }
#endif
  return rho;
}


/**
 * @brief Interpolate the velocity at a single position.
 *
 * Assertions require that no ghost communication is pending for
 * @c GhostComm::VEL and @c GhostComm::UBB.
 *
 * @param pos                      Position at which to interpolate.
 * @param consider_points_in_halo  When true, the position is tested with
 *        @c pos_in_local_halo(); otherwise with @c pos_in_local_domain().
 * @return The interpolated velocity, or @c std::nullopt if the position
 *         fails the selected test.
 */
template <typename FloatType, lbmpy::Arch Architecture>
std::optional<Utils::Vector3d>
LBWalberlaImpl<FloatType, Architecture>::get_velocity_at_pos(
    Utils::Vector3d const &pos, bool consider_points_in_halo) const {
  assert(not m_pending_ghost_comm.test(GhostComm::VEL));
  assert(not m_pending_ghost_comm.test(GhostComm::UBB));
  bool const is_local = consider_points_in_halo
                            ? m_lattice->pos_in_local_halo(pos)
                            : m_lattice->pos_in_local_domain(pos);
  if (not is_local) {
    return std::nullopt;
  }
  auto const kernel = make_velocity_interpolation_kernel();
  return std::optional<Utils::Vector3d>{kernel(pos)};
}


/**
 * @brief Interpolate the density at a single position.
 *
 * An assertion requires that no ghost communication is pending for
 * @c GhostComm::PDF.
 *
 * @param pos                      Position at which to interpolate.
 * @param consider_points_in_halo  When true, the position is tested with
 *        @c pos_in_local_halo(); otherwise with @c pos_in_local_domain().
 * @return The interpolated density, or @c std::nullopt if the position
 *         fails the selected test.
 */
template <typename FloatType, lbmpy::Arch Architecture>
std::optional<double>
LBWalberlaImpl<FloatType, Architecture>::get_density_at_pos(
    Utils::Vector3d const &pos, bool consider_points_in_halo) const {
  assert(not m_pending_ghost_comm.test(GhostComm::PDF));
  bool const is_local = consider_points_in_halo
                            ? m_lattice->pos_in_local_halo(pos)
                            : m_lattice->pos_in_local_domain(pos);
  if (not is_local) {
    return std::nullopt;
  }
  auto const kernel = make_density_interpolation_kernel();
  return std::optional<double>{kernel(pos)};
}


/**
 * @brief Spread a single force onto the lattice at a position.
 *
 * @param pos    Position at which the force acts.
 * @param force  Force to distribute.
 * @return @c false if @c pos_in_local_halo() rejects the position (nothing is
 *         done); @c true after the force interpolation kernel has been
 *         invoked.
 */
template <typename FloatType, lbmpy::Arch Architecture>
bool LBWalberlaImpl<FloatType, Architecture>::add_force_at_pos(
    Utils::Vector3d const &pos, Utils::Vector3d const &force) {
  if (m_lattice->pos_in_local_halo(pos)) {
    auto const spread_force = make_force_interpolation_kernel();
    spread_force(pos, force);
    return true;
  }
  return false;
}


} // namespace walberla

Vector.hpp
Vector implementation and trait types for boost qvm interoperability.

bspline_3d.hpp

Utils::Vector
Definition Vector.hpp:50

Utils::Vector::broadcast
static DEVICE_QUALIFIER constexpr Vector< T, N > broadcast(typename Base::value_type const &value) noexcept
Create a vector that has all entries set to the same value.
Definition Vector.hpp:131

walberla::LBWalberlaImpl
Class that runs and controls the LB on waLBerla.
Definition LBWalberlaImpl.hpp:86

walberla::LBWalberlaImpl::add_forces_at_pos
void add_forces_at_pos(std::vector< Utils::Vector3d > const &pos, std::vector< Utils::Vector3d > const &forces) override
Distribute forces to the lattice at given positions.
Definition LBInterpolation.impl.hpp:85

walberla::LBWalberlaImpl::get_density_at_pos
std::optional< double > get_density_at_pos(Utils::Vector3d const &pos, bool consider_points_in_halo=false) const override
Definition LBInterpolation.impl.hpp:333

walberla::LBWalberlaImpl::make_lattice_position_checker
std::function< bool(Utils::Vector3d const &)> make_lattice_position_checker(bool consider_points_in_halo) const override
Definition LBInterpolation.impl.hpp:69

walberla::LBWalberlaImpl::get_velocities_at_pos
std::vector< Utils::Vector3d > get_velocities_at_pos(std::vector< Utils::Vector3d > const &pos) override
Interpolate velocities at given positions (batch version).
Definition LBInterpolation.impl.hpp:229

walberla::LBWalberlaImpl::get_velocity_at_pos
std::optional< Utils::Vector3d > get_velocity_at_pos(Utils::Vector3d const &pos, bool consider_points_in_halo=false) const override
Definition LBInterpolation.impl.hpp:319

walberla::LBWalberlaImpl::get_densities_at_pos
std::vector< double > get_densities_at_pos(std::vector< Utils::Vector3d > const &pos) override
Definition LBInterpolation.impl.hpp:276

walberla::LBWalberlaImpl::add_force_at_pos
bool add_force_at_pos(Utils::Vector3d const &pos, Utils::Vector3d const &force) override
Definition LBInterpolation.impl.hpp:345

walberla::interpolation_illegal_access
Exception for accessing a lattice node outside the local domain and ghost layers during B-spline interpolation.
Definition LBInterpolation.impl.hpp:50

walberla::interpolation_illegal_access::interpolation_illegal_access
interpolation_illegal_access(std::string const &field, Utils::Vector3d const &pos, std::array< int, 3 > const &node, double weight)
Definition LBInterpolation.impl.hpp:52

stream
cudaStream_t stream[1]
CUDA streams for parallel computing on CPU and GPU.
Definition common_cuda.cu:34

block
static double * block(double *p, std::size_t index, std::size_t size)
Definition elc.cpp:175

Utils::Vector3i
VectorXi< 3 > Vector3i
Definition Vector.hpp:193

lbmpy::Arch::CPU
@ CPU

lbmpy::Arch::GPU
@ GPU

std
STL namespace.

walberla::lbm::accessor::Density::get
double get(GhostLayerField< double, uint_t{19u}> const *pdf_field, double const density, Cell const &cell)
Definition FieldAccessorsDoublePrecision.h:609

walberla::lbm::accessor::Interpolation::add_force
void add_force(gpu::GPUField< double > const *field, std::vector< double > const &pos, std::vector< double > const &forces, uint gl)
Definition FieldAccessorsDoublePrecisionCUDA.cu:746

walberla::lbm::accessor::Interpolation::get_rho
std::vector< double > get_rho(gpu::GPUField< double > const *field, std::vector< double > const &pos, double const density, uint gl)
Definition FieldAccessorsDoublePrecisionCUDA.cu:702

walberla::lbm::accessor::Interpolation::get_vel
std::vector< double > get_vel(gpu::GPUField< double > const *field, std::vector< double > const &pos, uint gl)
Definition FieldAccessorsDoublePrecisionCUDA.cu:725

walberla::lbm::accessor::Vector::set_from_list
void set_from_list(gpu::GPUField< double > const *field, thrust::device_vector< int > const &indices, thrust::device_vector< double > const &values, uint gl)
Definition FieldAccessorsDoublePrecisionCUDA.cu:527

walberla::lbm::accessor::Vector::add
void add(GhostLayerField< double, uint_t{3u}> *vec_field, Vector3< double > const &vec, Cell const &cell)
Definition FieldAccessorsDoublePrecision.h:320

walberla::lbm::accessor::Vector::get
auto get(GhostLayerField< double, uint_t{3u}> const *vec_field, Cell const &cell)
Definition FieldAccessorsDoublePrecision.h:302

walberla
\file PackInfoPdfDoublePrecision.cpp \author pystencils
Definition EKWalberla.hpp:38

walberla::get_block_extended
IBlock * get_block_extended(LatticeWalberla const &lattice, auto const &pos, unsigned int n_ghost_layers)
Definition BlockAndCell.hpp:87

walberla::to_vector3d
auto to_vector3d(Vector3< T > const &v) noexcept
Definition types_conversion.hpp:47

walberla::interpolate_bspline_at_pos
void interpolate_bspline_at_pos(Utils::Vector3d const &pos, auto const &&f)
Definition LBInterpolation.impl.hpp:61

walberla::to_cell
Cell to_cell(signed_integral_vector auto const &xyz)
Definition BlockAndCell.hpp:78

OutputVTK::density
@ density