dox/ReactionKernelIndexed__5__double__precision_8cpp_source.html

//======================================================================================================================

//

//  This file is part of waLBerla. waLBerla is free software: you can

//  redistribute it and/or modify it under the terms of the GNU General Public

//  License as published by the Free Software Foundation, either version 3 of

//  the License, or (at your option) any later version.

//

//  waLBerla is distributed in the hope that it will be useful, but WITHOUT

//  ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or

//  FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License

//  for more details.

//

//  You should have received a copy of the GNU General Public License along

//  with waLBerla (see COPYING.txt). If not, see <http://www.gnu.org/licenses/>.

//

//! \file ReactionKernelIndexed_5_double_precision.cpp

//! \author pystencils

//======================================================================================================================


// kernel generated with pystencils v1.4+1.ge851f4e, lbmpy v1.4+1.ge9efe34, sympy v1.12.1, lbmpy_walberla/pystencils_walberla from waLBerla commit 3247aa7395049ca5bfb69d34d55e45db19fa439c


#include "ReactionKernelIndexed_5_double_precision.h"

#include "core/DataTypes.h"

#include "core/Macros.h"


#define FUNC_PREFIX


using namespace std;


namespace walberla {

namespace pystencils {


#ifdef __GNUC__

#pragma GCC diagnostic push

#pragma GCC diagnostic ignored "-Wstrict-aliasing"

#pragma GCC diagnostic ignored "-Wunused-variable"

#pragma GCC diagnostic ignored "-Wconversion"

#endif


#if defined(__CUDACC__) and !defined(__clang__)

#pragma push

#ifdef __NVCC_DIAG_PRAGMA_SUPPORT__

#pragma nv_diag_suppress 177

#else

#pragma diag_suppress 177

#endif

#endif

// NOLINTBEGIN(readability-non-const-parameter*)


namespace internal_714956d26e6eb81c5dec60e7ab7da8ab {


/**
 * Applies the reaction update to every cell referenced by the index vector.
 *
 * The index vector is walked as a sequence of 12-byte records; the three
 * 32-bit integers at byte offsets 0, 4 and 8 of each record are used as the
 * x, y and z cell coordinates. For each record the kernel
 *   1. reads rho_0 .. rho_4 at (x, y, z) using the per-field strides,
 *   2. evaluates
 *        rate = rho_0^order_0 * rho_1^order_1 * rho_2^order_2
 *             * rho_3^order_3 * rho_4^order_4 * rate_coefficient,
 *   3. writes back rho_i + rate * stoech_i for i = 0 .. 4.
 *
 * \param _data_indexVector  byte view of the packed index records
 * \param _data_rho_0..4     base pointers of the five fields (read and written)
 * \param _stride_rho_i_0..2 element strides of field i along x, y, z
 * \param indexVectorSize    number of records to process
 * \param order_0..4         exponents applied to the corresponding rho values
 * \param rate_coefficient   constant factor of the rate
 * \param stoech_0..4        factors scaling the rate added to each rho
 */
static FUNC_PREFIX void reactionkernelindexed_5_double_precision_boundary_ReactionKernelIndexed_5_double_precision(uint8_t *RESTRICT const _data_indexVector, double *RESTRICT _data_rho_0, double *RESTRICT _data_rho_1, double *RESTRICT _data_rho_2, double *RESTRICT _data_rho_3, double *RESTRICT _data_rho_4, int64_t const _stride_rho_0_0, int64_t const _stride_rho_0_1, int64_t const _stride_rho_0_2, int64_t const _stride_rho_1_0, int64_t const _stride_rho_1_1, int64_t const _stride_rho_1_2, int64_t const _stride_rho_2_0, int64_t const _stride_rho_2_1, int64_t const _stride_rho_2_2, int64_t const _stride_rho_3_0, int64_t const _stride_rho_3_1, int64_t const _stride_rho_3_2, int64_t const _stride_rho_4_0, int64_t const _stride_rho_4_1, int64_t const _stride_rho_4_2, int32_t indexVectorSize, double order_0, double order_1, double order_2, double order_3, double order_4, double rate_coefficient, double stoech_0, double stoech_1, double stoech_2, double stoech_3, double stoech_4) {
#pragma omp parallel for schedule(static)
  for (int64_t entry = 0; entry < indexVectorSize; ++entry) {
    // Each record is 12 bytes wide; its first three int32 values are x, y, z.
    const int32_t *const coords = reinterpret_cast<const int32_t *>(&_data_indexVector[12 * entry]);
    const int32_t x = coords[0];
    const int32_t y = coords[1];
    const int32_t z = coords[2];

    // Flat element offset of the cell inside each field.
    const int64_t offset_0 = _stride_rho_0_0 * x + _stride_rho_0_1 * y + _stride_rho_0_2 * z;
    const int64_t offset_1 = _stride_rho_1_0 * x + _stride_rho_1_1 * y + _stride_rho_1_2 * z;
    const int64_t offset_2 = _stride_rho_2_0 * x + _stride_rho_2_1 * y + _stride_rho_2_2 * z;
    const int64_t offset_3 = _stride_rho_3_0 * x + _stride_rho_3_1 * y + _stride_rho_3_2 * z;
    const int64_t offset_4 = _stride_rho_4_0 * x + _stride_rho_4_1 * y + _stride_rho_4_2 * z;

    // All five values are read before any of them is overwritten.
    const double rho_0_old = _data_rho_0[offset_0];
    const double rho_1_old = _data_rho_1[offset_1];
    const double rho_2_old = _data_rho_2[offset_2];
    const double rho_3_old = _data_rho_3[offset_3];
    const double rho_4_old = _data_rho_4[offset_4];

    const double reaction_rate = pow(rho_0_old, order_0) * pow(rho_1_old, order_1) * pow(rho_2_old, order_2) * pow(rho_3_old, order_3) * pow(rho_4_old, order_4) * rate_coefficient;

    _data_rho_0[offset_0] = rho_0_old + reaction_rate * stoech_0;
    _data_rho_1[offset_1] = rho_1_old + reaction_rate * stoech_1;
    _data_rho_2[offset_2] = rho_2_old + reaction_rate * stoech_2;
    _data_rho_3[offset_3] = rho_3_old + reaction_rate * stoech_3;
    _data_rho_4[offset_4] = rho_4_old + reaction_rate * stoech_4;
  }
}


} // namespace internal_714956d26e6eb81c5dec60e7ab7da8ab


// NOLINTEND(readability-non-const-parameter*)

#ifdef __GNUC__

#pragma GCC diagnostic pop

#endif


#if defined(__CUDACC__) and !defined(__clang__)

#pragma pop

#endif


/**
 * Gathers the kernel arguments for one block and launches the reaction kernel.
 *
 * Looks up the block's index vectors and returns immediately when the index
 * vector selected by \p type is empty. Otherwise it fetches the five rho
 * fields, takes their data pointers at cell (0, 0, 0, 0) together with their
 * x/y/z strides, and forwards everything, along with the stored reaction
 * orders, stoichiometric factors and rate coefficient, to the internal kernel.
 *
 * \param block  block whose data is read and updated
 * \param type   selects which index vector of the block is processed
 */
void ReactionKernelIndexed_5_double_precision::run_impl(IBlock *block, IndexVectors::Type type) {
  using Field_T = field::GhostLayerField<double, 1>;

  auto *indexVectors = block->uncheckedFastGetData<IndexVectors>(indexVectorID);
  const int32_t indexVectorSize = int32_c(indexVectors->indexVector(type).size());
  if (indexVectorSize == 0) {
    return; // nothing to process for this selection
  }

  // The kernel consumes the index records as raw bytes.
  uint8_t *_data_indexVector = reinterpret_cast<uint8_t *>(indexVectors->pointerCpu(type));

  auto rho_0 = block->getData<Field_T>(rho_0ID);
  auto rho_1 = block->getData<Field_T>(rho_1ID);
  auto rho_2 = block->getData<Field_T>(rho_2ID);
  auto rho_3 = block->getData<Field_T>(rho_3ID);
  auto rho_4 = block->getData<Field_T>(rho_4ID);

  // Field 0: base pointer and strides.
  WALBERLA_ASSERT_GREATER_EQUAL(0, -int_c(rho_0->nrOfGhostLayers()))
  double *RESTRICT _data_rho_0 = rho_0->dataAt(0, 0, 0, 0);
  const int64_t _stride_rho_0_0 = int64_t(rho_0->xStride());
  const int64_t _stride_rho_0_1 = int64_t(rho_0->yStride());
  const int64_t _stride_rho_0_2 = int64_t(rho_0->zStride());

  // Field 1: base pointer and strides.
  WALBERLA_ASSERT_GREATER_EQUAL(0, -int_c(rho_1->nrOfGhostLayers()))
  double *RESTRICT _data_rho_1 = rho_1->dataAt(0, 0, 0, 0);
  const int64_t _stride_rho_1_0 = int64_t(rho_1->xStride());
  const int64_t _stride_rho_1_1 = int64_t(rho_1->yStride());
  const int64_t _stride_rho_1_2 = int64_t(rho_1->zStride());

  // Field 2: base pointer and strides.
  WALBERLA_ASSERT_GREATER_EQUAL(0, -int_c(rho_2->nrOfGhostLayers()))
  double *RESTRICT _data_rho_2 = rho_2->dataAt(0, 0, 0, 0);
  const int64_t _stride_rho_2_0 = int64_t(rho_2->xStride());
  const int64_t _stride_rho_2_1 = int64_t(rho_2->yStride());
  const int64_t _stride_rho_2_2 = int64_t(rho_2->zStride());

  // Field 3: base pointer and strides.
  WALBERLA_ASSERT_GREATER_EQUAL(0, -int_c(rho_3->nrOfGhostLayers()))
  double *RESTRICT _data_rho_3 = rho_3->dataAt(0, 0, 0, 0);
  const int64_t _stride_rho_3_0 = int64_t(rho_3->xStride());
  const int64_t _stride_rho_3_1 = int64_t(rho_3->yStride());
  const int64_t _stride_rho_3_2 = int64_t(rho_3->zStride());

  // Field 4: base pointer and strides.
  WALBERLA_ASSERT_GREATER_EQUAL(0, -int_c(rho_4->nrOfGhostLayers()))
  double *RESTRICT _data_rho_4 = rho_4->dataAt(0, 0, 0, 0);
  const int64_t _stride_rho_4_0 = int64_t(rho_4->xStride());
  const int64_t _stride_rho_4_1 = int64_t(rho_4->yStride());
  const int64_t _stride_rho_4_2 = int64_t(rho_4->zStride());

  // The scalar parameters are taken by value, so the members are passed directly.
  internal_714956d26e6eb81c5dec60e7ab7da8ab::reactionkernelindexed_5_double_precision_boundary_ReactionKernelIndexed_5_double_precision(
      _data_indexVector,
      _data_rho_0, _data_rho_1, _data_rho_2, _data_rho_3, _data_rho_4,
      _stride_rho_0_0, _stride_rho_0_1, _stride_rho_0_2,
      _stride_rho_1_0, _stride_rho_1_1, _stride_rho_1_2,
      _stride_rho_2_0, _stride_rho_2_1, _stride_rho_2_2,
      _stride_rho_3_0, _stride_rho_3_1, _stride_rho_3_2,
      _stride_rho_4_0, _stride_rho_4_1, _stride_rho_4_2,
      indexVectorSize,
      order_0_, order_1_, order_2_, order_3_, order_4_,
      rate_coefficient_,
      stoech_0_, stoech_1_, stoech_2_, stoech_3_, stoech_4_);
}


/// Runs the kernel on \p block using the IndexVectors::ALL index vector.
void ReactionKernelIndexed_5_double_precision::run(IBlock *block) {
  const IndexVectors::Type selection = IndexVectors::ALL;
  run_impl(block, selection);
}


/// Runs the kernel on \p block using the IndexVectors::INNER index vector.
void ReactionKernelIndexed_5_double_precision::inner(IBlock *block) {
  const IndexVectors::Type selection = IndexVectors::INNER;
  run_impl(block, selection);
}


/// Runs the kernel on \p block using the IndexVectors::OUTER index vector.
void ReactionKernelIndexed_5_double_precision::outer(IBlock *block) {
  const IndexVectors::Type selection = IndexVectors::OUTER;
  run_impl(block, selection);
}


} // namespace pystencils

} // namespace walberla

FUNC_PREFIX
#define FUNC_PREFIX
\file AdvectiveFluxKernel_double_precision.cpp \author pystencils
Definition AdvectiveFluxKernel_double_precision.cpp:28

RESTRICT
#define RESTRICT
\file AdvectiveFluxKernel_double_precision.h \author pystencils
Definition AdvectiveFluxKernel_double_precision.h:40

ReactionKernelIndexed_5_double_precision.h

walberla::pystencils::ReactionKernelIndexed_5_double_precision::IndexVectors::OUTER
@ OUTER
Definition ReactionKernelIndexed_5_double_precision.h:89

walberla::pystencils::ReactionKernelIndexed_5_double_precision::IndexVectors::ALL
@ ALL
Definition ReactionKernelIndexed_5_double_precision.h:89

walberla::pystencils::ReactionKernelIndexed_5_double_precision::IndexVectors::INNER
@ INNER
Definition ReactionKernelIndexed_5_double_precision.h:89

walberla::pystencils::ReactionKernelIndexed_5_double_precision
Definition ReactionKernelIndexed_5_double_precision.h:73

walberla::pystencils::ReactionKernelIndexed_5_double_precision::stoech_2_
double stoech_2_
Definition ReactionKernelIndexed_5_double_precision.h:245

walberla::pystencils::ReactionKernelIndexed_5_double_precision::stoech_4_
double stoech_4_
Definition ReactionKernelIndexed_5_double_precision.h:247

walberla::pystencils::ReactionKernelIndexed_5_double_precision::rate_coefficient_
double rate_coefficient_
Definition ReactionKernelIndexed_5_double_precision.h:242

walberla::pystencils::ReactionKernelIndexed_5_double_precision::run
void run(IBlock *block)
Definition ReactionKernelIndexed_5_double_precision.cpp:139

walberla::pystencils::ReactionKernelIndexed_5_double_precision::order_0_
double order_0_
Definition ReactionKernelIndexed_5_double_precision.h:237

walberla::pystencils::ReactionKernelIndexed_5_double_precision::order_1_
double order_1_
Definition ReactionKernelIndexed_5_double_precision.h:238

walberla::pystencils::ReactionKernelIndexed_5_double_precision::rho_0ID
BlockDataID rho_0ID
Definition ReactionKernelIndexed_5_double_precision.h:232

walberla::pystencils::ReactionKernelIndexed_5_double_precision::order_3_
double order_3_
Definition ReactionKernelIndexed_5_double_precision.h:240

walberla::pystencils::ReactionKernelIndexed_5_double_precision::stoech_1_
double stoech_1_
Definition ReactionKernelIndexed_5_double_precision.h:244

walberla::pystencils::ReactionKernelIndexed_5_double_precision::stoech_3_
double stoech_3_
Definition ReactionKernelIndexed_5_double_precision.h:246

walberla::pystencils::ReactionKernelIndexed_5_double_precision::stoech_0_
double stoech_0_
Definition ReactionKernelIndexed_5_double_precision.h:243

walberla::pystencils::ReactionKernelIndexed_5_double_precision::inner
void inner(IBlock *block)
Definition ReactionKernelIndexed_5_double_precision.cpp:143

walberla::pystencils::ReactionKernelIndexed_5_double_precision::rho_1ID
BlockDataID rho_1ID
Definition ReactionKernelIndexed_5_double_precision.h:233

walberla::pystencils::ReactionKernelIndexed_5_double_precision::outer
void outer(IBlock *block)
Definition ReactionKernelIndexed_5_double_precision.cpp:147

walberla::pystencils::ReactionKernelIndexed_5_double_precision::rho_3ID
BlockDataID rho_3ID
Definition ReactionKernelIndexed_5_double_precision.h:235

walberla::pystencils::ReactionKernelIndexed_5_double_precision::order_2_
double order_2_
Definition ReactionKernelIndexed_5_double_precision.h:239

walberla::pystencils::ReactionKernelIndexed_5_double_precision::rho_4ID
BlockDataID rho_4ID
Definition ReactionKernelIndexed_5_double_precision.h:236

walberla::pystencils::ReactionKernelIndexed_5_double_precision::order_4_
double order_4_
Definition ReactionKernelIndexed_5_double_precision.h:241

walberla::pystencils::ReactionKernelIndexed_5_double_precision::rho_2ID
BlockDataID rho_2ID
Definition ReactionKernelIndexed_5_double_precision.h:234

stream
cudaStream_t stream[1]
CUDA streams for parallel computing on CPU and GPU.
Definition common_cuda.cu:34

block
static double * block(double *p, std::size_t index, std::size_t size)
Definition elc.cpp:175

std
STL namespace.

walberla::pystencils::internal_714956d26e6eb81c5dec60e7ab7da8ab::reactionkernelindexed_5_double_precision_boundary_ReactionKernelIndexed_5_double_precision
static FUNC_PREFIX void reactionkernelindexed_5_double_precision_boundary_ReactionKernelIndexed_5_double_precision(uint8_t *RESTRICT const _data_indexVector, double *RESTRICT _data_rho_0, double *RESTRICT _data_rho_1, double *RESTRICT _data_rho_2, double *RESTRICT _data_rho_3, double *RESTRICT _data_rho_4, int64_t const _stride_rho_0_0, int64_t const _stride_rho_0_1, int64_t const _stride_rho_0_2, int64_t const _stride_rho_1_0, int64_t const _stride_rho_1_1, int64_t const _stride_rho_1_2, int64_t const _stride_rho_2_0, int64_t const _stride_rho_2_1, int64_t const _stride_rho_2_2, int64_t const _stride_rho_3_0, int64_t const _stride_rho_3_1, int64_t const _stride_rho_3_2, int64_t const _stride_rho_4_0, int64_t const _stride_rho_4_1, int64_t const _stride_rho_4_2, int32_t indexVectorSize, double order_0, double order_1, double order_2, double order_3, double order_4, double rate_coefficient, double stoech_0, double stoech_1, double stoech_2, double stoech_3, double stoech_4)
Definition ReactionKernelIndexed_5_double_precision.cpp:50

walberla
\file PackInfoPdfDoublePrecision.cpp \author pystencils
Definition EKWalberla.hpp:38