dox/ReactionKernelBulk__3__single__precision__CUDA_8h_source.html

//======================================================================================================================

//

//  This file is part of waLBerla. waLBerla is free software: you can

//  redistribute it and/or modify it under the terms of the GNU General Public

//  License as published by the Free Software Foundation, either version 3 of

//  the License, or (at your option) any later version.

//

//  waLBerla is distributed in the hope that it will be useful, but WITHOUT

//  ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or

//  FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License

//  for more details.

//

//  You should have received a copy of the GNU General Public License along

//  with waLBerla (see COPYING.txt). If not, see <http://www.gnu.org/licenses/>.

//

//! \file ReactionKernelBulk_3_single_precision_CUDA.h

//! \author pystencils

//======================================================================================================================


// kernel generated with pystencils v1.4+1.ge851f4e, lbmpy v1.4+1.ge9efe34,

// sympy v1.12.1, lbmpy_walberla/pystencils_walberla from waLBerla commit

// 007e77e077ad9d22b5eed6f3d3118240993e553c


#pragma once

#include "core/DataTypes.h"

#include "core/logging/Logging.h"


#include "gpu/GPUField.h"

#include "gpu/GPUWrapper.h"


#include "domain_decomposition/BlockDataID.h"

#include "domain_decomposition/IBlock.h"

#include "domain_decomposition/StructuredBlockStorage.h"

#include "field/SwapableCompare.h"


#include <functional>

#include <unordered_map>


// RESTRICT expands to the `__restrict__` qualifier when the compiler defines
// __GNUC__, and to nothing on every other compiler.
#if defined(__GNUC__)
#  define RESTRICT __restrict__
#else
#  define RESTRICT
#endif


// On GNU and Clang compilers (as reported by the WALBERLA_CXX_COMPILER_IS_*
// macros), save the current diagnostic state and silence -Wunused-parameter
// and -Wreorder for the code that follows. The saved state is restored by the
// matching `#pragma GCC diagnostic pop` at the end of this header.
//
// The condition is deliberately written on a single physical line: a
// backslash continuation followed by an empty line would end the expression
// right after `||` and make the directive ill-formed.
#if defined(WALBERLA_CXX_COMPILER_IS_GNU) || defined(WALBERLA_CXX_COMPILER_IS_CLANG)
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-parameter"
#pragma GCC diagnostic ignored "-Wreorder"
#endif


namespace walberla {

namespace pystencils {


class ReactionKernelBulk_3_single_precision_CUDA {

public:


  ReactionKernelBulk_3_single_precision_CUDA(

      BlockDataID rho_0ID_, BlockDataID rho_1ID_, BlockDataID rho_2ID_,

      float order_0, float order_1, float order_2, float rate_coefficient,

      float stoech_0, float stoech_1, float stoech_2)

      : rho_0ID(rho_0ID_), rho_1ID(rho_1ID_), rho_2ID(rho_2ID_),

        order_0_(order_0), order_1_(order_1), order_2_(order_2),

        rate_coefficient_(rate_coefficient), stoech_0_(stoech_0),

        stoech_1_(stoech_1), stoech_2_(stoech_2) {}


  void run(IBlock *block, gpuStream_t stream = nullptr);


  void runOnCellInterval(const shared_ptr<StructuredBlockStorage> &blocks,

                         const CellInterval &globalCellInterval,

                         cell_idx_t ghostLayers, IBlock *block,

                         gpuStream_t stream = nullptr);


  void operator()(IBlock *block, gpuStream_t stream = nullptr) {

    run(block, stream);

  }


  static std::function<void(IBlock *)> getSweep(

      const shared_ptr<ReactionKernelBulk_3_single_precision_CUDA> &kernel) {

    return [kernel](IBlock *b) { kernel->run(b); };

  }


  static std::function<void(IBlock *, gpuStream_t)> getSweepOnCellInterval(

      const shared_ptr<ReactionKernelBulk_3_single_precision_CUDA> &kernel,

      const shared_ptr<StructuredBlockStorage> &blocks,

      const CellInterval &globalCellInterval, cell_idx_t ghostLayers = 1) {

    return [kernel, blocks, globalCellInterval,

            ghostLayers](IBlock *b, gpuStream_t stream = nullptr) {

      kernel->runOnCellInterval(blocks, globalCellInterval, ghostLayers, b,

                                stream);

    };

  }


  std::function<void(IBlock *)> getSweep(gpuStream_t stream = nullptr) {

    return [this, stream](IBlock *b) { this->run(b, stream); };

  }


  std::function<void(IBlock *)>


  getSweepOnCellInterval(const shared_ptr<StructuredBlockStorage> &blocks,

                         const CellInterval &globalCellInterval,

                         cell_idx_t ghostLayers = 1,

                         gpuStream_t stream = nullptr) {

    return [this, blocks, globalCellInterval, ghostLayers, stream](IBlock *b) {

      this->runOnCellInterval(blocks, globalCellInterval, ghostLayers, b,

                              stream);

    };

  }


  void configure(const shared_ptr<StructuredBlockStorage> & /*blocks*/,

                 IBlock * /*block*/) {}


  inline float getOrder_0() const { return order_0_; }

  inline float getOrder_1() const { return order_1_; }

  inline float getOrder_2() const { return order_2_; }

  inline float getRate_coefficient() const { return rate_coefficient_; }

  inline float getStoech_0() const { return stoech_0_; }

  inline float getStoech_1() const { return stoech_1_; }

  inline float getStoech_2() const { return stoech_2_; }

  inline void setOrder_0(const float value) { order_0_ = value; }

  inline void setOrder_1(const float value) { order_1_ = value; }

  inline void setOrder_2(const float value) { order_2_ = value; }


  inline void setRate_coefficient(const float value) {

    rate_coefficient_ = value;

  }


  inline void setStoech_0(const float value) { stoech_0_ = value; }

  inline void setStoech_1(const float value) { stoech_1_ = value; }

  inline void setStoech_2(const float value) { stoech_2_ = value; }


private:

  BlockDataID rho_0ID;

  BlockDataID rho_1ID;

  BlockDataID rho_2ID;

  float order_0_;

  float order_1_;

  float order_2_;

  float rate_coefficient_;

  float stoech_0_;

  float stoech_1_;

  float stoech_2_;

};


} // namespace pystencils

} // namespace walberla


// Restore the diagnostic state that was saved by the
// `#pragma GCC diagnostic push` near the top of this header (GNU and Clang
// compilers only, as reported by the WALBERLA_CXX_COMPILER_IS_* macros).
//
// The condition is deliberately written on a single physical line: a
// backslash continuation followed by an empty line would end the expression
// right after `||` and make the directive ill-formed.
#if defined(WALBERLA_CXX_COMPILER_IS_GNU) || defined(WALBERLA_CXX_COMPILER_IS_CLANG)
#pragma GCC diagnostic pop
#endif

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA
Definition ReactionKernelBulk_3_single_precision_CUDA.h:55

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::setStoech_1
void setStoech_1(const float value)
Definition ReactionKernelBulk_3_single_precision_CUDA.h:125

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::configure
void configure(const shared_ptr< StructuredBlockStorage > &, IBlock *)
Definition ReactionKernelBulk_3_single_precision_CUDA.h:108

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::setOrder_2
void setOrder_2(const float value)
Definition ReactionKernelBulk_3_single_precision_CUDA.h:120

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::getSweep
static std::function< void(IBlock *)> getSweep(const shared_ptr< ReactionKernelBulk_3_single_precision_CUDA > &kernel)
Definition ReactionKernelBulk_3_single_precision_CUDA.h:77

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::getStoech_0
float getStoech_0() const
Definition ReactionKernelBulk_3_single_precision_CUDA.h:115

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::getRate_coefficient
float getRate_coefficient() const
Definition ReactionKernelBulk_3_single_precision_CUDA.h:114

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::getStoech_1
float getStoech_1() const
Definition ReactionKernelBulk_3_single_precision_CUDA.h:116

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::operator()
void operator()(IBlock *block, gpuStream_t stream=nullptr)
Definition ReactionKernelBulk_3_single_precision_CUDA.h:73

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::getOrder_1
float getOrder_1() const
Definition ReactionKernelBulk_3_single_precision_CUDA.h:112

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::setOrder_0
void setOrder_0(const float value)
Definition ReactionKernelBulk_3_single_precision_CUDA.h:118

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::getSweepOnCellInterval
std::function< void(IBlock *)> getSweepOnCellInterval(const shared_ptr< StructuredBlockStorage > &blocks, const CellInterval &globalCellInterval, cell_idx_t ghostLayers=1, gpuStream_t stream=nullptr)
Definition ReactionKernelBulk_3_single_precision_CUDA.h:98

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::setRate_coefficient
void setRate_coefficient(const float value)
Definition ReactionKernelBulk_3_single_precision_CUDA.h:121

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::setStoech_0
void setStoech_0(const float value)
Definition ReactionKernelBulk_3_single_precision_CUDA.h:124

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::setOrder_1
void setOrder_1(const float value)
Definition ReactionKernelBulk_3_single_precision_CUDA.h:119

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::setStoech_2
void setStoech_2(const float value)
Definition ReactionKernelBulk_3_single_precision_CUDA.h:126

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::getStoech_2
float getStoech_2() const
Definition ReactionKernelBulk_3_single_precision_CUDA.h:117

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::getSweep
std::function< void(IBlock *)> getSweep(gpuStream_t stream=nullptr)
Definition ReactionKernelBulk_3_single_precision_CUDA.h:93

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::ReactionKernelBulk_3_single_precision_CUDA
ReactionKernelBulk_3_single_precision_CUDA(BlockDataID rho_0ID_, BlockDataID rho_1ID_, BlockDataID rho_2ID_, float order_0, float order_1, float order_2, float rate_coefficient, float stoech_0, float stoech_1, float stoech_2)
Definition ReactionKernelBulk_3_single_precision_CUDA.h:57

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::run
void run(IBlock *block, gpuStream_t stream=nullptr)
Definition ReactionKernelBulk_3_single_precision_CUDA.cu:65

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::getOrder_2
float getOrder_2() const
Definition ReactionKernelBulk_3_single_precision_CUDA.h:113

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::runOnCellInterval
void runOnCellInterval(const shared_ptr< StructuredBlockStorage > &blocks, const CellInterval &globalCellInterval, cell_idx_t ghostLayers, IBlock *block, gpuStream_t stream=nullptr)
Definition ReactionKernelBulk_3_single_precision_CUDA.cu:104

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::getOrder_0
float getOrder_0() const
Definition ReactionKernelBulk_3_single_precision_CUDA.h:111

walberla::pystencils::ReactionKernelBulk_3_single_precision_CUDA::getSweepOnCellInterval
static std::function< void(IBlock *, gpuStream_t)> getSweepOnCellInterval(const shared_ptr< ReactionKernelBulk_3_single_precision_CUDA > &kernel, const shared_ptr< StructuredBlockStorage > &blocks, const CellInterval &globalCellInterval, cell_idx_t ghostLayers=1)
Definition ReactionKernelBulk_3_single_precision_CUDA.h:82

stream
cudaStream_t stream[1]
CUDA streams for parallel computing on CPU and GPU.
Definition common_cuda.cu:34

block
static double * block(double *p, std::size_t index, std::size_t size)
Definition elc.cpp:175

walberla
\file PackInfoPdfDoublePrecision.cpp \author pystencils
Definition EKWalberla.hpp:38