// Collect everything the kernel launch further down needs for a sweep over
// the full extent of the fields: the two GPU fields stored on `block` under
// rhoID and jID, raw data pointers, iteration extents and strides.
61 auto rho =
block->getData<gpu::GPUField<float>>(rhoID);
62 auto j =
block->getData<gpu::GPUField<float>>(jID);
// dataAt() below is called with index -1 on every axis, so j must provide at
// least one ghost layer (-1 >= -nrOfGhostLayers).
64 WALBERLA_ASSERT_GREATER_EQUAL(-1, -int_c(j->nrOfGhostLayers()))
// Start pointer of j at cell (-1, -1, -1), last index 0.
65 float *
RESTRICT const _data_j = j->dataAt(-1, -1, -1, 0);
// j is asserted to use the fzyx layout; the identical assertion is repeated
// after each extent below.
66 WALBERLA_ASSERT_EQUAL(j->layout(), field::fzyx)
// Same ghost-layer requirement and start cell for rho. Unlike _data_j, this
// pointer variable is not declared const.
67 WALBERLA_ASSERT_GREATER_EQUAL(-1, -int_c(rho->nrOfGhostLayers()))
68 float *
RESTRICT _data_rho = rho->dataAt(-1, -1, -1, 0);
// Extents handed to the kernel: the field size plus 2 on each axis. Each
// assertion checks that the ghost-layer-inclusive size of j can hold it.
// NOTE(review): the +2 presumably accounts for one extra cell on either side,
// consistent with the -1 start offset above -- confirm against the kernel.
69 WALBERLA_ASSERT_GREATER_EQUAL(j->xSizeWithGhostLayer(), int64_t(int64_c(j->xSize()) + 2))
70 const int64_t _size_j_0 = int64_t(int64_c(j->xSize()) + 2);
71 WALBERLA_ASSERT_EQUAL(j->layout(), field::fzyx)
72 WALBERLA_ASSERT_GREATER_EQUAL(j->ySizeWithGhostLayer(), int64_t(int64_c(j->ySize()) + 2))
73 const int64_t _size_j_1 = int64_t(int64_c(j->ySize()) + 2);
74 WALBERLA_ASSERT_EQUAL(j->layout(), field::fzyx)
75 WALBERLA_ASSERT_GREATER_EQUAL(j->zSizeWithGhostLayer(), int64_t(int64_c(j->zSize()) + 2))
76 const int64_t _size_j_2 = int64_t(int64_c(j->zSize()) + 2);
77 WALBERLA_ASSERT_EQUAL(j->layout(), field::fzyx)
// Strides of j along x, y, z and f, converted to int64_t.
78 const int64_t _stride_j_0 = int64_t(j->xStride());
79 const int64_t _stride_j_1 = int64_t(j->yStride());
80 const int64_t _stride_j_2 = int64_t(j->zStride());
81 const int64_t _stride_j_3 = int64_t(1 * int64_t(j->fStride()));
// Strides of rho along x, y, z; no f stride is read for rho.
82 const int64_t _stride_rho_0 = int64_t(rho->xStride());
83 const int64_t _stride_rho_1 = int64_t(rho->yStride());
84 const int64_t _stride_rho_2 = int64_t(rho->zStride());
85 dim3 _block(uint32_c(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)), uint32_c(((1024 < ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))) ? 1024 : ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))))), uint32_c(((64 < ((_size_j_2 - 2 < ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) ? _size_j_2 - 2 : ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))))))) ? 64 : ((_size_j_2 - 2 < ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) ? _size_j_2 - 2 : ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))))));
86 dim3 _grid(uint32_c(((_size_j_0 - 2) % (((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)) == 0 ? (int64_t)(_size_j_0 - 2) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)) : ((int64_t)(_size_j_0 - 2) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))) + 1)), uint32_c(((_size_j_1 - 2) % (((1024 < ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))) ? 1024 : ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))))) == 0 ? (int64_t)(_size_j_1 - 2) / (int64_t)(((1024 < ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))) ? 1024 : ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))))) : ((int64_t)(_size_j_1 - 2) / (int64_t)(((1024 < ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))) ? 1024 : ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) + 1)), uint32_c(((_size_j_2 - 2) % (((64 < ((_size_j_2 - 2 < ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) ? 
_size_j_2 - 2 : ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))))))) ? 64 : ((_size_j_2 - 2 < ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) ? _size_j_2 - 2 : ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))))) == 0 ? (int64_t)(_size_j_2 - 2) / (int64_t)(((64 < ((_size_j_2 - 2 < ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) ? _size_j_2 - 2 : ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))))))) ? 64 : ((_size_j_2 - 2 < ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) ? _size_j_2 - 2 : ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 
128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))))) : ((int64_t)(_size_j_2 - 2) / (int64_t)(((64 < ((_size_j_2 - 2 < ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) ? _size_j_2 - 2 : ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))))))) ? 64 : ((_size_j_2 - 2 < ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) ? _size_j_2 - 2 : ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))))))))) + 1)));
// Launch the kernel on `stream` with the _grid/_block dimensions computed
// above; the third launch parameter (dynamic shared memory size) is 0.
// With n_x/n_y/n_z = _size_j_0/1/2 - 2, the block shape works out to
//   x = min(128, n_x)
//   y = min(1024, n_y, 2 * (128 / x))
//   z = min(64, n_z, 256 / (x * y))
// and each grid dimension is n / block rounded up to the next integer.
// The kernel receives both data pointers, the three extents, the four j
// strides and the three rho strides.
87 internal_continuitykernel_single_precision_cuda_continuitykernel_single_precision_cuda::continuitykernel_single_precision_cuda_continuitykernel_single_precision_cuda<<<_grid, _block, 0, stream>>>(_data_j, _data_rho, _size_j_0, _size_j_1, _size_j_2, _stride_j_0, _stride_j_1, _stride_j_2, _stride_j_3, _stride_rho_0, _stride_rho_1, _stride_rho_2);
// Restrict the requested global cell interval to this block: intersect a copy
// of it with the block's cell bounding box after expanding that box by
// `ghostLayers`, then convert the result to block-local coordinates (as the
// name transformGlobalToBlockLocalCellInterval indicates).
// NOTE(review): the intersection is presumably empty when the interval does
// not touch this block. The launch configuration further down divides by
// (_size_j_0 - 2), i.e. by ci.xSize(), so confirm that an empty `ci` is
// rejected before the launch -- no such check is visible in this excerpt.
92 CellInterval ci = globalCellInterval;
93 CellInterval blockBB = blocks->getBlockCellBB(*
block);
94 blockBB.expand(ghostLayers);
95 ci.intersect(blockBB);
96 blocks->transformGlobalToBlockLocalCellInterval(ci, *
block);
// Collect everything the kernel launch further down needs for a sweep over
// the cell interval `ci`: the two GPU fields stored on `block` under rhoID
// and jID, raw data pointers, iteration extents and strides.
100 auto rho =
block->getData<gpu::GPUField<float>>(rhoID);
101 auto j =
block->getData<gpu::GPUField<float>>(jID);
// The start cell lies one cell before ci's minimum on every axis; it must
// not fall below -nrOfGhostLayers of j.
103 WALBERLA_ASSERT_GREATER_EQUAL(ci.xMin() - 1, -int_c(j->nrOfGhostLayers()))
104 WALBERLA_ASSERT_GREATER_EQUAL(ci.yMin() - 1, -int_c(j->nrOfGhostLayers()))
105 WALBERLA_ASSERT_GREATER_EQUAL(ci.zMin() - 1, -int_c(j->nrOfGhostLayers()))
// Start pointer of j at (ci.min - 1) on each axis, last index 0.
106 float *
RESTRICT const _data_j = j->dataAt(ci.xMin() - 1, ci.yMin() - 1, ci.zMin() - 1, 0);
// j is asserted to use the fzyx layout; the identical assertion is repeated
// after each extent below.
107 WALBERLA_ASSERT_EQUAL(j->layout(), field::fzyx)
// Same bounds requirement and start cell for rho. Unlike _data_j, this
// pointer variable is not declared const.
108 WALBERLA_ASSERT_GREATER_EQUAL(ci.xMin() - 1, -int_c(rho->nrOfGhostLayers()))
109 WALBERLA_ASSERT_GREATER_EQUAL(ci.yMin() - 1, -int_c(rho->nrOfGhostLayers()))
110 WALBERLA_ASSERT_GREATER_EQUAL(ci.zMin() - 1, -int_c(rho->nrOfGhostLayers()))
111 float *
RESTRICT _data_rho = rho->dataAt(ci.xMin() - 1, ci.yMin() - 1, ci.zMin() - 1, 0);
// Extents handed to the kernel: the interval size plus 2 on each axis. Each
// assertion checks that the ghost-layer-inclusive size of j can hold it.
// NOTE(review): the +2 presumably accounts for one extra cell on either side,
// consistent with the -1 start offset above -- confirm against the kernel.
112 WALBERLA_ASSERT_GREATER_EQUAL(j->xSizeWithGhostLayer(), int64_t(int64_c(ci.xSize()) + 2))
113 const int64_t _size_j_0 = int64_t(int64_c(ci.xSize()) + 2);
114 WALBERLA_ASSERT_EQUAL(j->layout(), field::fzyx)
115 WALBERLA_ASSERT_GREATER_EQUAL(j->ySizeWithGhostLayer(), int64_t(int64_c(ci.ySize()) + 2))
116 const int64_t _size_j_1 = int64_t(int64_c(ci.ySize()) + 2);
117 WALBERLA_ASSERT_EQUAL(j->layout(), field::fzyx)
118 WALBERLA_ASSERT_GREATER_EQUAL(j->zSizeWithGhostLayer(), int64_t(int64_c(ci.zSize()) + 2))
119 const int64_t _size_j_2 = int64_t(int64_c(ci.zSize()) + 2);
120 WALBERLA_ASSERT_EQUAL(j->layout(), field::fzyx)
// Strides of j along x, y, z and f, converted to int64_t.
121 const int64_t _stride_j_0 = int64_t(j->xStride());
122 const int64_t _stride_j_1 = int64_t(j->yStride());
123 const int64_t _stride_j_2 = int64_t(j->zStride());
124 const int64_t _stride_j_3 = int64_t(1 * int64_t(j->fStride()));
// Strides of rho along x, y, z; no f stride is read for rho.
125 const int64_t _stride_rho_0 = int64_t(rho->xStride());
126 const int64_t _stride_rho_1 = int64_t(rho->yStride());
127 const int64_t _stride_rho_2 = int64_t(rho->zStride());
128 dim3 _block(uint32_c(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)), uint32_c(((1024 < ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))) ? 1024 : ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))))), uint32_c(((64 < ((_size_j_2 - 2 < ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) ? _size_j_2 - 2 : ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))))))) ? 64 : ((_size_j_2 - 2 < ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) ? _size_j_2 - 2 : ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))))));
129 dim3 _grid(uint32_c(((_size_j_0 - 2) % (((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)) == 0 ? (int64_t)(_size_j_0 - 2) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)) : ((int64_t)(_size_j_0 - 2) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))) + 1)), uint32_c(((_size_j_1 - 2) % (((1024 < ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))) ? 1024 : ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))))) == 0 ? (int64_t)(_size_j_1 - 2) / (int64_t)(((1024 < ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))) ? 1024 : ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))))) : ((int64_t)(_size_j_1 - 2) / (int64_t)(((1024 < ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))) ? 1024 : ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) + 1)), uint32_c(((_size_j_2 - 2) % (((64 < ((_size_j_2 - 2 < ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) ? 
_size_j_2 - 2 : ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))))))) ? 64 : ((_size_j_2 - 2 < ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) ? _size_j_2 - 2 : ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))))) == 0 ? (int64_t)(_size_j_2 - 2) / (int64_t)(((64 < ((_size_j_2 - 2 < ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) ? _size_j_2 - 2 : ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))))))) ? 64 : ((_size_j_2 - 2 < ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) ? _size_j_2 - 2 : ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 
128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))))) : ((int64_t)(_size_j_2 - 2) / (int64_t)(((64 < ((_size_j_2 - 2 < ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) ? _size_j_2 - 2 : ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))))))) ? 64 : ((_size_j_2 - 2 < ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2))))))) ? _size_j_2 - 2 : ((int64_t)(256) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2) * ((_size_j_1 - 2 < 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))) ? _size_j_1 - 2 : 2 * ((int64_t)(128) / (int64_t)(((128 < _size_j_0 - 2) ? 128 : _size_j_0 - 2)))))))))) + 1)));
// Launch the kernel on `stream` with the _grid/_block dimensions computed
// above; the third launch parameter (dynamic shared memory size) is 0.
// With n_x/n_y/n_z = _size_j_0/1/2 - 2 (the extents of `ci`), the block shape
// works out to
//   x = min(128, n_x)
//   y = min(1024, n_y, 2 * (128 / x))
//   z = min(64, n_z, 256 / (x * y))
// and each grid dimension is n / block rounded up to the next integer.
// The kernel receives both data pointers, the three extents, the four j
// strides and the three rho strides.
130 internal_continuitykernel_single_precision_cuda_continuitykernel_single_precision_cuda::continuitykernel_single_precision_cuda_continuitykernel_single_precision_cuda<<<_grid, _block, 0, stream>>>(_data_j, _data_rho, _size_j_0, _size_j_1, _size_j_2, _stride_j_0, _stride_j_1, _stride_j_2, _stride_j_3, _stride_rho_0, _stride_rho_1, _stride_rho_2);