KernelStatistics(kd, ld, cd, 0);
#endif
+ X_KERNEL_START(kernelData);
+
// TODO: add an outer OpenMP parallel region around this iteration loop.
for(int iter = 0; iter < maxIterations; iter += 2) {
} // for (int iter = 0; ...
+ X_KERNEL_END(kernelData);
+
#ifdef VTK_OUTPUT
if (cd->VtkOutput) {
kd->PdfsActive = kd->Pdfs[0];
#define I(index, dir) P_INDEX_3((nCells), (index), (dir))
- for (int index = indexStartVec; index < indexStopVec; index += VSIZE) {
+ for (int index = indexStartVec; index < indexStopVec; index += VSIZE) { // LOOP list-aa-pv-even-vec
#define X(name, idx, idxinv, _x, _y, _z) JOIN(vpdf_,name) = VLDU(&src[I(index, idx)]);
} // loop over fluid nodes
- for (int index = indexStopVec; index < indexStop; ++index) {
+ for (int index = indexStopVec; index < indexStop; ++index) { // LOOP list-aa-pv-even-scalar
#define X(name, idx, idxinv, _x, _y, _z) JOIN(pdf_,name) = src[I(index, idx)];
D3Q19_LIST