KernelStatistics(kd, ld, cd, 0);
#endif
+ X_KERNEL_START(kernelData);
+
// TODO: outer OpenMP parallel
for(int iter = 0; iter < maxIterations; iter += 2) {
#pragma vector always
#pragma simd
#endif
- for (int index = 0; index < nFluid; ++index) {
+ for (int index = 0; index < nFluid; ++index) { // LOOP list-aa-ria-even
#define I(index, dir) P_INDEX_3((nCells), (index), (dir))
int indexStop = threadIndices[threadId] + nFluidThread;
// Because of run-length coding, iterations are not independent.
- for (int index = indexStart; index < indexStop; ++index) {
+ for (int index = indexStart; index < indexStop; ++index) { // LOOP list-aa-ria-odd
#define I(index, dir) P_INDEX_3((nCells), (index), (dir))
} // for (int iter = 0; ...
+ X_KERNEL_END(kernelData);
+
#ifdef VTK_OUTPUT
if (cd->VtkOutput) {
kd->PdfsActive = src;