X-Git-Url: http://git.rrze.uni-erlangen.de/gitweb/?p=LbmBenchmarkKernelsPublic.git;a=blobdiff_plain;f=src%2FBenchKernelD3Q19ListAa.c;fp=src%2FBenchKernelD3Q19ListAa.c;h=20213110c6b7bc31ba3eca4311f25fe9f33f976d;hp=045a396f5ef786343f5134b4aeb6386a2bbc446c;hb=8cafd9ea08a6b1103eab29811227a7ae536dffa6;hpb=0fde6e45e9be83893afae896cf49a799777f6d7c diff --git a/src/BenchKernelD3Q19ListAa.c b/src/BenchKernelD3Q19ListAa.c index 045a396..2021311 100644 --- a/src/BenchKernelD3Q19ListAa.c +++ b/src/BenchKernelD3Q19ListAa.c @@ -98,6 +98,8 @@ void FNAME(D3Q19ListAaKernel)(LatticeDesc * ld, KernelData * kernelData, CaseDat KernelStatistics(kd, ld, cd, 0); #endif + X_KERNEL_START(kernelData); + // TODO: outer openmp parallel for(int iter = 0; iter < maxIterations; iter += 2) { @@ -122,7 +124,7 @@ void FNAME(D3Q19ListAaKernel)(LatticeDesc * ld, KernelData * kernelData, CaseDat #pragma vector always #pragma simd #endif - for (int index = 0; index < nFluid; ++index) { + for (int index = 0; index < nFluid; ++index) { // LOOP list-aa-even #define I(index, dir) P_INDEX_3((nCells), (index), (dir)) @@ -259,7 +261,7 @@ void FNAME(D3Q19ListAaKernel)(LatticeDesc * ld, KernelData * kernelData, CaseDat #ifdef INTEL_OPT_DIRECTIVES #pragma ivdep #endif - for (int index = 0; index < nFluid; ++index) { + for (int index = 0; index < nFluid; ++index) { // LOOP list-aa-odd adjListIndex = index * N_D3Q19_IDX; @@ -397,6 +399,8 @@ void FNAME(D3Q19ListAaKernel)(LatticeDesc * ld, KernelData * kernelData, CaseDat } // for (int iter = 0; ... + X_KERNEL_END(kernelData); + #ifdef VTK_OUTPUT if (cd->VtkOutput) {