projects
/
LbmBenchmarkKernelsPublic.git
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
merge with kernels from MH's master thesis
[LbmBenchmarkKernelsPublic.git]
/
src
/
BenchKernelD3Q19ListAaRia.c
diff --git
a/src/BenchKernelD3Q19ListAaRia.c
b/src/BenchKernelD3Q19ListAaRia.c
index 245c2a539eda2c9fedd439b55d0db619dd64babd..0cb46367ff0962cfc202886b7d53e8860a2ee1c5 100644
(file)
--- a/
src/BenchKernelD3Q19ListAaRia.c
+++ b/
src/BenchKernelD3Q19ListAaRia.c
@@
-116,6
+116,8
@@
void FNAME(D3Q19ListAaRiaKernel)(LatticeDesc * ld, KernelData * kernelData, Case
KernelStatistics(kd, ld, cd, 0);
#endif
KernelStatistics(kd, ld, cd, 0);
#endif
+ X_KERNEL_START(kernelData);
+
// TODO: outer openmp parallel
for(int iter = 0; iter < maxIterations; iter += 2) {
// TODO: outer openmp parallel
for(int iter = 0; iter < maxIterations; iter += 2) {
@@
-139,7
+141,7
@@
void FNAME(D3Q19ListAaRiaKernel)(LatticeDesc * ld, KernelData * kernelData, Case
#pragma vector always
#pragma simd
#endif
#pragma vector always
#pragma simd
#endif
- for (int index = 0; index < nFluid; ++index) {
+ for (int index = 0; index < nFluid; ++index) {
// LOOP list-aa-ria-even
#define I(index, dir) P_INDEX_3((nCells), (index), (dir))
#define I(index, dir) P_INDEX_3((nCells), (index), (dir))
@@
-296,7
+298,7
@@
void FNAME(D3Q19ListAaRiaKernel)(LatticeDesc * ld, KernelData * kernelData, Case
int indexStop = threadIndices[threadId] + nFluidThread;
// Because of runlength coding iterations are not independent.
int indexStop = threadIndices[threadId] + nFluidThread;
// Because of runlength coding iterations are not independent.
- for (int index = indexStart; index < indexStop; ++index) {
+ for (int index = indexStart; index < indexStop; ++index) {
// LOOP list-aa-ria-odd
#define I(index, dir) P_INDEX_3((nCells), (index), (dir))
#define I(index, dir) P_INDEX_3((nCells), (index), (dir))
@@
-469,6
+471,8
@@
void FNAME(D3Q19ListAaRiaKernel)(LatticeDesc * ld, KernelData * kernelData, Case
} // for (int iter = 0; ...
} // for (int iter = 0; ...
+ X_KERNEL_END(kernelData);
+
#ifdef VTK_OUTPUT
if (cd->VtkOutput) {
kd->PdfsActive = src;
#ifdef VTK_OUTPUT
if (cd->VtkOutput) {
kd->PdfsActive = src;
This page took
0.046909 seconds
and
5
git commands to generate.