projects
/
LbmBenchmarkKernelsPublic.git
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
bulk commit
[LbmBenchmarkKernelsPublic.git]
/
src
/
BenchKernelD3Q19ListPullSplitNt.c
diff --git
a/src/BenchKernelD3Q19ListPullSplitNt.c
b/src/BenchKernelD3Q19ListPullSplitNt.c
index dfab54afbdc574c3936d146e28e9925e479a1088..0132dc9058f26d7f18f153e8a0c11f37d38efa74 100644
(file)
--- a/
src/BenchKernelD3Q19ListPullSplitNt.c
+++ b/
src/BenchKernelD3Q19ListPullSplitNt.c
@@
-29,6
+29,7
@@
#include "Memory.h"
#include "Vtk.h"
#include "Vector.h"
#include "Memory.h"
#include "Vtk.h"
#include "Vector.h"
+#include "LikwidIf.h"
#include <inttypes.h>
#include <math.h>
#include <inttypes.h>
#include <math.h>
@@
-118,6
+119,8
@@
void FNAME(KernelPullSplitNt1S)(LatticeDesc * ld, KernelData * kernelData, CaseD
KernelStatistics(kd, ld, cd, 0);
#endif
KernelStatistics(kd, ld, cd, 0);
#endif
+
+ X_LIKWID_START("list-pull-split-nt-1s");
#ifdef _OPENMP
#pragma omp parallel default(none) \
shared(nFluid, nCells, kd, kdl, adjList, src, dst, \
#ifdef _OPENMP
#pragma omp parallel default(none) \
shared(nFluid, nCells, kd, kdl, adjList, src, dst, \
@@
-184,6
+187,7
@@
void FNAME(KernelPullSplitNt1S)(LatticeDesc * ld, KernelData * kernelData, CaseD
for(int iter = 0; iter < maxIterations; ++iter) {
for(int iter = 0; iter < maxIterations; ++iter) {
+
#if 1
#define INDEX_START blIndexStart
#define INDEX_STOP blIndexVec
#if 1
#define INDEX_START blIndexStart
#define INDEX_STOP blIndexVec
@@
-201,6
+205,8
@@
void FNAME(KernelPullSplitNt1S)(LatticeDesc * ld, KernelData * kernelData, CaseD
#define INDEX_STOP blIndexStop
#include "BenchKernelD3Q19ListPullSplitNt1SScalar.h"
#endif
#define INDEX_STOP blIndexStop
#include "BenchKernelD3Q19ListPullSplitNt1SScalar.h"
#endif
+
+
#pragma omp barrier
#pragma omp single
#pragma omp barrier
#pragma omp single
@@
-235,6
+241,9
@@
void FNAME(KernelPullSplitNt1S)(LatticeDesc * ld, KernelData * kernelData, CaseD
MemFree((void **)&tmpArray);
}
MemFree((void **)&tmpArray);
}
+
+ X_LIKWID_STOP("list-pull-split-nt-1s");
+
#ifdef VTK_OUTPUT
if (cd->VtkOutput) {
kd->PdfsActive = src;
#ifdef VTK_OUTPUT
if (cd->VtkOutput) {
kd->PdfsActive = src;
@@
-321,6
+330,10
@@
void FNAME(KernelPullSplitNt2S)(LatticeDesc * ld, KernelData * kernelData, CaseD
KernelStatistics(kd, ld, cd, 0);
#endif
KernelStatistics(kd, ld, cd, 0);
#endif
+
+ X_LIKWID_START("list-pull-split-nt-2s");
+
+
#ifdef _OPENMP
#pragma omp parallel default(none) \
shared(nFluid, nCells, kd, kdl, adjList, src, dst, \
#ifdef _OPENMP
#pragma omp parallel default(none) \
shared(nFluid, nCells, kd, kdl, adjList, src, dst, \
@@
-406,6
+419,7
@@
void FNAME(KernelPullSplitNt2S)(LatticeDesc * ld, KernelData * kernelData, CaseD
#endif
#pragma omp barrier
#endif
#pragma omp barrier
+
#pragma omp single
{
#ifdef VERIFICATION
#pragma omp single
{
#ifdef VERIFICATION
@@
-438,6
+452,8
@@
void FNAME(KernelPullSplitNt2S)(LatticeDesc * ld, KernelData * kernelData, CaseD
MemFree((void **)&tmpArray);
}
MemFree((void **)&tmpArray);
}
+ X_LIKWID_STOP("list-pull-split-nt-2s");
+
#ifdef VTK_OUTPUT
if (cd->VtkOutput) {
kd->PdfsActive = src;
#ifdef VTK_OUTPUT
if (cd->VtkOutput) {
kd->PdfsActive = src;
This page took
0.052923 seconds
and
5
git commands to generate.