X-Git-Url: http://git.rrze.uni-erlangen.de/gitweb/?p=LbmBenchmarkKernelsPublic.git;a=blobdiff_plain;f=src%2FBenchKernelD3Q19ListPullSplitNt1SIntrinsics.h;h=bb075fa95fbd3483792561f3ffeba8837e29d6ef;hp=a3e586b7ab7187fbc3b5bb506af679e29e98fa03;hb=0fde6e45e9be83893afae896cf49a799777f6d7c;hpb=712d0b8fc4a382e1cfe4edef8b0ade11b0a2ce25 diff --git a/src/BenchKernelD3Q19ListPullSplitNt1SIntrinsics.h b/src/BenchKernelD3Q19ListPullSplitNt1SIntrinsics.h index a3e586b..bb075fa 100644 --- a/src/BenchKernelD3Q19ListPullSplitNt1SIntrinsics.h +++ b/src/BenchKernelD3Q19ListPullSplitNt1SIntrinsics.h @@ -41,6 +41,9 @@ #ifdef DEBUG memset(tmpArray, -1, sizeof(PdfT) * nTmpArray * N_TMP); #endif + #ifdef INTEL_OPT_DIRECTIVES + #pragma ivdep + #endif for (int index = 0; index < indexMax; ++index) { @@ -69,7 +72,7 @@ pdf_T + pdf_TN + pdf_TE + pdf_TS + pdf_TW + pdf_B + pdf_BN + pdf_BE + pdf_BS + pdf_BW; - dir_indep_trm = dens - (ux * ux + uy * uy + uz * uz) * 3.0 / 2.0; + dir_indep_trm = dens - (ux * ux + uy * uy + uz * uz) * F(3.0) / F(2.0); w_1_indep = w_1 * dir_indep_trm; w_2_indep = w_2 * dir_indep_trm;