From 1b1c0c8e7618b7b8ae4c37745aea8f3e1601fdaf Mon Sep 17 00:00:00 2001 From: mozdal Date: Tue, 21 Jan 2014 11:47:30 -0800 Subject: [PATCH] Split the inner loop to avoid the overhead incurred when -fPIC flag is enabled. --- PairHMM_JNI/pairhmm-template-kernel.cc | 80 +++++++++++++++----------- PairHMM_JNI/utils.cc | 2 +- 2 files changed, 47 insertions(+), 35 deletions(-) diff --git a/PairHMM_JNI/pairhmm-template-kernel.cc b/PairHMM_JNI/pairhmm-template-kernel.cc index 44d205869..66dc557aa 100644 --- a/PairHMM_JNI/pairhmm-template-kernel.cc +++ b/PairHMM_JNI/pairhmm-template-kernel.cc @@ -345,33 +345,38 @@ template NUMBER GEN_INTRINSIC(GEN_INTRINSIC(compute_full_prob_,SIM BITMASK_VEC bitMaskVec ; - for (int d=1;d NUMBER GEN_INTRINSIC(GEN_INTRINSIC(compute_full_prob_,SIM // Since there are no shift intrinsics in AVX, keep the masks in 2 SSE vectors BITMASK_VEC bitMaskVec ; - for (int d=1;d;