Compare commits

...

2 Commits

Author SHA1 Message Date
zzh 093aeda028 merge 2025-09-18 15:15:30 +08:00
zzh 338c56e6ed 完成avx2的align代码 2025-09-18 15:09:48 +08:00
5 changed files with 9 additions and 8 deletions

View File

@@ -106,7 +106,7 @@ end_loop8:
gmax = imax; te = i;
for (j = 0; LIKELY(j < slen); ++j)
_mm_store_si128(Hmax + j, _mm_load_si128(H1 + j));
-//if (gmax >= endsc) break;
+if (gmax >= endsc) break;
}
S = H1; H1 = H0; H0 = S;

View File

@@ -120,7 +120,7 @@ end_loop16:
gmax = imax; te = i; // te is the end position on the target
for (j = 0; LIKELY(j < slen); ++j) // keep the H1 vector
_mm_store_si128(Hmax + j, _mm_load_si128(H1 + j));
-//if (gmax + q->shift >= 255 || gmax >= endsc) break;
+if (gmax + q->shift >= 255 || gmax >= endsc) break;
}
S = H1; H1 = H0; H0 = S; // swap H0 and H1
}

View File

@@ -21,7 +21,8 @@ extern FILE *ins_f_arr[LIM_TYPE],
*retval_f_arr[LIM_TYPE];
// GLOBAL performance info
-enum {
+enum
+{
G_ALL = 0,
G_EXT_SCALAR,
G_EXT_AVX2_I16,