* additions worthwhile or if it's worth it to just eat the cost of an unaligned
* load. This is a pretty simple test: check whether len is less than 16 plus
* the alignment offset (16 - the remainder) */
- int max_iters = NMAX;
- int rem = (uintptr_t)buf & 15;
- int align_offset = 16 - rem;
- int k = 0;
+ uint32_t max_iters = NMAX;
+ uint32_t rem = (uintptr_t)buf & 15;
+ uint32_t align_offset = 16 - rem;
+ uint32_t k = 0;
if (rem) {
if (len < 16 + align_offset) {
/* Let's eat the cost of this one unaligned load so that
goto unaligned_jmp;
}
- for (int i = 0; i < align_offset; ++i) {
+ for (uint32_t i = 0; i < align_offset; ++i) {
adler += *(buf++);
sum2 += adler;
}
vs2_0 = _mm_setzero_si128();
vs1_0 = vs1;
- k = (len < max_iters ? (int)len : max_iters);
+ k = (len < max_iters ? len : max_iters);
k -= k % 16;
len -= k;