Reviewed-by: Dmitry Belyavskiy <beldmit@gmail.com>
Reviewed-by: Paul Dale <paul.dale@oracle.com>
MergeDate: Fri Feb 13 14:31:43 2026
(Merged from https://github.com/openssl/openssl/pull/29858)
/* Process 96 bytes at a time */
for (; i + 100 <= srclen; i += 96) {
+ _mm_prefetch((const char *)(input + i + 192), _MM_HINT_T0);
/* We shave off 4 bytes from the beginning and the end */
const __m128i lo0 = _mm_loadu_si128((const __m128i *)(input + i + 4 * 3 * 0));
const __m128i hi0 = _mm_loadu_si128((const __m128i *)(input + i + 4 * 3 * 1));