From 6755baf940ff7b822d8a500999ef616e1bd08283 Mon Sep 17 00:00:00 2001 From: Yann Collet Date: Fri, 7 May 2021 15:18:16 -0700 Subject: [PATCH] update decoder hot loop alignment This appears to improve decompression speed by a further ~1.2% on average, measured across 10 compilers x 6 scenarios. --- lib/decompress/zstd_decompress_block.c | 2 ++ 1 file changed, 2 insertions(+) diff --git a/lib/decompress/zstd_decompress_block.c b/lib/decompress/zstd_decompress_block.c index 90acc855f..a8ba8d8bb 100644 --- a/lib/decompress/zstd_decompress_block.c +++ b/lib/decompress/zstd_decompress_block.c @@ -1161,6 +1161,8 @@ ZSTD_decompressSequences_body( ZSTD_DCtx* dctx, * * https://gist.github.com/terrelln/9889fc06a423fd5ca6e99351564473f4 */ + __asm__(".p2align 6"); + __asm__("nop"); __asm__(".p2align 5"); __asm__("nop"); __asm__(".p2align 4"); -- 2.47.2