]> git.ipfire.org Git - thirdparty/linux.git/commitdiff
crypto: arm64/sha3 - Update sha3_ce_transform() to prepare for library
authorEric Biggers <ebiggers@kernel.org>
Sun, 26 Oct 2025 05:50:25 +0000 (22:50 -0700)
committerEric Biggers <ebiggers@kernel.org>
Thu, 6 Nov 2025 04:02:35 +0000 (20:02 -0800)
- Use size_t lengths, to match the library.

- Pass the block size instead of digest size, and add support for the
  block size that SHAKE128 uses.  This allows the code to be used with
  SHAKE128 and SHAKE256, which don't have the concept of a digest size.
  SHAKE256 has the same block size as SHA3-256, but SHAKE128 has a
  unique block size.  Thus, there are now 5 supported block sizes.

Don't bother changing the "glue" code arm64_sha3_update() too much, as
it gets deleted when the SHA-3 code is migrated into lib/crypto/ anyway.

Reviewed-by: Ard Biesheuvel <ardb@kernel.org>
Link: https://lore.kernel.org/r/20251026055032.1413733-9-ebiggers@kernel.org
Signed-off-by: Eric Biggers <ebiggers@kernel.org>
arch/arm64/crypto/sha3-ce-core.S
arch/arm64/crypto/sha3-ce-glue.c

index 9c77313f5a60885231e9374b8853a0a3252d3504..b62bd714839b1edbceaa2cd7570aa3a560846c83 100644 (file)
        .endm
 
        /*
-        * int sha3_ce_transform(u64 *st, const u8 *data, int blocks, int dg_size)
+        * size_t sha3_ce_transform(struct sha3_state *state, const u8 *data,
+        *                          size_t nblocks, size_t block_size)
+        *
+        * block_size is assumed to be one of 72 (SHA3-512), 104 (SHA3-384), 136
+        * (SHA3-256 and SHAKE256), 144 (SHA3-224), or 168 (SHAKE128).
         */
        .text
 SYM_FUNC_START(sha3_ce_transform)
@@ -51,58 +55,55 @@ SYM_FUNC_START(sha3_ce_transform)
        ld1     {v20.1d-v23.1d}, [x8], #32
        ld1     {v24.1d}, [x8]
 
-0:     sub     w2, w2, #1
+0:     sub     x2, x2, #1
        mov     w8, #24
        adr_l   x9, .Lsha3_rcon
 
        /* load input */
        ld1     {v25.8b-v28.8b}, [x1], #32
-       ld1     {v29.8b-v31.8b}, [x1], #24
+       ld1     {v29.8b}, [x1], #8
        eor     v0.8b, v0.8b, v25.8b
        eor     v1.8b, v1.8b, v26.8b
        eor     v2.8b, v2.8b, v27.8b
        eor     v3.8b, v3.8b, v28.8b
        eor     v4.8b, v4.8b, v29.8b
-       eor     v5.8b, v5.8b, v30.8b
-       eor     v6.8b, v6.8b, v31.8b
-
-       tbnz    x3, #6, 2f              // SHA3-512
 
        ld1     {v25.8b-v28.8b}, [x1], #32
-       ld1     {v29.8b-v30.8b}, [x1], #16
-       eor      v7.8b,  v7.8b, v25.8b
-       eor      v8.8b,  v8.8b, v26.8b
-       eor      v9.8b,  v9.8b, v27.8b
-       eor     v10.8b, v10.8b, v28.8b
-       eor     v11.8b, v11.8b, v29.8b
-       eor     v12.8b, v12.8b, v30.8b
+       eor     v5.8b, v5.8b, v25.8b
+       eor     v6.8b, v6.8b, v26.8b
+       eor     v7.8b, v7.8b, v27.8b
+       eor     v8.8b, v8.8b, v28.8b
+       cmp     x3, #72
+       b.eq    3f      /* SHA3-512 (block_size=72)? */
 
-       tbnz    x3, #4, 1f              // SHA3-384 or SHA3-224
+       ld1     {v25.8b-v28.8b}, [x1], #32
+       eor     v9.8b, v9.8b, v25.8b
+       eor     v10.8b, v10.8b, v26.8b
+       eor     v11.8b, v11.8b, v27.8b
+       eor     v12.8b, v12.8b, v28.8b
+       cmp     x3, #104
+       b.eq    3f      /* SHA3-384 (block_size=104)? */
 
-       // SHA3-256
        ld1     {v25.8b-v28.8b}, [x1], #32
        eor     v13.8b, v13.8b, v25.8b
        eor     v14.8b, v14.8b, v26.8b
        eor     v15.8b, v15.8b, v27.8b
        eor     v16.8b, v16.8b, v28.8b
-       b       3f
-
-1:     tbz     x3, #2, 3f              // bit 2 cleared? SHA-384
+       cmp     x3, #144
+       b.lt    3f      /* SHA3-256 or SHAKE256 (block_size=136)? */
+       b.eq    2f      /* SHA3-224 (block_size=144)? */
 
-       // SHA3-224
+       /* SHAKE128 (block_size=168) */
        ld1     {v25.8b-v28.8b}, [x1], #32
-       ld1     {v29.8b}, [x1], #8
-       eor     v13.8b, v13.8b, v25.8b
-       eor     v14.8b, v14.8b, v26.8b
-       eor     v15.8b, v15.8b, v27.8b
-       eor     v16.8b, v16.8b, v28.8b
-       eor     v17.8b, v17.8b, v29.8b
+       eor     v17.8b, v17.8b, v25.8b
+       eor     v18.8b, v18.8b, v26.8b
+       eor     v19.8b, v19.8b, v27.8b
+       eor     v20.8b, v20.8b, v28.8b
        b       3f
-
-       // SHA3-512
-2:     ld1     {v25.8b-v26.8b}, [x1], #16
-       eor      v7.8b,  v7.8b, v25.8b
-       eor      v8.8b,  v8.8b, v26.8b
+2:
+       /* SHA3-224 (block_size=144) */
+       ld1     {v25.8b}, [x1], #8
+       eor     v17.8b, v17.8b, v25.8b
 
 3:     sub     w8, w8, #1
 
@@ -185,7 +186,7 @@ SYM_FUNC_START(sha3_ce_transform)
 
        cbnz    w8, 3b
        cond_yield 4f, x8, x9
-       cbnz    w2, 0b
+       cbnz    x2, 0b
 
        /* save state */
 4:     st1     { v0.1d- v3.1d}, [x0], #32
@@ -195,7 +196,7 @@ SYM_FUNC_START(sha3_ce_transform)
        st1     {v16.1d-v19.1d}, [x0], #32
        st1     {v20.1d-v23.1d}, [x0], #32
        st1     {v24.1d}, [x0]
-       mov     w0, w2
+       mov     x0, x2
        ret
 SYM_FUNC_END(sha3_ce_transform)
 
index f5c83023493373f5e01f6fef055a510e617b7a4f..250f4fb76b4726274fcaf97c90ebfecd099addc5 100644 (file)
@@ -28,18 +28,17 @@ MODULE_ALIAS_CRYPTO("sha3-256");
 MODULE_ALIAS_CRYPTO("sha3-384");
 MODULE_ALIAS_CRYPTO("sha3-512");
 
-asmlinkage int sha3_ce_transform(u64 *st, const u8 *data, int blocks,
-                                int md_len);
+asmlinkage size_t sha3_ce_transform(struct sha3_state *state, const u8 *data,
+                                   size_t nblocks, size_t block_size);
 
 static int arm64_sha3_update(struct shash_desc *desc, const u8 *data,
                             unsigned int len)
 {
        struct sha3_state *sctx = shash_desc_ctx(desc);
        struct crypto_shash *tfm = desc->tfm;
-       unsigned int bs, ds;
+       unsigned int bs;
        int blocks;
 
-       ds = crypto_shash_digestsize(tfm);
        bs = crypto_shash_blocksize(tfm);
        blocks = len / bs;
        len -= blocks * bs;
@@ -47,7 +46,7 @@ static int arm64_sha3_update(struct shash_desc *desc, const u8 *data,
                int rem;
 
                kernel_neon_begin();
-               rem = sha3_ce_transform(sctx->st, data, blocks, ds);
+               rem = sha3_ce_transform(sctx, data, blocks, bs);
                kernel_neon_end();
                data += (blocks - rem) * bs;
                blocks = rem;
@@ -74,7 +73,7 @@ static int sha3_finup(struct shash_desc *desc, const u8 *src, unsigned int len,
        block[bs - 1] |= 0x80;
 
        kernel_neon_begin();
-       sha3_ce_transform(sctx->st, block, 1, ds);
+       sha3_ce_transform(sctx, block, 1, bs);
        kernel_neon_end();
        memzero_explicit(block , sizeof(block));