1 /* ====================================================================
2 * Copyright (c) 2011-2013 The OpenSSL Project. All rights reserved.
4 * Redistribution and use in source and binary forms, with or without
5 * modification, are permitted provided that the following conditions
8 * 1. Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
11 * 2. Redistributions in binary form must reproduce the above copyright
12 * notice, this list of conditions and the following disclaimer in
13 * the documentation and/or other materials provided with the
16 * 3. All advertising materials mentioning features or use of this
17 * software must display the following acknowledgment:
18 * "This product includes software developed by the OpenSSL Project
19 * for use in the OpenSSL Toolkit. (http://www.OpenSSL.org/)"
21 * 4. The names "OpenSSL Toolkit" and "OpenSSL Project" must not be used to
22 * endorse or promote products derived from this software without
23 * prior written permission. For written permission, please contact
24 * licensing@OpenSSL.org.
26 * 5. Products derived from this software may not be called "OpenSSL"
27 * nor may "OpenSSL" appear in their names without prior written
28 * permission of the OpenSSL Project.
30 * 6. Redistributions of any form whatsoever must retain the following
32 * "This product includes software developed by the OpenSSL Project
33 * for use in the OpenSSL Toolkit (http://www.OpenSSL.org/)"
35 * THIS SOFTWARE IS PROVIDED BY THE OpenSSL PROJECT ``AS IS'' AND ANY
36 * EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
37 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
38 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE OpenSSL PROJECT OR
39 * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
40 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
41 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
42 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
43 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
44 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
45 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
46 * OF THE POSSIBILITY OF SUCH DAMAGE.
47 * ====================================================================
50 #include <openssl/opensslconf.h>
55 #if !defined(OPENSSL_NO_AES)
57 # include <openssl/evp.h>
58 # include <openssl/objects.h>
59 # include <openssl/aes.h>
60 # include <openssl/sha.h>
61 # include <openssl/rand.h>
62 # include "modes_lcl.h"
63 # include "internal/evp_int.h"
65 # ifndef EVP_CIPH_FLAG_AEAD_CIPHER
66 # define EVP_CIPH_FLAG_AEAD_CIPHER 0x200000
67 # define EVP_CTRL_AEAD_TLS1_AAD 0x16
68 # define EVP_CTRL_AEAD_SET_MAC_KEY 0x17
71 # if !defined(EVP_CIPH_FLAG_DEFAULT_ASN1)
72 # define EVP_CIPH_FLAG_DEFAULT_ASN1 0
75 # if !defined(EVP_CIPH_FLAG_TLS1_1_MULTIBLOCK)
76 # define EVP_CIPH_FLAG_TLS1_1_MULTIBLOCK 0
79 # define TLS1_1_VERSION 0x0302
83 SHA256_CTX head
, tail
, md
;
84 size_t payload_length
; /* AAD length in decrypt case */
87 unsigned char tls_aad
[16]; /* 13 used */
89 } EVP_AES_HMAC_SHA256
;
91 # define NO_PAYLOAD_LENGTH ((size_t)-1)
93 # if defined(AES_ASM) && ( \
94 defined(__x86_64) || defined(__x86_64__) || \
95 defined(_M_AMD64) || defined(_M_X64) || \
98 extern unsigned int OPENSSL_ia32cap_P
[];
99 # define AESNI_CAPABLE (1<<(57-32))
101 int aesni_set_encrypt_key(const unsigned char *userKey
, int bits
,
103 int aesni_set_decrypt_key(const unsigned char *userKey
, int bits
,
106 void aesni_cbc_encrypt(const unsigned char *in
,
109 const AES_KEY
*key
, unsigned char *ivec
, int enc
);
111 int aesni_cbc_sha256_enc(const void *inp
, void *out
, size_t blocks
,
112 const AES_KEY
*key
, unsigned char iv
[16],
113 SHA256_CTX
*ctx
, const void *in0
);
115 # define data(ctx) ((EVP_AES_HMAC_SHA256 *)EVP_CIPHER_CTX_cipher_data(ctx))
117 static int aesni_cbc_hmac_sha256_init_key(EVP_CIPHER_CTX
*ctx
,
118 const unsigned char *inkey
,
119 const unsigned char *iv
, int enc
)
121 EVP_AES_HMAC_SHA256
*key
= data(ctx
);
125 memset(&key
->ks
, 0, sizeof(key
->ks
.rd_key
)),
126 ret
= aesni_set_encrypt_key(inkey
,
127 EVP_CIPHER_CTX_key_length(ctx
) * 8,
130 ret
= aesni_set_decrypt_key(inkey
,
131 EVP_CIPHER_CTX_key_length(ctx
) * 8,
134 SHA256_Init(&key
->head
); /* handy when benchmarking */
135 key
->tail
= key
->head
;
138 key
->payload_length
= NO_PAYLOAD_LENGTH
;
140 return ret
< 0 ? 0 : 1;
143 # define STITCHED_CALL
145 # if !defined(STITCHED_CALL)
149 void sha256_block_data_order(void *c
, const void *p
, size_t len
);
151 static void sha256_update(SHA256_CTX
*c
, const void *data
, size_t len
)
153 const unsigned char *ptr
= data
;
156 if ((res
= c
->num
)) {
157 res
= SHA256_CBLOCK
- res
;
160 SHA256_Update(c
, ptr
, res
);
165 res
= len
% SHA256_CBLOCK
;
169 sha256_block_data_order(c
, ptr
, len
/ SHA256_CBLOCK
);
174 if (c
->Nl
< (unsigned int)len
)
179 SHA256_Update(c
, ptr
, res
);
182 # ifdef SHA256_Update
183 # undef SHA256_Update
185 # define SHA256_Update sha256_update
187 # if !defined(OPENSSL_NO_MULTIBLOCK) && EVP_CIPH_FLAG_TLS1_1_MULTIBLOCK
190 unsigned int A
[8], B
[8], C
[8], D
[8], E
[8], F
[8], G
[8], H
[8];
193 const unsigned char *ptr
;
197 void sha256_multi_block(SHA256_MB_CTX
*, const HASH_DESC
*, int);
200 const unsigned char *inp
;
206 void aesni_multi_cbc_encrypt(CIPH_DESC
*, void *, int);
208 static size_t tls1_1_multi_block_encrypt(EVP_AES_HMAC_SHA256
*key
,
210 const unsigned char *inp
,
211 size_t inp_len
, int n4x
)
212 { /* n4x is 1 or 2 */
213 HASH_DESC hash_d
[8], edges
[8];
215 unsigned char storage
[sizeof(SHA256_MB_CTX
) + 32];
222 unsigned int frag
, last
, packlen
, i
, x4
= 4 * n4x
, minblocks
, processed
=
230 /* ask for IVs in bulk */
231 if (RAND_bytes((IVs
= blocks
[0].c
), 16 * x4
) <= 0)
235 ctx
= (SHA256_MB_CTX
*) (storage
+ 32 - ((size_t)storage
% 32));
237 frag
= (unsigned int)inp_len
>> (1 + n4x
);
238 last
= (unsigned int)inp_len
+ frag
- (frag
<< (1 + n4x
));
239 if (last
> frag
&& ((last
+ 13 + 9) % 64) < (x4
- 1)) {
244 packlen
= 5 + 16 + ((frag
+ 32 + 16) & -16);
246 /* populate descriptors with pointers and IVs */
249 /* 5+16 is place for header and explicit IV */
250 ciph_d
[0].out
= out
+ 5 + 16;
251 memcpy(ciph_d
[0].out
- 16, IVs
, 16);
252 memcpy(ciph_d
[0].iv
, IVs
, 16);
255 for (i
= 1; i
< x4
; i
++) {
256 ciph_d
[i
].inp
= hash_d
[i
].ptr
= hash_d
[i
- 1].ptr
+ frag
;
257 ciph_d
[i
].out
= ciph_d
[i
- 1].out
+ packlen
;
258 memcpy(ciph_d
[i
].out
- 16, IVs
, 16);
259 memcpy(ciph_d
[i
].iv
, IVs
, 16);
264 memcpy(blocks
[0].c
, key
->md
.data
, 8);
265 seqnum
= BSWAP8(blocks
[0].q
[0]);
267 for (i
= 0; i
< x4
; i
++) {
268 unsigned int len
= (i
== (x4
- 1) ? last
: frag
);
269 # if !defined(BSWAP8)
270 unsigned int carry
, j
;
273 ctx
->A
[i
] = key
->md
.h
[0];
274 ctx
->B
[i
] = key
->md
.h
[1];
275 ctx
->C
[i
] = key
->md
.h
[2];
276 ctx
->D
[i
] = key
->md
.h
[3];
277 ctx
->E
[i
] = key
->md
.h
[4];
278 ctx
->F
[i
] = key
->md
.h
[5];
279 ctx
->G
[i
] = key
->md
.h
[6];
280 ctx
->H
[i
] = key
->md
.h
[7];
284 blocks
[i
].q
[0] = BSWAP8(seqnum
+ i
);
286 for (carry
= i
, j
= 8; j
--;) {
287 blocks
[i
].c
[j
] = ((u8
*)key
->md
.data
)[j
] + carry
;
288 carry
= (blocks
[i
].c
[j
] - carry
) >> (sizeof(carry
) * 8 - 1);
291 blocks
[i
].c
[8] = ((u8
*)key
->md
.data
)[8];
292 blocks
[i
].c
[9] = ((u8
*)key
->md
.data
)[9];
293 blocks
[i
].c
[10] = ((u8
*)key
->md
.data
)[10];
295 blocks
[i
].c
[11] = (u8
)(len
>> 8);
296 blocks
[i
].c
[12] = (u8
)(len
);
298 memcpy(blocks
[i
].c
+ 13, hash_d
[i
].ptr
, 64 - 13);
299 hash_d
[i
].ptr
+= 64 - 13;
300 hash_d
[i
].blocks
= (len
- (64 - 13)) / 64;
302 edges
[i
].ptr
= blocks
[i
].c
;
306 /* hash 13-byte headers and first 64-13 bytes of inputs */
307 sha256_multi_block(ctx
, edges
, n4x
);
308 /* hash bulk inputs */
309 # define MAXCHUNKSIZE 2048
311 # error "MAXCHUNKSIZE is not divisible by 64"
314 * goal is to minimize pressure on L1 cache by moving in shorter steps,
315 * so that hashed data is still in the cache by the time we encrypt it
317 minblocks
= ((frag
<= last
? frag
: last
) - (64 - 13)) / 64;
318 if (minblocks
> MAXCHUNKSIZE
/ 64) {
319 for (i
= 0; i
< x4
; i
++) {
320 edges
[i
].ptr
= hash_d
[i
].ptr
;
321 edges
[i
].blocks
= MAXCHUNKSIZE
/ 64;
322 ciph_d
[i
].blocks
= MAXCHUNKSIZE
/ 16;
325 sha256_multi_block(ctx
, edges
, n4x
);
326 aesni_multi_cbc_encrypt(ciph_d
, &key
->ks
, n4x
);
328 for (i
= 0; i
< x4
; i
++) {
329 edges
[i
].ptr
= hash_d
[i
].ptr
+= MAXCHUNKSIZE
;
330 hash_d
[i
].blocks
-= MAXCHUNKSIZE
/ 64;
331 edges
[i
].blocks
= MAXCHUNKSIZE
/ 64;
332 ciph_d
[i
].inp
+= MAXCHUNKSIZE
;
333 ciph_d
[i
].out
+= MAXCHUNKSIZE
;
334 ciph_d
[i
].blocks
= MAXCHUNKSIZE
/ 16;
335 memcpy(ciph_d
[i
].iv
, ciph_d
[i
].out
- 16, 16);
337 processed
+= MAXCHUNKSIZE
;
338 minblocks
-= MAXCHUNKSIZE
/ 64;
339 } while (minblocks
> MAXCHUNKSIZE
/ 64);
343 sha256_multi_block(ctx
, hash_d
, n4x
);
345 memset(blocks
, 0, sizeof(blocks
));
346 for (i
= 0; i
< x4
; i
++) {
347 unsigned int len
= (i
== (x4
- 1) ? last
: frag
),
348 off
= hash_d
[i
].blocks
* 64;
349 const unsigned char *ptr
= hash_d
[i
].ptr
+ off
;
351 off
= (len
- processed
) - (64 - 13) - off
; /* remainder actually */
352 memcpy(blocks
[i
].c
, ptr
, off
);
353 blocks
[i
].c
[off
] = 0x80;
354 len
+= 64 + 13; /* 64 is HMAC header */
355 len
*= 8; /* convert to bits */
356 if (off
< (64 - 8)) {
358 blocks
[i
].d
[15] = BSWAP4(len
);
360 PUTU32(blocks
[i
].c
+ 60, len
);
365 blocks
[i
].d
[31] = BSWAP4(len
);
367 PUTU32(blocks
[i
].c
+ 124, len
);
371 edges
[i
].ptr
= blocks
[i
].c
;
374 /* hash input tails and finalize */
375 sha256_multi_block(ctx
, edges
, n4x
);
377 memset(blocks
, 0, sizeof(blocks
));
378 for (i
= 0; i
< x4
; i
++) {
380 blocks
[i
].d
[0] = BSWAP4(ctx
->A
[i
]);
381 ctx
->A
[i
] = key
->tail
.h
[0];
382 blocks
[i
].d
[1] = BSWAP4(ctx
->B
[i
]);
383 ctx
->B
[i
] = key
->tail
.h
[1];
384 blocks
[i
].d
[2] = BSWAP4(ctx
->C
[i
]);
385 ctx
->C
[i
] = key
->tail
.h
[2];
386 blocks
[i
].d
[3] = BSWAP4(ctx
->D
[i
]);
387 ctx
->D
[i
] = key
->tail
.h
[3];
388 blocks
[i
].d
[4] = BSWAP4(ctx
->E
[i
]);
389 ctx
->E
[i
] = key
->tail
.h
[4];
390 blocks
[i
].d
[5] = BSWAP4(ctx
->F
[i
]);
391 ctx
->F
[i
] = key
->tail
.h
[5];
392 blocks
[i
].d
[6] = BSWAP4(ctx
->G
[i
]);
393 ctx
->G
[i
] = key
->tail
.h
[6];
394 blocks
[i
].d
[7] = BSWAP4(ctx
->H
[i
]);
395 ctx
->H
[i
] = key
->tail
.h
[7];
396 blocks
[i
].c
[32] = 0x80;
397 blocks
[i
].d
[15] = BSWAP4((64 + 32) * 8);
399 PUTU32(blocks
[i
].c
+ 0, ctx
->A
[i
]);
400 ctx
->A
[i
] = key
->tail
.h
[0];
401 PUTU32(blocks
[i
].c
+ 4, ctx
->B
[i
]);
402 ctx
->B
[i
] = key
->tail
.h
[1];
403 PUTU32(blocks
[i
].c
+ 8, ctx
->C
[i
]);
404 ctx
->C
[i
] = key
->tail
.h
[2];
405 PUTU32(blocks
[i
].c
+ 12, ctx
->D
[i
]);
406 ctx
->D
[i
] = key
->tail
.h
[3];
407 PUTU32(blocks
[i
].c
+ 16, ctx
->E
[i
]);
408 ctx
->E
[i
] = key
->tail
.h
[4];
409 PUTU32(blocks
[i
].c
+ 20, ctx
->F
[i
]);
410 ctx
->F
[i
] = key
->tail
.h
[5];
411 PUTU32(blocks
[i
].c
+ 24, ctx
->G
[i
]);
412 ctx
->G
[i
] = key
->tail
.h
[6];
413 PUTU32(blocks
[i
].c
+ 28, ctx
->H
[i
]);
414 ctx
->H
[i
] = key
->tail
.h
[7];
415 blocks
[i
].c
[32] = 0x80;
416 PUTU32(blocks
[i
].c
+ 60, (64 + 32) * 8);
418 edges
[i
].ptr
= blocks
[i
].c
;
423 sha256_multi_block(ctx
, edges
, n4x
);
425 for (i
= 0; i
< x4
; i
++) {
426 unsigned int len
= (i
== (x4
- 1) ? last
: frag
), pad
, j
;
427 unsigned char *out0
= out
;
429 memcpy(ciph_d
[i
].out
, ciph_d
[i
].inp
, len
- processed
);
430 ciph_d
[i
].inp
= ciph_d
[i
].out
;
435 PUTU32(out
+ 0, ctx
->A
[i
]);
436 PUTU32(out
+ 4, ctx
->B
[i
]);
437 PUTU32(out
+ 8, ctx
->C
[i
]);
438 PUTU32(out
+ 12, ctx
->D
[i
]);
439 PUTU32(out
+ 16, ctx
->E
[i
]);
440 PUTU32(out
+ 20, ctx
->F
[i
]);
441 PUTU32(out
+ 24, ctx
->G
[i
]);
442 PUTU32(out
+ 28, ctx
->H
[i
]);
448 for (j
= 0; j
<= pad
; j
++)
452 ciph_d
[i
].blocks
= (len
- processed
) / 16;
453 len
+= 16; /* account for explicit iv */
456 out0
[0] = ((u8
*)key
->md
.data
)[8];
457 out0
[1] = ((u8
*)key
->md
.data
)[9];
458 out0
[2] = ((u8
*)key
->md
.data
)[10];
459 out0
[3] = (u8
)(len
>> 8);
466 aesni_multi_cbc_encrypt(ciph_d
, &key
->ks
, n4x
);
468 OPENSSL_cleanse(blocks
, sizeof(blocks
));
469 OPENSSL_cleanse(ctx
, sizeof(*ctx
));
475 static int aesni_cbc_hmac_sha256_cipher(EVP_CIPHER_CTX
*ctx
,
477 const unsigned char *in
, size_t len
)
479 EVP_AES_HMAC_SHA256
*key
= data(ctx
);
481 size_t plen
= key
->payload_length
, iv
= 0, /* explicit IV in TLS 1.1 and
484 # if defined(STITCHED_CALL)
485 size_t aes_off
= 0, blocks
;
487 sha_off
= SHA256_CBLOCK
- key
->md
.num
;
490 key
->payload_length
= NO_PAYLOAD_LENGTH
;
492 if (len
% AES_BLOCK_SIZE
)
495 if (EVP_CIPHER_CTX_encrypting(ctx
)) {
496 if (plen
== NO_PAYLOAD_LENGTH
)
499 ((plen
+ SHA256_DIGEST_LENGTH
+
500 AES_BLOCK_SIZE
) & -AES_BLOCK_SIZE
))
502 else if (key
->aux
.tls_ver
>= TLS1_1_VERSION
)
505 # if defined(STITCHED_CALL)
507 * The assembly stitch handles AVX-capable processors, but its
508 * performance is not optimal on AMD Jaguar (~40% worse) for
509 * unknown reasons. Incidentally, the processor in question supports
510 * AVX but not the AMD-specific XOP extension, which can be used
511 * to identify it and avoid stitch invocation. So, once we
512 * establish that the current CPU supports AVX, we also check that it is
513 * either an XOP-capable Bulldozer-based or a GenuineIntel one.
515 if (OPENSSL_ia32cap_P
[1] & (1 << (60 - 32)) && /* AVX? */
516 ((OPENSSL_ia32cap_P
[1] & (1 << (43 - 32))) /* XOP? */
517 | (OPENSSL_ia32cap_P
[0] & (1<<30))) && /* "Intel CPU"? */
518 plen
> (sha_off
+ iv
) &&
519 (blocks
= (plen
- (sha_off
+ iv
)) / SHA256_CBLOCK
)) {
520 SHA256_Update(&key
->md
, in
+ iv
, sha_off
);
522 (void)aesni_cbc_sha256_enc(in
, out
, blocks
, &key
->ks
,
523 EVP_CIPHER_CTX_iv_noconst(ctx
),
524 &key
->md
, in
+ iv
+ sha_off
);
525 blocks
*= SHA256_CBLOCK
;
528 key
->md
.Nh
+= blocks
>> 29;
529 key
->md
.Nl
+= blocks
<<= 3;
530 if (key
->md
.Nl
< (unsigned int)blocks
)
537 SHA256_Update(&key
->md
, in
+ sha_off
, plen
- sha_off
);
539 if (plen
!= len
) { /* "TLS" mode of operation */
541 memcpy(out
+ aes_off
, in
+ aes_off
, plen
- aes_off
);
543 /* calculate HMAC and append it to payload */
544 SHA256_Final(out
+ plen
, &key
->md
);
546 SHA256_Update(&key
->md
, out
+ plen
, SHA256_DIGEST_LENGTH
);
547 SHA256_Final(out
+ plen
, &key
->md
);
549 /* pad the payload|hmac */
550 plen
+= SHA256_DIGEST_LENGTH
;
551 for (l
= len
- plen
- 1; plen
< len
; plen
++)
553 /* encrypt HMAC|padding at once */
554 aesni_cbc_encrypt(out
+ aes_off
, out
+ aes_off
, len
- aes_off
,
555 &key
->ks
, EVP_CIPHER_CTX_iv_noconst(ctx
), 1);
557 aesni_cbc_encrypt(in
+ aes_off
, out
+ aes_off
, len
- aes_off
,
558 &key
->ks
, EVP_CIPHER_CTX_iv_noconst(ctx
), 1);
562 unsigned int u
[SHA256_DIGEST_LENGTH
/ sizeof(unsigned int)];
563 unsigned char c
[64 + SHA256_DIGEST_LENGTH
];
566 /* arrange cache line alignment */
567 pmac
= (void *)(((size_t)mac
.c
+ 63) & ((size_t)0 - 64));
569 /* decrypt HMAC|padding at once */
570 aesni_cbc_encrypt(in
, out
, len
, &key
->ks
,
571 EVP_CIPHER_CTX_iv_noconst(ctx
), 0);
573 if (plen
!= NO_PAYLOAD_LENGTH
) { /* "TLS" mode of operation */
574 size_t inp_len
, mask
, j
, i
;
575 unsigned int res
, maxpad
, pad
, bitlen
;
578 unsigned int u
[SHA_LBLOCK
];
579 unsigned char c
[SHA256_CBLOCK
];
580 } *data
= (void *)key
->md
.data
;
582 if ((key
->aux
.tls_aad
[plen
- 4] << 8 | key
->aux
.tls_aad
[plen
- 3])
586 if (len
< (iv
+ SHA256_DIGEST_LENGTH
+ 1))
589 /* omit explicit iv */
593 /* figure out payload length */
595 maxpad
= len
- (SHA256_DIGEST_LENGTH
+ 1);
596 maxpad
|= (255 - maxpad
) >> (sizeof(maxpad
) * 8 - 8);
599 inp_len
= len
- (SHA256_DIGEST_LENGTH
+ pad
+ 1);
600 mask
= (0 - ((inp_len
- len
) >> (sizeof(inp_len
) * 8 - 1)));
604 key
->aux
.tls_aad
[plen
- 2] = inp_len
>> 8;
605 key
->aux
.tls_aad
[plen
- 1] = inp_len
;
609 SHA256_Update(&key
->md
, key
->aux
.tls_aad
, plen
);
612 len
-= SHA256_DIGEST_LENGTH
; /* amend mac */
613 if (len
>= (256 + SHA256_CBLOCK
)) {
614 j
= (len
- (256 + SHA256_CBLOCK
)) & (0 - SHA256_CBLOCK
);
615 j
+= SHA256_CBLOCK
- key
->md
.num
;
616 SHA256_Update(&key
->md
, out
, j
);
622 /* but pretend as if we hashed padded payload */
623 bitlen
= key
->md
.Nl
+ (inp_len
<< 3); /* at most 18 bits */
625 bitlen
= BSWAP4(bitlen
);
628 mac
.c
[1] = (unsigned char)(bitlen
>> 16);
629 mac
.c
[2] = (unsigned char)(bitlen
>> 8);
630 mac
.c
[3] = (unsigned char)bitlen
;
643 for (res
= key
->md
.num
, j
= 0; j
< len
; j
++) {
645 mask
= (j
- inp_len
) >> (sizeof(j
) * 8 - 8);
647 c
|= 0x80 & ~mask
& ~((inp_len
- j
) >> (sizeof(j
) * 8 - 8));
648 data
->c
[res
++] = (unsigned char)c
;
650 if (res
!= SHA256_CBLOCK
)
653 /* j is not incremented yet */
654 mask
= 0 - ((inp_len
+ 7 - j
) >> (sizeof(j
) * 8 - 1));
655 data
->u
[SHA_LBLOCK
- 1] |= bitlen
& mask
;
656 sha256_block_data_order(&key
->md
, data
, 1);
657 mask
&= 0 - ((j
- inp_len
- 72) >> (sizeof(j
) * 8 - 1));
658 pmac
->u
[0] |= key
->md
.h
[0] & mask
;
659 pmac
->u
[1] |= key
->md
.h
[1] & mask
;
660 pmac
->u
[2] |= key
->md
.h
[2] & mask
;
661 pmac
->u
[3] |= key
->md
.h
[3] & mask
;
662 pmac
->u
[4] |= key
->md
.h
[4] & mask
;
663 pmac
->u
[5] |= key
->md
.h
[5] & mask
;
664 pmac
->u
[6] |= key
->md
.h
[6] & mask
;
665 pmac
->u
[7] |= key
->md
.h
[7] & mask
;
669 for (i
= res
; i
< SHA256_CBLOCK
; i
++, j
++)
672 if (res
> SHA256_CBLOCK
- 8) {
673 mask
= 0 - ((inp_len
+ 8 - j
) >> (sizeof(j
) * 8 - 1));
674 data
->u
[SHA_LBLOCK
- 1] |= bitlen
& mask
;
675 sha256_block_data_order(&key
->md
, data
, 1);
676 mask
&= 0 - ((j
- inp_len
- 73) >> (sizeof(j
) * 8 - 1));
677 pmac
->u
[0] |= key
->md
.h
[0] & mask
;
678 pmac
->u
[1] |= key
->md
.h
[1] & mask
;
679 pmac
->u
[2] |= key
->md
.h
[2] & mask
;
680 pmac
->u
[3] |= key
->md
.h
[3] & mask
;
681 pmac
->u
[4] |= key
->md
.h
[4] & mask
;
682 pmac
->u
[5] |= key
->md
.h
[5] & mask
;
683 pmac
->u
[6] |= key
->md
.h
[6] & mask
;
684 pmac
->u
[7] |= key
->md
.h
[7] & mask
;
686 memset(data
, 0, SHA256_CBLOCK
);
689 data
->u
[SHA_LBLOCK
- 1] = bitlen
;
690 sha256_block_data_order(&key
->md
, data
, 1);
691 mask
= 0 - ((j
- inp_len
- 73) >> (sizeof(j
) * 8 - 1));
692 pmac
->u
[0] |= key
->md
.h
[0] & mask
;
693 pmac
->u
[1] |= key
->md
.h
[1] & mask
;
694 pmac
->u
[2] |= key
->md
.h
[2] & mask
;
695 pmac
->u
[3] |= key
->md
.h
[3] & mask
;
696 pmac
->u
[4] |= key
->md
.h
[4] & mask
;
697 pmac
->u
[5] |= key
->md
.h
[5] & mask
;
698 pmac
->u
[6] |= key
->md
.h
[6] & mask
;
699 pmac
->u
[7] |= key
->md
.h
[7] & mask
;
702 pmac
->u
[0] = BSWAP4(pmac
->u
[0]);
703 pmac
->u
[1] = BSWAP4(pmac
->u
[1]);
704 pmac
->u
[2] = BSWAP4(pmac
->u
[2]);
705 pmac
->u
[3] = BSWAP4(pmac
->u
[3]);
706 pmac
->u
[4] = BSWAP4(pmac
->u
[4]);
707 pmac
->u
[5] = BSWAP4(pmac
->u
[5]);
708 pmac
->u
[6] = BSWAP4(pmac
->u
[6]);
709 pmac
->u
[7] = BSWAP4(pmac
->u
[7]);
711 for (i
= 0; i
< 8; i
++) {
713 pmac
->c
[4 * i
+ 0] = (unsigned char)(res
>> 24);
714 pmac
->c
[4 * i
+ 1] = (unsigned char)(res
>> 16);
715 pmac
->c
[4 * i
+ 2] = (unsigned char)(res
>> 8);
716 pmac
->c
[4 * i
+ 3] = (unsigned char)res
;
719 len
+= SHA256_DIGEST_LENGTH
;
721 SHA256_Update(&key
->md
, out
, inp_len
);
723 SHA256_Final(pmac
->c
, &key
->md
);
726 unsigned int inp_blocks
, pad_blocks
;
728 /* but pretend as if we hashed padded payload */
730 1 + ((SHA256_CBLOCK
- 9 - res
) >> (sizeof(res
) * 8 - 1));
731 res
+= (unsigned int)(len
- inp_len
);
732 pad_blocks
= res
/ SHA256_CBLOCK
;
733 res
%= SHA256_CBLOCK
;
735 1 + ((SHA256_CBLOCK
- 9 - res
) >> (sizeof(res
) * 8 - 1));
736 for (; inp_blocks
< pad_blocks
; inp_blocks
++)
737 sha1_block_data_order(&key
->md
, data
, 1);
741 SHA256_Update(&key
->md
, pmac
->c
, SHA256_DIGEST_LENGTH
);
742 SHA256_Final(pmac
->c
, &key
->md
);
750 out
+ len
- 1 - maxpad
- SHA256_DIGEST_LENGTH
;
751 size_t off
= out
- p
;
752 unsigned int c
, cmask
;
754 maxpad
+= SHA256_DIGEST_LENGTH
;
755 for (res
= 0, i
= 0, j
= 0; j
< maxpad
; j
++) {
758 ((int)(j
- off
- SHA256_DIGEST_LENGTH
)) >>
759 (sizeof(int) * 8 - 1);
760 res
|= (c
^ pad
) & ~cmask
; /* ... and padding */
761 cmask
&= ((int)(off
- 1 - j
)) >> (sizeof(int) * 8 - 1);
762 res
|= (c
^ pmac
->c
[i
]) & cmask
;
765 maxpad
-= SHA256_DIGEST_LENGTH
;
767 res
= 0 - ((0 - res
) >> (sizeof(res
) * 8 - 1));
771 for (res
= 0, i
= 0; i
< SHA256_DIGEST_LENGTH
; i
++)
772 res
|= out
[i
] ^ pmac
->c
[i
];
773 res
= 0 - ((0 - res
) >> (sizeof(res
) * 8 - 1));
777 pad
= (pad
& ~res
) | (maxpad
& res
);
778 out
= out
+ len
- 1 - pad
;
779 for (res
= 0, i
= 0; i
< pad
; i
++)
782 res
= (0 - res
) >> (sizeof(res
) * 8 - 1);
787 SHA256_Update(&key
->md
, out
, len
);
794 static int aesni_cbc_hmac_sha256_ctrl(EVP_CIPHER_CTX
*ctx
, int type
, int arg
,
797 EVP_AES_HMAC_SHA256
*key
= data(ctx
);
798 unsigned int u_arg
= (unsigned int)arg
;
801 case EVP_CTRL_AEAD_SET_MAC_KEY
:
804 unsigned char hmac_key
[64];
806 memset(hmac_key
, 0, sizeof(hmac_key
));
811 if (u_arg
> sizeof(hmac_key
)) {
812 SHA256_Init(&key
->head
);
813 SHA256_Update(&key
->head
, ptr
, arg
);
814 SHA256_Final(hmac_key
, &key
->head
);
816 memcpy(hmac_key
, ptr
, arg
);
819 for (i
= 0; i
< sizeof(hmac_key
); i
++)
820 hmac_key
[i
] ^= 0x36; /* ipad */
821 SHA256_Init(&key
->head
);
822 SHA256_Update(&key
->head
, hmac_key
, sizeof(hmac_key
));
824 for (i
= 0; i
< sizeof(hmac_key
); i
++)
825 hmac_key
[i
] ^= 0x36 ^ 0x5c; /* opad */
826 SHA256_Init(&key
->tail
);
827 SHA256_Update(&key
->tail
, hmac_key
, sizeof(hmac_key
));
829 OPENSSL_cleanse(hmac_key
, sizeof(hmac_key
));
833 case EVP_CTRL_AEAD_TLS1_AAD
:
835 unsigned char *p
= ptr
;
836 unsigned int len
= p
[arg
- 2] << 8 | p
[arg
- 1];
838 if (arg
!= EVP_AEAD_TLS1_AAD_LEN
)
841 if (EVP_CIPHER_CTX_encrypting(ctx
)) {
842 key
->payload_length
= len
;
843 if ((key
->aux
.tls_ver
=
844 p
[arg
- 4] << 8 | p
[arg
- 3]) >= TLS1_1_VERSION
) {
845 len
-= AES_BLOCK_SIZE
;
846 p
[arg
- 2] = len
>> 8;
850 SHA256_Update(&key
->md
, p
, arg
);
852 return (int)(((len
+ SHA256_DIGEST_LENGTH
+
853 AES_BLOCK_SIZE
) & -AES_BLOCK_SIZE
)
856 memcpy(key
->aux
.tls_aad
, ptr
, arg
);
857 key
->payload_length
= arg
;
859 return SHA256_DIGEST_LENGTH
;
862 # if !defined(OPENSSL_NO_MULTIBLOCK) && EVP_CIPH_FLAG_TLS1_1_MULTIBLOCK
863 case EVP_CTRL_TLS1_1_MULTIBLOCK_MAX_BUFSIZE
:
864 return (int)(5 + 16 + ((arg
+ 32 + 16) & -16));
865 case EVP_CTRL_TLS1_1_MULTIBLOCK_AAD
:
867 EVP_CTRL_TLS1_1_MULTIBLOCK_PARAM
*param
=
868 (EVP_CTRL_TLS1_1_MULTIBLOCK_PARAM
*) ptr
;
869 unsigned int n4x
= 1, x4
;
870 unsigned int frag
, last
, packlen
, inp_len
;
875 if (u_arg
< sizeof(EVP_CTRL_TLS1_1_MULTIBLOCK_PARAM
))
878 inp_len
= param
->inp
[11] << 8 | param
->inp
[12];
880 if (EVP_CIPHER_CTX_encrypting(ctx
)) {
881 if ((param
->inp
[9] << 8 | param
->inp
[10]) < TLS1_1_VERSION
)
886 return 0; /* too short */
888 if (inp_len
>= 8192 && OPENSSL_ia32cap_P
[2] & (1 << 5))
890 } else if ((n4x
= param
->interleave
/ 4) && n4x
<= 2)
891 inp_len
= param
->len
;
896 SHA256_Update(&key
->md
, param
->inp
, 13);
901 frag
= inp_len
>> n4x
;
902 last
= inp_len
+ frag
- (frag
<< n4x
);
903 if (last
> frag
&& ((last
+ 13 + 9) % 64 < (x4
- 1))) {
908 packlen
= 5 + 16 + ((frag
+ 32 + 16) & -16);
909 packlen
= (packlen
<< n4x
) - packlen
;
910 packlen
+= 5 + 16 + ((last
+ 32 + 16) & -16);
912 param
->interleave
= x4
;
916 return -1; /* not yet */
918 case EVP_CTRL_TLS1_1_MULTIBLOCK_ENCRYPT
:
920 EVP_CTRL_TLS1_1_MULTIBLOCK_PARAM
*param
=
921 (EVP_CTRL_TLS1_1_MULTIBLOCK_PARAM
*) ptr
;
923 return (int)tls1_1_multi_block_encrypt(key
, param
->out
,
924 param
->inp
, param
->len
,
925 param
->interleave
/ 4);
927 case EVP_CTRL_TLS1_1_MULTIBLOCK_DECRYPT
:
934 static EVP_CIPHER aesni_128_cbc_hmac_sha256_cipher
= {
935 # ifdef NID_aes_128_cbc_hmac_sha256
936 NID_aes_128_cbc_hmac_sha256
,
940 AES_BLOCK_SIZE
, 16, AES_BLOCK_SIZE
,
941 EVP_CIPH_CBC_MODE
| EVP_CIPH_FLAG_DEFAULT_ASN1
|
942 EVP_CIPH_FLAG_AEAD_CIPHER
| EVP_CIPH_FLAG_TLS1_1_MULTIBLOCK
,
943 aesni_cbc_hmac_sha256_init_key
,
944 aesni_cbc_hmac_sha256_cipher
,
946 sizeof(EVP_AES_HMAC_SHA256
),
947 EVP_CIPH_FLAG_DEFAULT_ASN1
? NULL
: EVP_CIPHER_set_asn1_iv
,
948 EVP_CIPH_FLAG_DEFAULT_ASN1
? NULL
: EVP_CIPHER_get_asn1_iv
,
949 aesni_cbc_hmac_sha256_ctrl
,
953 static EVP_CIPHER aesni_256_cbc_hmac_sha256_cipher
= {
954 # ifdef NID_aes_256_cbc_hmac_sha256
955 NID_aes_256_cbc_hmac_sha256
,
959 AES_BLOCK_SIZE
, 32, AES_BLOCK_SIZE
,
960 EVP_CIPH_CBC_MODE
| EVP_CIPH_FLAG_DEFAULT_ASN1
|
961 EVP_CIPH_FLAG_AEAD_CIPHER
| EVP_CIPH_FLAG_TLS1_1_MULTIBLOCK
,
962 aesni_cbc_hmac_sha256_init_key
,
963 aesni_cbc_hmac_sha256_cipher
,
965 sizeof(EVP_AES_HMAC_SHA256
),
966 EVP_CIPH_FLAG_DEFAULT_ASN1
? NULL
: EVP_CIPHER_set_asn1_iv
,
967 EVP_CIPH_FLAG_DEFAULT_ASN1
? NULL
: EVP_CIPHER_get_asn1_iv
,
968 aesni_cbc_hmac_sha256_ctrl
,
972 const EVP_CIPHER
*EVP_aes_128_cbc_hmac_sha256(void)
974 return ((OPENSSL_ia32cap_P
[1] & AESNI_CAPABLE
) &&
975 aesni_cbc_sha256_enc(NULL
, NULL
, 0, NULL
, NULL
, NULL
, NULL
) ?
976 &aesni_128_cbc_hmac_sha256_cipher
: NULL
);
979 const EVP_CIPHER
*EVP_aes_256_cbc_hmac_sha256(void)
981 return ((OPENSSL_ia32cap_P
[1] & AESNI_CAPABLE
) &&
982 aesni_cbc_sha256_enc(NULL
, NULL
, 0, NULL
, NULL
, NULL
, NULL
) ?
983 &aesni_256_cbc_hmac_sha256_cipher
: NULL
);
986 const EVP_CIPHER
*EVP_aes_128_cbc_hmac_sha256(void)
991 const EVP_CIPHER
*EVP_aes_256_cbc_hmac_sha256(void)