]> git.ipfire.org Git - thirdparty/openssl.git/blob - crypto/sha/sha_locl.h
I implemented this while troubleshooting a performance problem on SPARC Solaris.
[thirdparty/openssl.git] / crypto / sha / sha_locl.h
1 /* crypto/sha/sha_locl.h */
2 /* Copyright (C) 1995-1998 Eric Young (eay@cryptsoft.com)
3 * All rights reserved.
4 *
5 * This package is an SSL implementation written
6 * by Eric Young (eay@cryptsoft.com).
7 * The implementation was written so as to conform with Netscapes SSL.
8 *
9 * This library is free for commercial and non-commercial use as long as
10 * the following conditions are aheared to. The following conditions
11 * apply to all code found in this distribution, be it the RC4, RSA,
12 * lhash, DES, etc., code; not just the SSL code. The SSL documentation
13 * included with this distribution is covered by the same copyright terms
14 * except that the holder is Tim Hudson (tjh@cryptsoft.com).
15 *
16 * Copyright remains Eric Young's, and as such any Copyright notices in
17 * the code are not to be removed.
18 * If this package is used in a product, Eric Young should be given attribution
19 * as the author of the parts of the library used.
20 * This can be in the form of a textual message at program startup or
21 * in documentation (online or textual) provided with the package.
22 *
23 * Redistribution and use in source and binary forms, with or without
24 * modification, are permitted provided that the following conditions
25 * are met:
26 * 1. Redistributions of source code must retain the copyright
27 * notice, this list of conditions and the following disclaimer.
28 * 2. Redistributions in binary form must reproduce the above copyright
29 * notice, this list of conditions and the following disclaimer in the
30 * documentation and/or other materials provided with the distribution.
31 * 3. All advertising materials mentioning features or use of this software
32 * must display the following acknowledgement:
33 * "This product includes cryptographic software written by
34 * Eric Young (eay@cryptsoft.com)"
35 * The word 'cryptographic' can be left out if the rouines from the library
36 * being used are not cryptographic related :-).
37 * 4. If you include any Windows specific code (or a derivative thereof) from
38 * the apps directory (application code) you must include an acknowledgement:
39 * "This product includes software written by Tim Hudson (tjh@cryptsoft.com)"
40 *
41 * THIS SOFTWARE IS PROVIDED BY ERIC YOUNG ``AS IS'' AND
42 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
43 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
44 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
45 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
46 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
47 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
48 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
49 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
50 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
51 * SUCH DAMAGE.
52 *
53 * The licence and distribution terms for any publically available version or
54 * derivative of this code cannot be changed. i.e. this code cannot simply be
55 * copied and put under another distribution licence
56 * [including the GNU Public Licence.]
57 */
58
59 #include <stdlib.h>
60 #include <string.h>
61
62 #include <openssl/opensslconf.h>
63 #include <openssl/sha.h>
64
/* Log2 of the byte size of SHA_LONG; may be predefined by the build. */
#ifndef SHA_LONG_LOG2
#define SHA_LONG_LOG2	2	/* default to 32 bits */
#endif

/*
 * Configuration switch; presumably consumed by md32_common.h (included
 * further down) to select big-endian byte <-> word conversion.
 */
#define DATA_ORDER_IS_BIG_ENDIAN

/* Bind the generic HASH_* type and size names to their SHA counterparts. */
#define HASH_LONG               SHA_LONG
#define HASH_LONG_LOG2          SHA_LONG_LOG2
#define HASH_CTX                SHA_CTX
#define HASH_CBLOCK             SHA_CBLOCK
#define HASH_LBLOCK             SHA_LBLOCK
/*
 * Emit the five chaining words h0..h4 of context (c), in that order,
 * through the byte pointer (s) using HOST_l2c.  HOST_l2c is not defined
 * in this file (it is expected to come from md32_common.h).
 *
 * The temporary carries a deliberately unusual name so that it cannot
 * capture an identifier appearing in the (c) or (s) argument expressions.
 */
#define HASH_MAKE_STRING(c,s)   do {	\
	unsigned long hash_word_;		\
	hash_word_=(c)->h0; HOST_l2c(hash_word_,(s));	\
	hash_word_=(c)->h1; HOST_l2c(hash_word_,(s));	\
	hash_word_=(c)->h2; HOST_l2c(hash_word_,(s));	\
	hash_word_=(c)->h3; HOST_l2c(hash_word_,(s));	\
	hash_word_=(c)->h4; HOST_l2c(hash_word_,(s));	\
	} while (0)
84
85 #if defined(SHA_0)
86
87 # define HASH_UPDATE SHA_Update
88 # define HASH_TRANSFORM SHA_Transform
89 # define HASH_FINAL SHA_Final
90 # define HASH_INIT SHA_Init
91 # define HASH_BLOCK_HOST_ORDER sha_block_host_order
92 # define HASH_BLOCK_DATA_ORDER sha_block_data_order
93 # define Xupdate(a,ix,ia,ib,ic,id) (ix=(a)=(ia^ib^ic^id))
94
95 void sha_block_host_order (SHA_CTX *c, const void *p,int num);
96 void sha_block_data_order (SHA_CTX *c, const void *p,int num);
97
98 #elif defined(SHA_1)
99
100 # define HASH_UPDATE SHA1_Update
101 # define HASH_TRANSFORM SHA1_Transform
102 # define HASH_FINAL SHA1_Final
103 # define HASH_INIT SHA1_Init
104 # define HASH_BLOCK_HOST_ORDER sha1_block_host_order
105 # define HASH_BLOCK_DATA_ORDER sha1_block_data_order
106 # if defined(__MWERKS__) && defined(__MC68K__)
107 /* Metrowerks for Motorola fails otherwise:-( <appro@fy.chalmers.se> */
108 # define Xupdate(a,ix,ia,ib,ic,id) do { (a)=(ia^ib^ic^id); \
109 ix=(a)=ROTATE((a),1); \
110 } while (0)
111 # else
112 # define Xupdate(a,ix,ia,ib,ic,id) ( (a)=(ia^ib^ic^id), \
113 ix=(a)=ROTATE((a),1) \
114 )
115 # endif
116
117 # ifdef SHA1_ASM
118 # if defined(__i386) || defined(__i386__) || defined(_M_IX86) || defined(__INTEL__)
119 # define sha1_block_host_order sha1_block_asm_host_order
120 # define DONT_IMPLEMENT_BLOCK_HOST_ORDER
121 # define sha1_block_data_order sha1_block_asm_data_order
122 # define DONT_IMPLEMENT_BLOCK_DATA_ORDER
123 # define HASH_BLOCK_DATA_ORDER_ALIGNED sha1_block_asm_data_order
124 # endif
125 # endif
126 void sha1_block_host_order (SHA_CTX *c, const void *p,int num);
127 void sha1_block_data_order (SHA_CTX *c, const void *p,int num);
128
129 #else
130 # error "Either SHA_0 or SHA_1 must be defined."
131 #endif
132
133 #include "md32_common.h"
134
/* Initial values loaded into the chaining words h0..h4 by HASH_INIT. */
#define INIT_DATA_h0 0x67452301UL
#define INIT_DATA_h1 0xefcdab89UL
#define INIT_DATA_h2 0x98badcfeUL
#define INIT_DATA_h3 0x10325476UL
#define INIT_DATA_h4 0xc3d2e1f0UL
140
141 int HASH_INIT (SHA_CTX *c)
142 {
143 c->h0=INIT_DATA_h0;
144 c->h1=INIT_DATA_h1;
145 c->h2=INIT_DATA_h2;
146 c->h3=INIT_DATA_h3;
147 c->h4=INIT_DATA_h4;
148 c->Nl=0;
149 c->Nh=0;
150 c->num=0;
151 return 1;
152 }
153
/*
 * Additive round constants; the suffix names the range of rounds whose
 * BODY_* macros use the constant.
 */
#define K_00_19	0x5a827999UL
#define K_20_39 0x6ed9eba1UL
#define K_40_59 0x8f1bbcdcUL
#define K_60_79 0xca62c1d6UL
158
/*
 * Bitwise round functions; the suffix names the rounds they serve.
 *
 * As pointed out by Wei Dai <weidai@eskimo.com>, the straightforward
 *	#define F(x,y,z) (((x) & (y)) | ((~(x)) & (z)))
 * can be simplified to the form used in F_00_19.  Wei attributes these
 * optimisations to Peter Gutmann's SHS code, and he attributes it to
 * Rich Schroeppel.
 * Another tweak, again from Wei Dai, is applied in F_40_59:
 *	(x&a)|(y&a) -> (x|y)&a
 */
#define	F_00_19(b,c,d)	((((c) ^ (d)) & (b)) ^ (d))
#define	F_20_39(b,c,d)	((b) ^ (c) ^ (d))
#define F_40_59(b,c,d)	(((b) & (c)) | (((b)|(c)) & (d)))
#define	F_60_79(b,c,d)	F_20_39(b,c,d)
170
171 #ifndef OPENSSL_SMALL_FOOTPRINT
172
/*
 * Round macros for the fully unrolled block functions.
 *
 * Each macro performs one round: it computes the new working value into
 * (f) from (a),(b),(c),(d),(e) and the schedule word, then rotates (b) left
 * by 30 bits.  The callers permute the argument order from round to round
 * instead of moving values between variables.  The first argument (i) is
 * the round number and is unused; it only labels the call sites.
 *
 * From round 16 on, Xupdate first derives the schedule word from four
 * earlier words (xa..xd) and stores it in the slot being recycled.
 *
 * Every macro is wrapped in do { } while (0) so that it behaves as a single
 * statement; invoke it with a trailing semicolon.
 */
#define BODY_00_15(i,a,b,c,d,e,f,xi)	do {			\
	(f)=xi+(e)+K_00_19+ROTATE((a),5)+F_00_19((b),(c),(d));	\
	(b)=ROTATE((b),30);					\
	} while (0)

#define BODY_16_19(i,a,b,c,d,e,f,xi,xa,xb,xc,xd)	do {	\
	Xupdate(f,xi,xa,xb,xc,xd);				\
	(f)+=(e)+K_00_19+ROTATE((a),5)+F_00_19((b),(c),(d));	\
	(b)=ROTATE((b),30);					\
	} while (0)

#define BODY_20_31(i,a,b,c,d,e,f,xi,xa,xb,xc,xd)	do {	\
	Xupdate(f,xi,xa,xb,xc,xd);				\
	(f)+=(e)+K_20_39+ROTATE((a),5)+F_20_39((b),(c),(d));	\
	(b)=ROTATE((b),30);					\
	} while (0)

#define BODY_32_39(i,a,b,c,d,e,f,xa,xb,xc,xd)	do {		\
	Xupdate(f,xa,xa,xb,xc,xd);				\
	(f)+=(e)+K_20_39+ROTATE((a),5)+F_20_39((b),(c),(d));	\
	(b)=ROTATE((b),30);					\
	} while (0)

#define BODY_40_59(i,a,b,c,d,e,f,xa,xb,xc,xd)	do {		\
	Xupdate(f,xa,xa,xb,xc,xd);				\
	(f)+=(e)+K_40_59+ROTATE((a),5)+F_40_59((b),(c),(d));	\
	(b)=ROTATE((b),30);					\
	} while (0)

#define BODY_60_79(i,a,b,c,d,e,f,xa,xb,xc,xd)	do {		\
	Xupdate(f,xa,xa,xb,xc,xd);				\
	(f)=xa+(e)+K_60_79+ROTATE((a),5)+F_60_79((b),(c),(d));	\
	(b)=ROTATE((b),30);					\
	} while (0)
201
/* Discard any earlier definition of X before redefining it below. */
#ifdef X
#undef X
#endif
#ifndef MD32_XARRAY
  /*
   * Originally X was an array. As it's automatic it's natural
   * to expect a RISC compiler to accommodate at least part of it in
   * the register bank, isn't it? Unfortunately not all compilers
   * "find" this expectation reasonable:-( In order to make such
   * compilers generate better code I replace X[] with a bunch of
   * X0, X1, etc. See the function body below...
   *					<appro@fy.chalmers.se>
   */
# define X(i)	XX##i
#else
  /*
   * However! Some compilers (most notably HP C) get overwhelmed by
   * that many local variables, so we need a way to fall back to
   * the original array behavior.
   */
# define X(i)	XX[i]
#endif
224
225 #ifndef DONT_IMPLEMENT_BLOCK_HOST_ORDER
226 void HASH_BLOCK_HOST_ORDER (SHA_CTX *c, const void *d, int num)
227 {
228 const SHA_LONG *W=d;
229 register unsigned MD32_REG_T A,B,C,D,E,T;
230 #ifndef MD32_XARRAY
231 unsigned MD32_REG_T XX0, XX1, XX2, XX3, XX4, XX5, XX6, XX7,
232 XX8, XX9,XX10,XX11,XX12,XX13,XX14,XX15;
233 #else
234 SHA_LONG XX[16];
235 #endif
236
237 A=c->h0;
238 B=c->h1;
239 C=c->h2;
240 D=c->h3;
241 E=c->h4;
242
243 for (;;)
244 {
245 BODY_00_15( 0,A,B,C,D,E,T,W[ 0]);
246 BODY_00_15( 1,T,A,B,C,D,E,W[ 1]);
247 BODY_00_15( 2,E,T,A,B,C,D,W[ 2]);
248 BODY_00_15( 3,D,E,T,A,B,C,W[ 3]);
249 BODY_00_15( 4,C,D,E,T,A,B,W[ 4]);
250 BODY_00_15( 5,B,C,D,E,T,A,W[ 5]);
251 BODY_00_15( 6,A,B,C,D,E,T,W[ 6]);
252 BODY_00_15( 7,T,A,B,C,D,E,W[ 7]);
253 BODY_00_15( 8,E,T,A,B,C,D,W[ 8]);
254 BODY_00_15( 9,D,E,T,A,B,C,W[ 9]);
255 BODY_00_15(10,C,D,E,T,A,B,W[10]);
256 BODY_00_15(11,B,C,D,E,T,A,W[11]);
257 BODY_00_15(12,A,B,C,D,E,T,W[12]);
258 BODY_00_15(13,T,A,B,C,D,E,W[13]);
259 BODY_00_15(14,E,T,A,B,C,D,W[14]);
260 BODY_00_15(15,D,E,T,A,B,C,W[15]);
261
262 BODY_16_19(16,C,D,E,T,A,B,X( 0),W[ 0],W[ 2],W[ 8],W[13]);
263 BODY_16_19(17,B,C,D,E,T,A,X( 1),W[ 1],W[ 3],W[ 9],W[14]);
264 BODY_16_19(18,A,B,C,D,E,T,X( 2),W[ 2],W[ 4],W[10],W[15]);
265 BODY_16_19(19,T,A,B,C,D,E,X( 3),W[ 3],W[ 5],W[11],X( 0));
266
267 BODY_20_31(20,E,T,A,B,C,D,X( 4),W[ 4],W[ 6],W[12],X( 1));
268 BODY_20_31(21,D,E,T,A,B,C,X( 5),W[ 5],W[ 7],W[13],X( 2));
269 BODY_20_31(22,C,D,E,T,A,B,X( 6),W[ 6],W[ 8],W[14],X( 3));
270 BODY_20_31(23,B,C,D,E,T,A,X( 7),W[ 7],W[ 9],W[15],X( 4));
271 BODY_20_31(24,A,B,C,D,E,T,X( 8),W[ 8],W[10],X( 0),X( 5));
272 BODY_20_31(25,T,A,B,C,D,E,X( 9),W[ 9],W[11],X( 1),X( 6));
273 BODY_20_31(26,E,T,A,B,C,D,X(10),W[10],W[12],X( 2),X( 7));
274 BODY_20_31(27,D,E,T,A,B,C,X(11),W[11],W[13],X( 3),X( 8));
275 BODY_20_31(28,C,D,E,T,A,B,X(12),W[12],W[14],X( 4),X( 9));
276 BODY_20_31(29,B,C,D,E,T,A,X(13),W[13],W[15],X( 5),X(10));
277 BODY_20_31(30,A,B,C,D,E,T,X(14),W[14],X( 0),X( 6),X(11));
278 BODY_20_31(31,T,A,B,C,D,E,X(15),W[15],X( 1),X( 7),X(12));
279
280 BODY_32_39(32,E,T,A,B,C,D,X( 0),X( 2),X( 8),X(13));
281 BODY_32_39(33,D,E,T,A,B,C,X( 1),X( 3),X( 9),X(14));
282 BODY_32_39(34,C,D,E,T,A,B,X( 2),X( 4),X(10),X(15));
283 BODY_32_39(35,B,C,D,E,T,A,X( 3),X( 5),X(11),X( 0));
284 BODY_32_39(36,A,B,C,D,E,T,X( 4),X( 6),X(12),X( 1));
285 BODY_32_39(37,T,A,B,C,D,E,X( 5),X( 7),X(13),X( 2));
286 BODY_32_39(38,E,T,A,B,C,D,X( 6),X( 8),X(14),X( 3));
287 BODY_32_39(39,D,E,T,A,B,C,X( 7),X( 9),X(15),X( 4));
288
289 BODY_40_59(40,C,D,E,T,A,B,X( 8),X(10),X( 0),X( 5));
290 BODY_40_59(41,B,C,D,E,T,A,X( 9),X(11),X( 1),X( 6));
291 BODY_40_59(42,A,B,C,D,E,T,X(10),X(12),X( 2),X( 7));
292 BODY_40_59(43,T,A,B,C,D,E,X(11),X(13),X( 3),X( 8));
293 BODY_40_59(44,E,T,A,B,C,D,X(12),X(14),X( 4),X( 9));
294 BODY_40_59(45,D,E,T,A,B,C,X(13),X(15),X( 5),X(10));
295 BODY_40_59(46,C,D,E,T,A,B,X(14),X( 0),X( 6),X(11));
296 BODY_40_59(47,B,C,D,E,T,A,X(15),X( 1),X( 7),X(12));
297 BODY_40_59(48,A,B,C,D,E,T,X( 0),X( 2),X( 8),X(13));
298 BODY_40_59(49,T,A,B,C,D,E,X( 1),X( 3),X( 9),X(14));
299 BODY_40_59(50,E,T,A,B,C,D,X( 2),X( 4),X(10),X(15));
300 BODY_40_59(51,D,E,T,A,B,C,X( 3),X( 5),X(11),X( 0));
301 BODY_40_59(52,C,D,E,T,A,B,X( 4),X( 6),X(12),X( 1));
302 BODY_40_59(53,B,C,D,E,T,A,X( 5),X( 7),X(13),X( 2));
303 BODY_40_59(54,A,B,C,D,E,T,X( 6),X( 8),X(14),X( 3));
304 BODY_40_59(55,T,A,B,C,D,E,X( 7),X( 9),X(15),X( 4));
305 BODY_40_59(56,E,T,A,B,C,D,X( 8),X(10),X( 0),X( 5));
306 BODY_40_59(57,D,E,T,A,B,C,X( 9),X(11),X( 1),X( 6));
307 BODY_40_59(58,C,D,E,T,A,B,X(10),X(12),X( 2),X( 7));
308 BODY_40_59(59,B,C,D,E,T,A,X(11),X(13),X( 3),X( 8));
309
310 BODY_60_79(60,A,B,C,D,E,T,X(12),X(14),X( 4),X( 9));
311 BODY_60_79(61,T,A,B,C,D,E,X(13),X(15),X( 5),X(10));
312 BODY_60_79(62,E,T,A,B,C,D,X(14),X( 0),X( 6),X(11));
313 BODY_60_79(63,D,E,T,A,B,C,X(15),X( 1),X( 7),X(12));
314 BODY_60_79(64,C,D,E,T,A,B,X( 0),X( 2),X( 8),X(13));
315 BODY_60_79(65,B,C,D,E,T,A,X( 1),X( 3),X( 9),X(14));
316 BODY_60_79(66,A,B,C,D,E,T,X( 2),X( 4),X(10),X(15));
317 BODY_60_79(67,T,A,B,C,D,E,X( 3),X( 5),X(11),X( 0));
318 BODY_60_79(68,E,T,A,B,C,D,X( 4),X( 6),X(12),X( 1));
319 BODY_60_79(69,D,E,T,A,B,C,X( 5),X( 7),X(13),X( 2));
320 BODY_60_79(70,C,D,E,T,A,B,X( 6),X( 8),X(14),X( 3));
321 BODY_60_79(71,B,C,D,E,T,A,X( 7),X( 9),X(15),X( 4));
322 BODY_60_79(72,A,B,C,D,E,T,X( 8),X(10),X( 0),X( 5));
323 BODY_60_79(73,T,A,B,C,D,E,X( 9),X(11),X( 1),X( 6));
324 BODY_60_79(74,E,T,A,B,C,D,X(10),X(12),X( 2),X( 7));
325 BODY_60_79(75,D,E,T,A,B,C,X(11),X(13),X( 3),X( 8));
326 BODY_60_79(76,C,D,E,T,A,B,X(12),X(14),X( 4),X( 9));
327 BODY_60_79(77,B,C,D,E,T,A,X(13),X(15),X( 5),X(10));
328 BODY_60_79(78,A,B,C,D,E,T,X(14),X( 0),X( 6),X(11));
329 BODY_60_79(79,T,A,B,C,D,E,X(15),X( 1),X( 7),X(12));
330
331 c->h0=(c->h0+E)&0xffffffffL;
332 c->h1=(c->h1+T)&0xffffffffL;
333 c->h2=(c->h2+A)&0xffffffffL;
334 c->h3=(c->h3+B)&0xffffffffL;
335 c->h4=(c->h4+C)&0xffffffffL;
336
337 if (--num <= 0) break;
338
339 A=c->h0;
340 B=c->h1;
341 C=c->h2;
342 D=c->h3;
343 E=c->h4;
344
345 W+=SHA_LBLOCK;
346 }
347 }
348 #endif
349
350 #ifndef DONT_IMPLEMENT_BLOCK_DATA_ORDER
351 void HASH_BLOCK_DATA_ORDER (SHA_CTX *c, const void *p, int num)
352 {
353 const unsigned char *data=p;
354 register unsigned MD32_REG_T A,B,C,D,E,T,l;
355 #ifndef MD32_XARRAY
356 unsigned MD32_REG_T XX0, XX1, XX2, XX3, XX4, XX5, XX6, XX7,
357 XX8, XX9,XX10,XX11,XX12,XX13,XX14,XX15;
358 #else
359 SHA_LONG XX[16];
360 #endif
361
362 A=c->h0;
363 B=c->h1;
364 C=c->h2;
365 D=c->h3;
366 E=c->h4;
367
368 for (;;)
369 {
370
371 HOST_c2l(data,l); X( 0)=l; HOST_c2l(data,l); X( 1)=l;
372 BODY_00_15( 0,A,B,C,D,E,T,X( 0)); HOST_c2l(data,l); X( 2)=l;
373 BODY_00_15( 1,T,A,B,C,D,E,X( 1)); HOST_c2l(data,l); X( 3)=l;
374 BODY_00_15( 2,E,T,A,B,C,D,X( 2)); HOST_c2l(data,l); X( 4)=l;
375 BODY_00_15( 3,D,E,T,A,B,C,X( 3)); HOST_c2l(data,l); X( 5)=l;
376 BODY_00_15( 4,C,D,E,T,A,B,X( 4)); HOST_c2l(data,l); X( 6)=l;
377 BODY_00_15( 5,B,C,D,E,T,A,X( 5)); HOST_c2l(data,l); X( 7)=l;
378 BODY_00_15( 6,A,B,C,D,E,T,X( 6)); HOST_c2l(data,l); X( 8)=l;
379 BODY_00_15( 7,T,A,B,C,D,E,X( 7)); HOST_c2l(data,l); X( 9)=l;
380 BODY_00_15( 8,E,T,A,B,C,D,X( 8)); HOST_c2l(data,l); X(10)=l;
381 BODY_00_15( 9,D,E,T,A,B,C,X( 9)); HOST_c2l(data,l); X(11)=l;
382 BODY_00_15(10,C,D,E,T,A,B,X(10)); HOST_c2l(data,l); X(12)=l;
383 BODY_00_15(11,B,C,D,E,T,A,X(11)); HOST_c2l(data,l); X(13)=l;
384 BODY_00_15(12,A,B,C,D,E,T,X(12)); HOST_c2l(data,l); X(14)=l;
385 BODY_00_15(13,T,A,B,C,D,E,X(13)); HOST_c2l(data,l); X(15)=l;
386 BODY_00_15(14,E,T,A,B,C,D,X(14));
387 BODY_00_15(15,D,E,T,A,B,C,X(15));
388
389 BODY_16_19(16,C,D,E,T,A,B,X( 0),X( 0),X( 2),X( 8),X(13));
390 BODY_16_19(17,B,C,D,E,T,A,X( 1),X( 1),X( 3),X( 9),X(14));
391 BODY_16_19(18,A,B,C,D,E,T,X( 2),X( 2),X( 4),X(10),X(15));
392 BODY_16_19(19,T,A,B,C,D,E,X( 3),X( 3),X( 5),X(11),X( 0));
393
394 BODY_20_31(20,E,T,A,B,C,D,X( 4),X( 4),X( 6),X(12),X( 1));
395 BODY_20_31(21,D,E,T,A,B,C,X( 5),X( 5),X( 7),X(13),X( 2));
396 BODY_20_31(22,C,D,E,T,A,B,X( 6),X( 6),X( 8),X(14),X( 3));
397 BODY_20_31(23,B,C,D,E,T,A,X( 7),X( 7),X( 9),X(15),X( 4));
398 BODY_20_31(24,A,B,C,D,E,T,X( 8),X( 8),X(10),X( 0),X( 5));
399 BODY_20_31(25,T,A,B,C,D,E,X( 9),X( 9),X(11),X( 1),X( 6));
400 BODY_20_31(26,E,T,A,B,C,D,X(10),X(10),X(12),X( 2),X( 7));
401 BODY_20_31(27,D,E,T,A,B,C,X(11),X(11),X(13),X( 3),X( 8));
402 BODY_20_31(28,C,D,E,T,A,B,X(12),X(12),X(14),X( 4),X( 9));
403 BODY_20_31(29,B,C,D,E,T,A,X(13),X(13),X(15),X( 5),X(10));
404 BODY_20_31(30,A,B,C,D,E,T,X(14),X(14),X( 0),X( 6),X(11));
405 BODY_20_31(31,T,A,B,C,D,E,X(15),X(15),X( 1),X( 7),X(12));
406
407 BODY_32_39(32,E,T,A,B,C,D,X( 0),X( 2),X( 8),X(13));
408 BODY_32_39(33,D,E,T,A,B,C,X( 1),X( 3),X( 9),X(14));
409 BODY_32_39(34,C,D,E,T,A,B,X( 2),X( 4),X(10),X(15));
410 BODY_32_39(35,B,C,D,E,T,A,X( 3),X( 5),X(11),X( 0));
411 BODY_32_39(36,A,B,C,D,E,T,X( 4),X( 6),X(12),X( 1));
412 BODY_32_39(37,T,A,B,C,D,E,X( 5),X( 7),X(13),X( 2));
413 BODY_32_39(38,E,T,A,B,C,D,X( 6),X( 8),X(14),X( 3));
414 BODY_32_39(39,D,E,T,A,B,C,X( 7),X( 9),X(15),X( 4));
415
416 BODY_40_59(40,C,D,E,T,A,B,X( 8),X(10),X( 0),X( 5));
417 BODY_40_59(41,B,C,D,E,T,A,X( 9),X(11),X( 1),X( 6));
418 BODY_40_59(42,A,B,C,D,E,T,X(10),X(12),X( 2),X( 7));
419 BODY_40_59(43,T,A,B,C,D,E,X(11),X(13),X( 3),X( 8));
420 BODY_40_59(44,E,T,A,B,C,D,X(12),X(14),X( 4),X( 9));
421 BODY_40_59(45,D,E,T,A,B,C,X(13),X(15),X( 5),X(10));
422 BODY_40_59(46,C,D,E,T,A,B,X(14),X( 0),X( 6),X(11));
423 BODY_40_59(47,B,C,D,E,T,A,X(15),X( 1),X( 7),X(12));
424 BODY_40_59(48,A,B,C,D,E,T,X( 0),X( 2),X( 8),X(13));
425 BODY_40_59(49,T,A,B,C,D,E,X( 1),X( 3),X( 9),X(14));
426 BODY_40_59(50,E,T,A,B,C,D,X( 2),X( 4),X(10),X(15));
427 BODY_40_59(51,D,E,T,A,B,C,X( 3),X( 5),X(11),X( 0));
428 BODY_40_59(52,C,D,E,T,A,B,X( 4),X( 6),X(12),X( 1));
429 BODY_40_59(53,B,C,D,E,T,A,X( 5),X( 7),X(13),X( 2));
430 BODY_40_59(54,A,B,C,D,E,T,X( 6),X( 8),X(14),X( 3));
431 BODY_40_59(55,T,A,B,C,D,E,X( 7),X( 9),X(15),X( 4));
432 BODY_40_59(56,E,T,A,B,C,D,X( 8),X(10),X( 0),X( 5));
433 BODY_40_59(57,D,E,T,A,B,C,X( 9),X(11),X( 1),X( 6));
434 BODY_40_59(58,C,D,E,T,A,B,X(10),X(12),X( 2),X( 7));
435 BODY_40_59(59,B,C,D,E,T,A,X(11),X(13),X( 3),X( 8));
436
437 BODY_60_79(60,A,B,C,D,E,T,X(12),X(14),X( 4),X( 9));
438 BODY_60_79(61,T,A,B,C,D,E,X(13),X(15),X( 5),X(10));
439 BODY_60_79(62,E,T,A,B,C,D,X(14),X( 0),X( 6),X(11));
440 BODY_60_79(63,D,E,T,A,B,C,X(15),X( 1),X( 7),X(12));
441 BODY_60_79(64,C,D,E,T,A,B,X( 0),X( 2),X( 8),X(13));
442 BODY_60_79(65,B,C,D,E,T,A,X( 1),X( 3),X( 9),X(14));
443 BODY_60_79(66,A,B,C,D,E,T,X( 2),X( 4),X(10),X(15));
444 BODY_60_79(67,T,A,B,C,D,E,X( 3),X( 5),X(11),X( 0));
445 BODY_60_79(68,E,T,A,B,C,D,X( 4),X( 6),X(12),X( 1));
446 BODY_60_79(69,D,E,T,A,B,C,X( 5),X( 7),X(13),X( 2));
447 BODY_60_79(70,C,D,E,T,A,B,X( 6),X( 8),X(14),X( 3));
448 BODY_60_79(71,B,C,D,E,T,A,X( 7),X( 9),X(15),X( 4));
449 BODY_60_79(72,A,B,C,D,E,T,X( 8),X(10),X( 0),X( 5));
450 BODY_60_79(73,T,A,B,C,D,E,X( 9),X(11),X( 1),X( 6));
451 BODY_60_79(74,E,T,A,B,C,D,X(10),X(12),X( 2),X( 7));
452 BODY_60_79(75,D,E,T,A,B,C,X(11),X(13),X( 3),X( 8));
453 BODY_60_79(76,C,D,E,T,A,B,X(12),X(14),X( 4),X( 9));
454 BODY_60_79(77,B,C,D,E,T,A,X(13),X(15),X( 5),X(10));
455 BODY_60_79(78,A,B,C,D,E,T,X(14),X( 0),X( 6),X(11));
456 BODY_60_79(79,T,A,B,C,D,E,X(15),X( 1),X( 7),X(12));
457
458 c->h0=(c->h0+E)&0xffffffffL;
459 c->h1=(c->h1+T)&0xffffffffL;
460 c->h2=(c->h2+A)&0xffffffffL;
461 c->h3=(c->h3+B)&0xffffffffL;
462 c->h4=(c->h4+C)&0xffffffffL;
463
464 if (--num <= 0) break;
465
466 A=c->h0;
467 B=c->h1;
468 C=c->h2;
469 D=c->h3;
470 E=c->h4;
471
472 }
473 }
474 #endif
475
476 #else /* OPENSSL_SMALL_FOOTPRINT */
477
/*
 * Round macros for the compact (OPENSSL_SMALL_FOOTPRINT) block functions.
 *
 * Unlike the unrolled variants these operate directly on the caller's
 * local variables A,B,C,D,E,T, which must be in scope, and they shift the
 * working state down by one position on every round.  From round 16 on,
 * Xupdate first recomputes the schedule word in place in (xa), which must
 * therefore be an lvalue.
 *
 * The schedule-word argument is parenthesized where it enters the final
 * sum so that any expression may be passed.
 */
#define BODY_00_15(xi)		 do {	\
	T=E+K_00_19+F_00_19(B,C,D);	\
	E=D, D=C, C=ROTATE(B,30), B=A;	\
	A=ROTATE(A,5)+T+(xi);	    } while(0)

#define BODY_16_19(xa,xb,xc,xd)	 do {	\
	Xupdate(T,xa,xa,xb,xc,xd);	\
	T+=E+K_00_19+F_00_19(B,C,D);	\
	E=D, D=C, C=ROTATE(B,30), B=A;	\
	A=ROTATE(A,5)+T;	    } while(0)

#define BODY_20_39(xa,xb,xc,xd)	 do {	\
	Xupdate(T,xa,xa,xb,xc,xd);	\
	T+=E+K_20_39+F_20_39(B,C,D);	\
	E=D, D=C, C=ROTATE(B,30), B=A;	\
	A=ROTATE(A,5)+T;	    } while(0)

#define BODY_40_59(xa,xb,xc,xd)	 do {	\
	Xupdate(T,xa,xa,xb,xc,xd);	\
	T+=E+K_40_59+F_40_59(B,C,D);	\
	E=D, D=C, C=ROTATE(B,30), B=A;	\
	A=ROTATE(A,5)+T;	    } while(0)

#define BODY_60_79(xa,xb,xc,xd)	 do {	\
	Xupdate(T,xa,xa,xb,xc,xd);	\
	T=E+K_60_79+F_60_79(B,C,D);	\
	E=D, D=C, C=ROTATE(B,30), B=A;	\
	A=ROTATE(A,5)+T+(xa);	    } while(0)
506
507 #ifndef DONT_IMPLEMENT_BLOCK_HOST_ORDER
508 void HASH_BLOCK_HOST_ORDER (SHA_CTX *c, const void *d, int num)
509 {
510 const SHA_LONG *W=d;
511 register unsigned MD32_REG_T A,B,C,D,E,T;
512 int i;
513 SHA_LONG X[16];
514
515 A=c->h0;
516 B=c->h1;
517 C=c->h2;
518 D=c->h3;
519 E=c->h4;
520
521 for (;;)
522 {
523 for (i=0;i<16;i++)
524 { X[i]=W[i]; BODY_00_15(X[i]); }
525 for (i=0;i<4;i++)
526 { BODY_16_19(X[i], X[i+2], X[i+8], X[(i+13)&15]); }
527 for (;i<24;i++)
528 { BODY_20_39(X[i&15], X[(i+2)&15], X[(i+8)&15],X[(i+13)&15]); }
529 for (i=0;i<20;i++)
530 { BODY_40_59(X[(i+8)&15],X[(i+10)&15],X[i&15], X[(i+5)&15]); }
531 for (i=4;i<24;i++)
532 { BODY_60_79(X[(i+8)&15],X[(i+10)&15],X[i&15], X[(i+5)&15]); }
533
534 c->h0=(c->h0+A)&0xffffffffL;
535 c->h1=(c->h1+B)&0xffffffffL;
536 c->h2=(c->h2+C)&0xffffffffL;
537 c->h3=(c->h3+D)&0xffffffffL;
538 c->h4=(c->h4+E)&0xffffffffL;
539
540 if (--num <= 0) break;
541
542 A=c->h0;
543 B=c->h1;
544 C=c->h2;
545 D=c->h3;
546 E=c->h4;
547
548 W+=SHA_LBLOCK;
549 }
550 }
551 #endif
552
553 #ifndef DONT_IMPLEMENT_BLOCK_DATA_ORDER
554 void HASH_BLOCK_DATA_ORDER (SHA_CTX *c, const void *p, int num)
555 {
556 const unsigned char *data=p;
557 register unsigned MD32_REG_T A,B,C,D,E,T,l;
558 int i;
559 SHA_LONG X[16];
560
561 A=c->h0;
562 B=c->h1;
563 C=c->h2;
564 D=c->h3;
565 E=c->h4;
566
567 for (;;)
568 {
569 for (i=0;i<16;i++)
570 { HOST_c2l(data,l); X[i]=l; BODY_00_15(X[i]); }
571 for (i=0;i<4;i++)
572 { BODY_16_19(X[i], X[i+2], X[i+8], X[(i+13)&15]); }
573 for (;i<24;i++)
574 { BODY_20_39(X[i&15], X[(i+2)&15], X[(i+8)&15],X[(i+13)&15]); }
575 for (i=0;i<20;i++)
576 { BODY_40_59(X[(i+8)&15],X[(i+10)&15],X[i&15], X[(i+5)&15]); }
577 for (i=4;i<24;i++)
578 { BODY_60_79(X[(i+8)&15],X[(i+10)&15],X[i&15], X[(i+5)&15]); }
579
580 c->h0=(c->h0+A)&0xffffffffL;
581 c->h1=(c->h1+B)&0xffffffffL;
582 c->h2=(c->h2+C)&0xffffffffL;
583 c->h3=(c->h3+D)&0xffffffffL;
584 c->h4=(c->h4+E)&0xffffffffL;
585
586 if (--num <= 0) break;
587
588 A=c->h0;
589 B=c->h1;
590 C=c->h2;
591 D=c->h3;
592 E=c->h4;
593
594 }
595 }
596 #endif
597
598 #endif