1 /* crypto/sha/sha512.c */
2 /* ====================================================================
3 * Copyright (c) 2004 The OpenSSL Project. All rights reserved
4 * according to the OpenSSL license [found in ../../LICENSE].
5 * ====================================================================
7 #if !defined(OPENSSL_NO_SHA) && !defined(OPENSSL_NO_SHA512)
9 * IMPLEMENTATION NOTES.
11 * As you might have noticed 32-bit hash algorithms:
13 * - permit SHA_LONG to be wider than 32-bit (case on CRAY);
14 * - optimized versions implement two transform functions: one operating
15 * on [aligned] data in host byte order and one - on data in input
17 * - share common byte-order neutral collector and padding function
18 * implementations, ../md32_common.h;
20 * Neither of the above applies to this SHA-512 implementations. Reasons
21 * [in reverse order] are:
23 * - it's the only 64-bit hash algorithm for the moment of this writing,
24 * there is no need for common collector/padding implementation [yet];
25 * - by supporting only one transform function [which operates on
26 * *aligned* data in input stream byte order, big-endian in this case]
27 * we minimize burden of maintenance in two ways: a) collector/padding
28 * function is simpler; b) only one transform function to stare at;
29 * - SHA_LONG64 is required to be exactly 64-bit in order to be able to
30 * apply a number of optimizations to mitigate potential performance
31 * penalties caused by previous design decision;
35 * Implementation relies on the fact that "long long" is 64-bit on
36 * both 32- and 64-bit platforms. If some compiler vendor comes up
37 * with 128-bit long long, adjustment to sha.h would be required.
38 * As this implementation relies on 64-bit integer type, it's totally
39 * inappropriate for platforms which don't support it, most notably
41 * <appro@fy.chalmers.se>
46 #include <openssl/opensslconf.h>
47 #include <openssl/crypto.h>
48 #include <openssl/fips_sha.h>
49 #include <openssl/fips.h>
50 #include <openssl/opensslv.h>
54 const char SHA512_version[]="SHA-512" OPENSSL_VERSION_PTEXT;
56 #if defined(_M_IX86) || defined(_M_AMD64) || defined(__i386) || defined(__x86_64)
57 #define SHA512_BLOCK_CAN_MANAGE_UNALIGNED_DATA
60 int SHA384_Init (SHA512_CTX *c)
62 c->h[0]=U64(0xcbbb9d5dc1059ed8);
63 c->h[1]=U64(0x629a292a367cd507);
64 c->h[2]=U64(0x9159015a3070dd17);
65 c->h[3]=U64(0x152fecd8f70e5939);
66 c->h[4]=U64(0x67332667ffc00b31);
67 c->h[5]=U64(0x8eb44a8768581511);
68 c->h[6]=U64(0xdb0c2e0d64f98fa7);
69 c->h[7]=U64(0x47b5481dbefa4fa4);
71 c->num=0; c->md_len=SHA384_DIGEST_LENGTH;
75 int SHA512_Init (SHA512_CTX *c)
77 c->h[0]=U64(0x6a09e667f3bcc908);
78 c->h[1]=U64(0xbb67ae8584caa73b);
79 c->h[2]=U64(0x3c6ef372fe94f82b);
80 c->h[3]=U64(0xa54ff53a5f1d36f1);
81 c->h[4]=U64(0x510e527fade682d1);
82 c->h[5]=U64(0x9b05688c2b3e6c1f);
83 c->h[6]=U64(0x1f83d9abfb41bd6b);
84 c->h[7]=U64(0x5be0cd19137e2179);
86 c->num=0; c->md_len=SHA512_DIGEST_LENGTH;
93 void sha512_block (SHA512_CTX *ctx, const void *in, size_t num);
95 int SHA512_Final (unsigned char *md, SHA512_CTX *c)
97 unsigned char *p=(unsigned char *)c->u.p;
100 p[n]=0x80; /* There always is a room for one */
102 if (n > (sizeof(c->u)-16))
103 memset (p+n,0,sizeof(c->u)-n), n=0,
104 sha512_block (c,p,1);
106 memset (p+n,0,sizeof(c->u)-16-n);
108 c->u.d[SHA_LBLOCK-2] = c->Nh;
109 c->u.d[SHA_LBLOCK-1] = c->Nl;
111 p[sizeof(c->u)-1] = (unsigned char)(c->Nl);
112 p[sizeof(c->u)-2] = (unsigned char)(c->Nl>>8);
113 p[sizeof(c->u)-3] = (unsigned char)(c->Nl>>16);
114 p[sizeof(c->u)-4] = (unsigned char)(c->Nl>>24);
115 p[sizeof(c->u)-5] = (unsigned char)(c->Nl>>32);
116 p[sizeof(c->u)-6] = (unsigned char)(c->Nl>>40);
117 p[sizeof(c->u)-7] = (unsigned char)(c->Nl>>48);
118 p[sizeof(c->u)-8] = (unsigned char)(c->Nl>>56);
119 p[sizeof(c->u)-9] = (unsigned char)(c->Nh);
120 p[sizeof(c->u)-10] = (unsigned char)(c->Nh>>8);
121 p[sizeof(c->u)-11] = (unsigned char)(c->Nh>>16);
122 p[sizeof(c->u)-12] = (unsigned char)(c->Nh>>24);
123 p[sizeof(c->u)-13] = (unsigned char)(c->Nh>>32);
124 p[sizeof(c->u)-14] = (unsigned char)(c->Nh>>40);
125 p[sizeof(c->u)-15] = (unsigned char)(c->Nh>>48);
126 p[sizeof(c->u)-16] = (unsigned char)(c->Nh>>56);
129 sha512_block (c,p,1);
135 /* Let compiler decide if it's appropriate to unroll... */
136 case SHA384_DIGEST_LENGTH:
137 for (n=0;n<SHA384_DIGEST_LENGTH/8;n++)
139 SHA_LONG64 t = c->h[n];
141 *(md++) = (unsigned char)(t>>56);
142 *(md++) = (unsigned char)(t>>48);
143 *(md++) = (unsigned char)(t>>40);
144 *(md++) = (unsigned char)(t>>32);
145 *(md++) = (unsigned char)(t>>24);
146 *(md++) = (unsigned char)(t>>16);
147 *(md++) = (unsigned char)(t>>8);
148 *(md++) = (unsigned char)(t);
151 case SHA512_DIGEST_LENGTH:
152 for (n=0;n<SHA512_DIGEST_LENGTH/8;n++)
154 SHA_LONG64 t = c->h[n];
156 *(md++) = (unsigned char)(t>>56);
157 *(md++) = (unsigned char)(t>>48);
158 *(md++) = (unsigned char)(t>>40);
159 *(md++) = (unsigned char)(t>>32);
160 *(md++) = (unsigned char)(t>>24);
161 *(md++) = (unsigned char)(t>>16);
162 *(md++) = (unsigned char)(t>>8);
163 *(md++) = (unsigned char)(t);
166 /* ... as well as make sure md_len is not abused. */
173 int SHA384_Final (unsigned char *md,SHA512_CTX *c)
174 { return SHA512_Final (md,c); }
176 int SHA512_Update (SHA512_CTX *c, const void *_data, size_t len)
179 unsigned char *p=c->u.p;
180 const unsigned char *data=(const unsigned char *)_data;
182 if(FIPS_selftest_failed())
185 if (len==0) return 1;
187 l = (c->Nl+(((SHA_LONG64)len)<<3))&U64(0xffffffffffffffff);
188 if (l < c->Nl) c->Nh++;
189 if (sizeof(len)>=8) c->Nh+=(((SHA_LONG64)len)>>61);
194 size_t n = sizeof(c->u) - c->num;
198 memcpy (p+c->num,data,len), c->num += len;
202 memcpy (p+c->num,data,n), c->num = 0;
204 sha512_block (c,p,1);
208 if (len >= sizeof(c->u))
210 #ifndef SHA512_BLOCK_CAN_MANAGE_UNALIGNED_DATA
211 if ((size_t)data%sizeof(c->u.d[0]) != 0)
212 while (len >= sizeof(c->u))
213 memcpy (p,data,sizeof(c->u)),
214 sha512_block (c,p,1),
216 data += sizeof(c->u);
219 sha512_block (c,data,len/sizeof(c->u)),
225 if (len != 0) memcpy (p,data,len), c->num = (int)len;
230 int SHA384_Update (SHA512_CTX *c, const void *data, size_t len)
231 { return SHA512_Update (c,data,len); }
233 void SHA512_Transform (SHA512_CTX *c, const unsigned char *data)
234 { sha512_block (c,data,1); }
236 unsigned char *SHA384(const unsigned char *d, size_t n, unsigned char *md)
239 static unsigned char m[SHA384_DIGEST_LENGTH];
241 if (md == NULL) md=m;
243 SHA512_Update(&c,d,n);
245 OPENSSL_cleanse(&c,sizeof(c));
249 unsigned char *SHA512(const unsigned char *d, size_t n, unsigned char *md)
252 static unsigned char m[SHA512_DIGEST_LENGTH];
254 if (md == NULL) md=m;
256 SHA512_Update(&c,d,n);
258 OPENSSL_cleanse(&c,sizeof(c));
263 static const SHA_LONG64 K512[80] = {
264 U64(0x428a2f98d728ae22),U64(0x7137449123ef65cd),
265 U64(0xb5c0fbcfec4d3b2f),U64(0xe9b5dba58189dbbc),
266 U64(0x3956c25bf348b538),U64(0x59f111f1b605d019),
267 U64(0x923f82a4af194f9b),U64(0xab1c5ed5da6d8118),
268 U64(0xd807aa98a3030242),U64(0x12835b0145706fbe),
269 U64(0x243185be4ee4b28c),U64(0x550c7dc3d5ffb4e2),
270 U64(0x72be5d74f27b896f),U64(0x80deb1fe3b1696b1),
271 U64(0x9bdc06a725c71235),U64(0xc19bf174cf692694),
272 U64(0xe49b69c19ef14ad2),U64(0xefbe4786384f25e3),
273 U64(0x0fc19dc68b8cd5b5),U64(0x240ca1cc77ac9c65),
274 U64(0x2de92c6f592b0275),U64(0x4a7484aa6ea6e483),
275 U64(0x5cb0a9dcbd41fbd4),U64(0x76f988da831153b5),
276 U64(0x983e5152ee66dfab),U64(0xa831c66d2db43210),
277 U64(0xb00327c898fb213f),U64(0xbf597fc7beef0ee4),
278 U64(0xc6e00bf33da88fc2),U64(0xd5a79147930aa725),
279 U64(0x06ca6351e003826f),U64(0x142929670a0e6e70),
280 U64(0x27b70a8546d22ffc),U64(0x2e1b21385c26c926),
281 U64(0x4d2c6dfc5ac42aed),U64(0x53380d139d95b3df),
282 U64(0x650a73548baf63de),U64(0x766a0abb3c77b2a8),
283 U64(0x81c2c92e47edaee6),U64(0x92722c851482353b),
284 U64(0xa2bfe8a14cf10364),U64(0xa81a664bbc423001),
285 U64(0xc24b8b70d0f89791),U64(0xc76c51a30654be30),
286 U64(0xd192e819d6ef5218),U64(0xd69906245565a910),
287 U64(0xf40e35855771202a),U64(0x106aa07032bbd1b8),
288 U64(0x19a4c116b8d2d0c8),U64(0x1e376c085141ab53),
289 U64(0x2748774cdf8eeb99),U64(0x34b0bcb5e19b48a8),
290 U64(0x391c0cb3c5c95a63),U64(0x4ed8aa4ae3418acb),
291 U64(0x5b9cca4f7763e373),U64(0x682e6ff3d6b2b8a3),
292 U64(0x748f82ee5defb2fc),U64(0x78a5636f43172f60),
293 U64(0x84c87814a1f0ab72),U64(0x8cc702081a6439ec),
294 U64(0x90befffa23631e28),U64(0xa4506cebde82bde9),
295 U64(0xbef9a3f7b2c67915),U64(0xc67178f2e372532b),
296 U64(0xca273eceea26619c),U64(0xd186b8c721c0c207),
297 U64(0xeada7dd6cde0eb1e),U64(0xf57d4f7fee6ed178),
298 U64(0x06f067aa72176fba),U64(0x0a637dc5a2c898a6),
299 U64(0x113f9804bef90dae),U64(0x1b710b35131c471b),
300 U64(0x28db77f523047d84),U64(0x32caab7b40c72493),
301 U64(0x3c9ebe0a15c9bebc),U64(0x431d67c49c100d4c),
302 U64(0x4cc5d4becb3e42b6),U64(0x597f299cfc657e2a),
303 U64(0x5fcb6fab3ad6faec),U64(0x6c44198c4a475817) };
306 # if defined(__GNUC__) && __GNUC__>=2 && !defined(OPENSSL_NO_ASM) && !defined(OPENSSL_NO_INLINE_ASM)
307 # if defined(__x86_64) || defined(__x86_64__)
308 # define PULL64(x) ({ SHA_LONG64 ret=*((const SHA_LONG64 *)(&(x))); \
317 #define B(x,j) (((SHA_LONG64)(*(((const unsigned char *)(&x))+j)))<<((7-j)*8))
318 #define PULL64(x) (B(x,0)|B(x,1)|B(x,2)|B(x,3)|B(x,4)|B(x,5)|B(x,6)|B(x,7))
322 # if defined(_MSC_VER)
323 # if defined(_WIN64) /* applies to both IA-64 and AMD64 */
324 # define ROTR(a,n) _rotr64((a),n)
326 # elif defined(__GNUC__) && __GNUC__>=2 && !defined(OPENSSL_NO_ASM) && !defined(OPENSSL_NO_INLINE_ASM)
327 # if defined(__x86_64) || defined(__x86_64__)
328 # define ROTR(a,n) ({ unsigned long ret; \
333 # elif defined(_ARCH_PPC) && defined(__64BIT__)
334 # define ROTR(a,n) ({ unsigned long ret; \
335 asm ("rotrdi %0,%1,%2" \
337 : "r"(a),"K"(n)); ret; })
343 #define ROTR(x,s) (((x)>>s) | (x)<<(64-s))
346 #define Sigma0(x) (ROTR((x),28) ^ ROTR((x),34) ^ ROTR((x),39))
347 #define Sigma1(x) (ROTR((x),14) ^ ROTR((x),18) ^ ROTR((x),41))
348 #define sigma0(x) (ROTR((x),1) ^ ROTR((x),8) ^ ((x)>>7))
349 #define sigma1(x) (ROTR((x),19) ^ ROTR((x),61) ^ ((x)>>6))
351 #define Ch(x,y,z) (((x) & (y)) ^ ((~(x)) & (z)))
352 #define Maj(x,y,z) (((x) & (y)) ^ ((x) & (z)) ^ ((y) & (z)))
354 #ifdef OPENSSL_SMALL_FOOTPRINT
356 static void sha512_block (SHA512_CTX *ctx, const void *in, size_t num)
358 const SHA_LONG64 *W=in;
359 SHA_LONG64 a,b,c,d,e,f,g,h,s0,s1,T1,T2;
365 a = ctx->h[0]; b = ctx->h[1]; c = ctx->h[2]; d = ctx->h[3];
366 e = ctx->h[4]; f = ctx->h[5]; g = ctx->h[6]; h = ctx->h[7];
373 T1 = X[i] = PULL64(W[i]);
375 T1 += h + Sigma1(e) + Ch(e,f,g) + K512[i];
376 T2 = Sigma0(a) + Maj(a,b,c);
377 h = g; g = f; f = e; e = d + T1;
378 d = c; c = b; b = a; a = T1 + T2;
383 s0 = X[(i+1)&0x0f]; s0 = sigma0(s0);
384 s1 = X[(i+14)&0x0f]; s1 = sigma1(s1);
386 T1 = X[i&0xf] += s0 + s1 + X[(i+9)&0xf];
387 T1 += h + Sigma1(e) + Ch(e,f,g) + K512[i];
388 T2 = Sigma0(a) + Maj(a,b,c);
389 h = g; g = f; f = e; e = d + T1;
390 d = c; c = b; b = a; a = T1 + T2;
393 ctx->h[0] += a; ctx->h[1] += b; ctx->h[2] += c; ctx->h[3] += d;
394 ctx->h[4] += e; ctx->h[5] += f; ctx->h[6] += g; ctx->h[7] += h;
402 #define ROUND_00_15(i,a,b,c,d,e,f,g,h) do { \
403 T1 += h + Sigma1(e) + Ch(e,f,g) + K512[i]; \
404 h = Sigma0(a) + Maj(a,b,c); \
405 d += T1; h += T1; } while (0)
407 #define ROUND_16_80(i,a,b,c,d,e,f,g,h,X) do { \
408 s0 = X[(i+1)&0x0f]; s0 = sigma0(s0); \
409 s1 = X[(i+14)&0x0f]; s1 = sigma1(s1); \
410 T1 = X[(i)&0x0f] += s0 + s1 + X[(i+9)&0x0f]; \
411 ROUND_00_15(i,a,b,c,d,e,f,g,h); } while (0)
413 static void sha512_block (SHA512_CTX *ctx, const void *in, size_t num)
415 const SHA_LONG64 *W=in;
416 SHA_LONG64 a,b,c,d,e,f,g,h,s0,s1,T1;
422 a = ctx->h[0]; b = ctx->h[1]; c = ctx->h[2]; d = ctx->h[3];
423 e = ctx->h[4]; f = ctx->h[5]; g = ctx->h[6]; h = ctx->h[7];
426 T1 = X[0] = W[0]; ROUND_00_15(0,a,b,c,d,e,f,g,h);
427 T1 = X[1] = W[1]; ROUND_00_15(1,h,a,b,c,d,e,f,g);
428 T1 = X[2] = W[2]; ROUND_00_15(2,g,h,a,b,c,d,e,f);
429 T1 = X[3] = W[3]; ROUND_00_15(3,f,g,h,a,b,c,d,e);
430 T1 = X[4] = W[4]; ROUND_00_15(4,e,f,g,h,a,b,c,d);
431 T1 = X[5] = W[5]; ROUND_00_15(5,d,e,f,g,h,a,b,c);
432 T1 = X[6] = W[6]; ROUND_00_15(6,c,d,e,f,g,h,a,b);
433 T1 = X[7] = W[7]; ROUND_00_15(7,b,c,d,e,f,g,h,a);
434 T1 = X[8] = W[8]; ROUND_00_15(8,a,b,c,d,e,f,g,h);
435 T1 = X[9] = W[9]; ROUND_00_15(9,h,a,b,c,d,e,f,g);
436 T1 = X[10] = W[10]; ROUND_00_15(10,g,h,a,b,c,d,e,f);
437 T1 = X[11] = W[11]; ROUND_00_15(11,f,g,h,a,b,c,d,e);
438 T1 = X[12] = W[12]; ROUND_00_15(12,e,f,g,h,a,b,c,d);
439 T1 = X[13] = W[13]; ROUND_00_15(13,d,e,f,g,h,a,b,c);
440 T1 = X[14] = W[14]; ROUND_00_15(14,c,d,e,f,g,h,a,b);
441 T1 = X[15] = W[15]; ROUND_00_15(15,b,c,d,e,f,g,h,a);
443 T1 = X[0] = PULL64(W[0]); ROUND_00_15(0,a,b,c,d,e,f,g,h);
444 T1 = X[1] = PULL64(W[1]); ROUND_00_15(1,h,a,b,c,d,e,f,g);
445 T1 = X[2] = PULL64(W[2]); ROUND_00_15(2,g,h,a,b,c,d,e,f);
446 T1 = X[3] = PULL64(W[3]); ROUND_00_15(3,f,g,h,a,b,c,d,e);
447 T1 = X[4] = PULL64(W[4]); ROUND_00_15(4,e,f,g,h,a,b,c,d);
448 T1 = X[5] = PULL64(W[5]); ROUND_00_15(5,d,e,f,g,h,a,b,c);
449 T1 = X[6] = PULL64(W[6]); ROUND_00_15(6,c,d,e,f,g,h,a,b);
450 T1 = X[7] = PULL64(W[7]); ROUND_00_15(7,b,c,d,e,f,g,h,a);
451 T1 = X[8] = PULL64(W[8]); ROUND_00_15(8,a,b,c,d,e,f,g,h);
452 T1 = X[9] = PULL64(W[9]); ROUND_00_15(9,h,a,b,c,d,e,f,g);
453 T1 = X[10] = PULL64(W[10]); ROUND_00_15(10,g,h,a,b,c,d,e,f);
454 T1 = X[11] = PULL64(W[11]); ROUND_00_15(11,f,g,h,a,b,c,d,e);
455 T1 = X[12] = PULL64(W[12]); ROUND_00_15(12,e,f,g,h,a,b,c,d);
456 T1 = X[13] = PULL64(W[13]); ROUND_00_15(13,d,e,f,g,h,a,b,c);
457 T1 = X[14] = PULL64(W[14]); ROUND_00_15(14,c,d,e,f,g,h,a,b);
458 T1 = X[15] = PULL64(W[15]); ROUND_00_15(15,b,c,d,e,f,g,h,a);
463 ROUND_16_80(i+0,a,b,c,d,e,f,g,h,X);
464 ROUND_16_80(i+1,h,a,b,c,d,e,f,g,X);
465 ROUND_16_80(i+2,g,h,a,b,c,d,e,f,X);
466 ROUND_16_80(i+3,f,g,h,a,b,c,d,e,X);
467 ROUND_16_80(i+4,e,f,g,h,a,b,c,d,X);
468 ROUND_16_80(i+5,d,e,f,g,h,a,b,c,X);
469 ROUND_16_80(i+6,c,d,e,f,g,h,a,b,X);
470 ROUND_16_80(i+7,b,c,d,e,f,g,h,a,X);
473 ctx->h[0] += a; ctx->h[1] += b; ctx->h[2] += c; ctx->h[3] += d;
474 ctx->h[4] += e; ctx->h[5] += f; ctx->h[6] += g; ctx->h[7] += h;
482 #endif /* SHA512_ASM */
486 #endif /* OPENSSL_NO_SHA512 */