1 /* crypto/sha/sha512.c */
   2 /* ====================================================================
   3  * Copyright (c) 2004 The OpenSSL Project.  All rights reserved
   4  * according to the OpenSSL license [found in ../../LICENSE].
   5  * ====================================================================
   6  */
   7 #include <openssl/opensslconf.h>
   8 #if !defined(OPENSSL_NO_SHA) && !defined(OPENSSL_NO_SHA512)
   9 /*
  10  * IMPLEMENTATION NOTES.
  11  *
  12  * As you might have noticed 32-bit hash algorithms:
  13  *
  14  * - permit SHA_LONG to be wider than 32-bit (case on CRAY);
  15  * - optimized versions implement two transform functions: one operating
  16  *   on [aligned] data in host byte order and one - on data in input
  17  *   stream byte order;
  18  * - share common byte-order neutral collector and padding function
  19  *   implementations, ../md32_common.h;
  20  *
  21  * Neither of the above applies to this SHA-512 implementations. Reasons
  22  * [in reverse order] are:
  23  *
  24  * - it's the only 64-bit hash algorithm for the moment of this writing,
  25  *   there is no need for common collector/padding implementation [yet];
  26  * - by supporting only one transform function [which operates on
  27  *   *aligned* data in input stream byte order, big-endian in this case]
  28  *   we minimize burden of maintenance in two ways: a) collector/padding
  29  *   function is simpler; b) only one transform function to stare at;
  30  * - SHA_LONG64 is required to be exactly 64-bit in order to be able to
  31  *   apply a number of optimizations to mitigate potential performance
  32  *   penalties caused by previous design decision;
  33  *
  34  * Caveat lector.
  35  *
  36  * Implementation relies on the fact that "long long" is 64-bit on
  37  * both 32- and 64-bit platforms. If some compiler vendor comes up
  38  * with 128-bit long long, adjustment to sha.h would be required.
  39  * As this implementation relies on 64-bit integer type, it's totally
  40  * inappropriate for platforms which don't support it, most notably
  41  * 16-bit platforms.
  42  *                                      <appro@fy.chalmers.se>
  43  */
  44 #include <stdlib.h>
  45 #include <string.h>
  46 
  47 #include <openssl/crypto.h>
  48 #include <openssl/sha.h>
  49 #include <openssl/opensslv.h>
  50 
  51 #include "cryptlib.h"
  52 
  53 const char SHA512_version[]="SHA-512" OPENSSL_VERSION_PTEXT;
  54 
  55 #if defined(__i386) || defined(__i386__) || defined(_M_IX86) || \
  56     defined(__x86_64) || defined(_M_AMD64) || defined(_M_X64) || \
  57     defined(__s390__) || defined(__s390x__) || \
  58     defined(SHA512_ASM)
  59 #define SHA512_BLOCK_CAN_MANAGE_UNALIGNED_DATA
  60 #endif
  61 
  62 fips_md_init_ctx(SHA384, SHA512)
  63         {
  64         c->h[0]=U64(0xcbbb9d5dc1059ed8);
  65         c->h[1]=U64(0x629a292a367cd507);
  66         c->h[2]=U64(0x9159015a3070dd17);
  67         c->h[3]=U64(0x152fecd8f70e5939);
  68         c->h[4]=U64(0x67332667ffc00b31);
  69         c->h[5]=U64(0x8eb44a8768581511);
  70         c->h[6]=U64(0xdb0c2e0d64f98fa7);
  71         c->h[7]=U64(0x47b5481dbefa4fa4);
  72 
  73         c->Nl=0;        c->Nh=0;
  74         c->num=0;       c->md_len=SHA384_DIGEST_LENGTH;
  75         return 1;
  76         }
  77 
  78 fips_md_init(SHA512)
  79         {
  80         c->h[0]=U64(0x6a09e667f3bcc908);
  81         c->h[1]=U64(0xbb67ae8584caa73b);
  82         c->h[2]=U64(0x3c6ef372fe94f82b);
  83         c->h[3]=U64(0xa54ff53a5f1d36f1);
  84         c->h[4]=U64(0x510e527fade682d1);
  85         c->h[5]=U64(0x9b05688c2b3e6c1f);
  86         c->h[6]=U64(0x1f83d9abfb41bd6b);
  87         c->h[7]=U64(0x5be0cd19137e2179);
  88 
  89         c->Nl=0;        c->Nh=0;
  90         c->num=0;       c->md_len=SHA512_DIGEST_LENGTH;
  91         return 1;
  92         }
  93 
  94 #ifndef SHA512_ASM
  95 static
  96 #endif
  97 void sha512_block_data_order (SHA512_CTX *ctx, const void *in, size_t num);
  98 
  99 int SHA512_Final (unsigned char *md, SHA512_CTX *c)
 100         {
 101         unsigned char *p=(unsigned char *)c->u.p;
 102         size_t n=c->num;
 103 
 104         p[n]=0x80;      /* There always is a room for one */
 105         n++;
 106         if (n > (sizeof(c->u)-16))
 107                 memset (p+n,0,sizeof(c->u)-n), n=0,
 108                 sha512_block_data_order (c,p,1);
 109 
 110         memset (p+n,0,sizeof(c->u)-16-n);
 111 #ifdef  B_ENDIAN
 112         c->u.d[SHA_LBLOCK-2] = c->Nh;
 113         c->u.d[SHA_LBLOCK-1] = c->Nl;
 114 #else
 115         p[sizeof(c->u)-1]  = (unsigned char)(c->Nl);
 116         p[sizeof(c->u)-2]  = (unsigned char)(c->Nl>>8);
 117         p[sizeof(c->u)-3]  = (unsigned char)(c->Nl>>16);
 118         p[sizeof(c->u)-4]  = (unsigned char)(c->Nl>>24);
 119         p[sizeof(c->u)-5]  = (unsigned char)(c->Nl>>32);
 120         p[sizeof(c->u)-6]  = (unsigned char)(c->Nl>>40);
 121         p[sizeof(c->u)-7]  = (unsigned char)(c->Nl>>48);
 122         p[sizeof(c->u)-8]  = (unsigned char)(c->Nl>>56);
 123         p[sizeof(c->u)-9]  = (unsigned char)(c->Nh);
 124         p[sizeof(c->u)-10] = (unsigned char)(c->Nh>>8);
 125         p[sizeof(c->u)-11] = (unsigned char)(c->Nh>>16);
 126         p[sizeof(c->u)-12] = (unsigned char)(c->Nh>>24);
 127         p[sizeof(c->u)-13] = (unsigned char)(c->Nh>>32);
 128         p[sizeof(c->u)-14] = (unsigned char)(c->Nh>>40);
 129         p[sizeof(c->u)-15] = (unsigned char)(c->Nh>>48);
 130         p[sizeof(c->u)-16] = (unsigned char)(c->Nh>>56);
 131 #endif
 132 
 133         sha512_block_data_order (c,p,1);
 134 
 135         if (md==0) return 0;
 136 
 137         switch (c->md_len)
 138                 {
 139                 /* Let compiler decide if it's appropriate to unroll... */
 140                 case SHA384_DIGEST_LENGTH:
 141                         for (n=0;n<SHA384_DIGEST_LENGTH/8;n++)
 142                                 {
 143                                 SHA_LONG64 t = c->h[n];
 144 
 145                                 *(md++) = (unsigned char)(t>>56);
 146                                 *(md++) = (unsigned char)(t>>48);
 147                                 *(md++) = (unsigned char)(t>>40);
 148                                 *(md++) = (unsigned char)(t>>32);
 149                                 *(md++) = (unsigned char)(t>>24);
 150                                 *(md++) = (unsigned char)(t>>16);
 151                                 *(md++) = (unsigned char)(t>>8);
 152                                 *(md++) = (unsigned char)(t);
 153                                 }
 154                         break;
 155                 case SHA512_DIGEST_LENGTH:
 156                         for (n=0;n<SHA512_DIGEST_LENGTH/8;n++)
 157                                 {
 158                                 SHA_LONG64 t = c->h[n];
 159 
 160                                 *(md++) = (unsigned char)(t>>56);
 161                                 *(md++) = (unsigned char)(t>>48);
 162                                 *(md++) = (unsigned char)(t>>40);
 163                                 *(md++) = (unsigned char)(t>>32);
 164                                 *(md++) = (unsigned char)(t>>24);
 165                                 *(md++) = (unsigned char)(t>>16);
 166                                 *(md++) = (unsigned char)(t>>8);
 167                                 *(md++) = (unsigned char)(t);
 168                                 }
 169                         break;
 170                 /* ... as well as make sure md_len is not abused. */
 171                 default:        return 0;
 172                 }
 173 
 174         return 1;
 175         }
 176 
 177 int SHA384_Final (unsigned char *md,SHA512_CTX *c)
 178 {   return SHA512_Final (md,c);   }
 179 
 180 int SHA512_Update (SHA512_CTX *c, const void *_data, size_t len)
 181         {
 182         SHA_LONG64      l;
 183         unsigned char  *p=c->u.p;
 184         const unsigned char *data=(const unsigned char *)_data;
 185 
 186         if (len==0) return  1;
 187 
 188         l = (c->Nl+(((SHA_LONG64)len)<<3))&U64(0xffffffffffffffff);
 189         if (l < c->Nl)            c->Nh++;
 190         if (sizeof(len)>=8)  c->Nh+=(((SHA_LONG64)len)>>61);
 191         c->Nl=l;
 192 
 193         if (c->num != 0)
 194                 {
 195                 size_t n = sizeof(c->u) - c->num;
 196 
 197                 if (len < n)
 198                         {
 199                         memcpy (p+c->num,data,len), c->num += (unsigned int)len;
 200                         return 1;
 201                         }
 202                 else    {
 203                         memcpy (p+c->num,data,n), c->num = 0;
 204                         len-=n, data+=n;
 205                         sha512_block_data_order (c,p,1);
 206                         }
 207                 }
 208 
 209         if (len >= sizeof(c->u))
 210                 {
 211 #ifndef SHA512_BLOCK_CAN_MANAGE_UNALIGNED_DATA
 212                 if ((size_t)data%sizeof(c->u.d[0]) != 0)
 213                         while (len >= sizeof(c->u))
 214                                 memcpy (p,data,sizeof(c->u)),
 215                                 sha512_block_data_order (c,p,1),
 216                                 len  -= sizeof(c->u),
 217                                 data += sizeof(c->u);
 218                 else
 219 #endif
 220                         sha512_block_data_order (c,data,len/sizeof(c->u)),
 221                         data += len,
 222                         len  %= sizeof(c->u),
 223                         data -= len;
 224                 }
 225 
 226         if (len != 0)   memcpy (p,data,len), c->num = (int)len;
 227 
 228         return 1;
 229         }
 230 
 231 int SHA384_Update (SHA512_CTX *c, const void *data, size_t len)
 232 {   return SHA512_Update (c,data,len);   }
 233 
 234 void SHA512_Transform (SHA512_CTX *c, const unsigned char *data)
 235         {
 236 #ifndef SHA512_BLOCK_CAN_MANAGE_UNALIGNED_DATA
 237         if ((size_t)data%sizeof(c->u.d[0]) != 0)
 238                 memcpy(c->u.p,data,sizeof(c->u.p)),
 239                 data = c->u.p;
 240 #endif
 241         sha512_block_data_order (c,data,1);
 242         }
 243 
 244 unsigned char *SHA384(const unsigned char *d, size_t n, unsigned char *md)
 245         {
 246         SHA512_CTX c;
 247         static unsigned char m[SHA384_DIGEST_LENGTH];
 248 
 249         if (md == NULL) md=m;
 250         SHA384_Init(&c);
 251         SHA512_Update(&c,d,n);
 252         SHA512_Final(md,&c);
 253         OPENSSL_cleanse(&c,sizeof(c));
 254         return(md);
 255         }
 256 
 257 unsigned char *SHA512(const unsigned char *d, size_t n, unsigned char *md)
 258         {
 259         SHA512_CTX c;
 260         static unsigned char m[SHA512_DIGEST_LENGTH];
 261 
 262         if (md == NULL) md=m;
 263         SHA512_Init(&c);
 264         SHA512_Update(&c,d,n);
 265         SHA512_Final(md,&c);
 266         OPENSSL_cleanse(&c,sizeof(c));
 267         return(md);
 268         }
 269 
 270 #ifndef SHA512_ASM
 271 static const SHA_LONG64 K512[80] = {
 272         U64(0x428a2f98d728ae22),U64(0x7137449123ef65cd),
 273         U64(0xb5c0fbcfec4d3b2f),U64(0xe9b5dba58189dbbc),
 274         U64(0x3956c25bf348b538),U64(0x59f111f1b605d019),
 275         U64(0x923f82a4af194f9b),U64(0xab1c5ed5da6d8118),
 276         U64(0xd807aa98a3030242),U64(0x12835b0145706fbe),
 277         U64(0x243185be4ee4b28c),U64(0x550c7dc3d5ffb4e2),
 278         U64(0x72be5d74f27b896f),U64(0x80deb1fe3b1696b1),
 279         U64(0x9bdc06a725c71235),U64(0xc19bf174cf692694),
 280         U64(0xe49b69c19ef14ad2),U64(0xefbe4786384f25e3),
 281         U64(0x0fc19dc68b8cd5b5),U64(0x240ca1cc77ac9c65),
 282         U64(0x2de92c6f592b0275),U64(0x4a7484aa6ea6e483),
 283         U64(0x5cb0a9dcbd41fbd4),U64(0x76f988da831153b5),
 284         U64(0x983e5152ee66dfab),U64(0xa831c66d2db43210),
 285         U64(0xb00327c898fb213f),U64(0xbf597fc7beef0ee4),
 286         U64(0xc6e00bf33da88fc2),U64(0xd5a79147930aa725),
 287         U64(0x06ca6351e003826f),U64(0x142929670a0e6e70),
 288         U64(0x27b70a8546d22ffc),U64(0x2e1b21385c26c926),
 289         U64(0x4d2c6dfc5ac42aed),U64(0x53380d139d95b3df),
 290         U64(0x650a73548baf63de),U64(0x766a0abb3c77b2a8),
 291         U64(0x81c2c92e47edaee6),U64(0x92722c851482353b),
 292         U64(0xa2bfe8a14cf10364),U64(0xa81a664bbc423001),
 293         U64(0xc24b8b70d0f89791),U64(0xc76c51a30654be30),
 294         U64(0xd192e819d6ef5218),U64(0xd69906245565a910),
 295         U64(0xf40e35855771202a),U64(0x106aa07032bbd1b8),
 296         U64(0x19a4c116b8d2d0c8),U64(0x1e376c085141ab53),
 297         U64(0x2748774cdf8eeb99),U64(0x34b0bcb5e19b48a8),
 298         U64(0x391c0cb3c5c95a63),U64(0x4ed8aa4ae3418acb),
 299         U64(0x5b9cca4f7763e373),U64(0x682e6ff3d6b2b8a3),
 300         U64(0x748f82ee5defb2fc),U64(0x78a5636f43172f60),
 301         U64(0x84c87814a1f0ab72),U64(0x8cc702081a6439ec),
 302         U64(0x90befffa23631e28),U64(0xa4506cebde82bde9),
 303         U64(0xbef9a3f7b2c67915),U64(0xc67178f2e372532b),
 304         U64(0xca273eceea26619c),U64(0xd186b8c721c0c207),
 305         U64(0xeada7dd6cde0eb1e),U64(0xf57d4f7fee6ed178),
 306         U64(0x06f067aa72176fba),U64(0x0a637dc5a2c898a6),
 307         U64(0x113f9804bef90dae),U64(0x1b710b35131c471b),
 308         U64(0x28db77f523047d84),U64(0x32caab7b40c72493),
 309         U64(0x3c9ebe0a15c9bebc),U64(0x431d67c49c100d4c),
 310         U64(0x4cc5d4becb3e42b6),U64(0x597f299cfc657e2a),
 311         U64(0x5fcb6fab3ad6faec),U64(0x6c44198c4a475817) };
 312 
 313 #ifndef PEDANTIC
 314 # if defined(__GNUC__) && __GNUC__>=2 && !defined(OPENSSL_NO_ASM) && !defined(OPENSSL_NO_INLINE_ASM)
 315 #  if defined(__x86_64) || defined(__x86_64__)
 316 #   define ROTR(a,n)    ({ SHA_LONG64 ret;              \
 317                                 asm ("rorq %1,%0"       \
 318                                 : "=r"(ret)             \
 319                                 : "J"(n),"0"(a)         \
 320                                 : "cc"); ret;           })
 321 #   if !defined(B_ENDIAN)
 322 #    define PULL64(x) ({ SHA_LONG64 ret=*((const SHA_LONG64 *)(&(x)));      \
 323                                 asm ("bswapq    %0"             \
 324                                 : "=r"(ret)                     \
 325                                 : "0"(ret)); ret;               })
 326 #   endif
 327 #  elif (defined(__i386) || defined(__i386__)) && !defined(B_ENDIAN)
 328 #   if defined(I386_ONLY)
 329 #    define PULL64(x) ({ const unsigned int *p=(const unsigned int *)(&(x));\
 330                          unsigned int hi=p[0],lo=p[1];          \
 331                                 asm("xchgb %%ah,%%al;xchgb %%dh,%%dl;"\
 332                                     "roll $16,%%eax; roll $16,%%edx; "\
 333                                     "xchgb %%ah,%%al;xchgb %%dh,%%dl;" \
 334                                 : "=a"(lo),"=d"(hi)             \
 335                                 : "0"(lo),"1"(hi) : "cc");      \
 336                                 ((SHA_LONG64)hi)<<32|lo;  })
 337 #   else
 338 #    define PULL64(x) ({ const unsigned int *p=(const unsigned int *)(&(x));\
 339                          unsigned int hi=p[0],lo=p[1];          \
 340                                 asm ("bswapl %0; bswapl %1;"    \
 341                                 : "=r"(lo),"=r"(hi)             \
 342                                 : "0"(lo),"1"(hi));             \
 343                                 ((SHA_LONG64)hi)<<32|lo;  })
 344 #   endif
 345 #  elif (defined(_ARCH_PPC) && defined(__64BIT__)) || defined(_ARCH_PPC64)
 346 #   define ROTR(a,n)    ({ SHA_LONG64 ret;              \
 347                                 asm ("rotrdi %0,%1,%2"  \
 348                                 : "=r"(ret)             \
 349                                 : "r"(a),"K"(n)); ret;  })
 350 #  endif
 351 # elif defined(_MSC_VER)
 352 #  if defined(_WIN64)   /* applies to both IA-64 and AMD64 */
 353 #   pragma intrinsic(_rotr64)
 354 #   define ROTR(a,n)    _rotr64((a),n)
 355 #  endif
 356 #  if defined(_M_IX86) && !defined(OPENSSL_NO_ASM) && !defined(OPENSSL_NO_INLINE_ASM)
 357 #   if defined(I386_ONLY)
 358     static SHA_LONG64 __fastcall __pull64be(const void *x)
 359     {   _asm    mov     edx, [ecx + 0]
 360         _asm    mov     eax, [ecx + 4]
 361         _asm    xchg    dh,dl
 362         _asm    xchg    ah,al
 363         _asm    rol     edx,16
 364         _asm    rol     eax,16
 365         _asm    xchg    dh,dl
 366         _asm    xchg    ah,al
 367     }
 368 #   else
 369     static SHA_LONG64 __fastcall __pull64be(const void *x)
 370     {   _asm    mov     edx, [ecx + 0]
 371         _asm    mov     eax, [ecx + 4]
 372         _asm    bswap   edx
 373         _asm    bswap   eax
 374     }
 375 #   endif
 376 #   define PULL64(x) __pull64be(&(x))
 377 #   if _MSC_VER<=1200
 378 #    pragma inline_depth(0)
 379 #   endif
 380 #  endif
 381 # endif
 382 #endif
 383 
 384 #ifndef PULL64
 385 #define B(x,j)    (((SHA_LONG64)(*(((const unsigned char *)(&x))+j)))<<((7-j)*8))
 386 #define PULL64(x) (B(x,0)|B(x,1)|B(x,2)|B(x,3)|B(x,4)|B(x,5)|B(x,6)|B(x,7))
 387 #endif
 388 
 389 #ifndef ROTR
 390 #define ROTR(x,s)       (((x)>>s) | (x)<<(64-s))
 391 #endif
 392 
 393 #define Sigma0(x)       (ROTR((x),28) ^ ROTR((x),34) ^ ROTR((x),39))
 394 #define Sigma1(x)       (ROTR((x),14) ^ ROTR((x),18) ^ ROTR((x),41))
 395 #define sigma0(x)       (ROTR((x),1)  ^ ROTR((x),8)  ^ ((x)>>7))
 396 #define sigma1(x)       (ROTR((x),19) ^ ROTR((x),61) ^ ((x)>>6))
 397 
 398 #define Ch(x,y,z)       (((x) & (y)) ^ ((~(x)) & (z)))
 399 #define Maj(x,y,z)      (((x) & (y)) ^ ((x) & (z)) ^ ((y) & (z)))
 400 
 401 
 402 #if defined(__i386) || defined(__i386__) || defined(_M_IX86)
 403 /*
 404  * This code should give better results on 32-bit CPU with less than
 405  * ~24 registers, both size and performance wise...
 406  */
 407 static void sha512_block_data_order (SHA512_CTX *ctx, const void *in, size_t num)
 408         {
 409         const SHA_LONG64 *W=in;
 410         SHA_LONG64      A,E,T;
 411         SHA_LONG64      X[9+80],*F;
 412         int i;
 413 
 414                         while (num--) {
 415 
 416         F    = X+80;
 417         A    = ctx->h[0];    F[1] = ctx->h[1];
 418         F[2] = ctx->h[2];    F[3] = ctx->h[3];
 419         E    = ctx->h[4];    F[5] = ctx->h[5];
 420         F[6] = ctx->h[6];    F[7] = ctx->h[7];
 421 
 422         for (i=0;i<16;i++,F--)
 423                 {
 424 #ifdef B_ENDIAN
 425                 T = W[i];
 426 #else
 427                 T = PULL64(W[i]);
 428 #endif
 429                 F[0] = A;
 430                 F[4] = E;
 431                 F[8] = T;
 432                 T   += F[7] + Sigma1(E) + Ch(E,F[5],F[6]) + K512[i];
 433                 E    = F[3] + T;
 434                 A    = T + Sigma0(A) + Maj(A,F[1],F[2]);
 435                 }
 436 
 437         for (;i<80;i++,F--)
 438                 {
 439                 T    = sigma0(F[8+16-1]);
 440                 T   += sigma1(F[8+16-14]);
 441                 T   += F[8+16] + F[8+16-9];
 442 
 443                 F[0] = A;
 444                 F[4] = E;
 445                 F[8] = T;
 446                 T   += F[7] + Sigma1(E) + Ch(E,F[5],F[6]) + K512[i];
 447                 E    = F[3] + T;
 448                 A    = T + Sigma0(A) + Maj(A,F[1],F[2]);
 449                 }
 450 
 451         ctx->h[0] += A;              ctx->h[1] += F[1];
 452         ctx->h[2] += F[2];   ctx->h[3] += F[3];
 453         ctx->h[4] += E;              ctx->h[5] += F[5];
 454         ctx->h[6] += F[6];   ctx->h[7] += F[7];
 455 
 456                         W+=SHA_LBLOCK;
 457                         }
 458         }
 459 
 460 #elif defined(OPENSSL_SMALL_FOOTPRINT)
 461 
 462 static void sha512_block_data_order (SHA512_CTX *ctx, const void *in, size_t num)
 463         {
 464         const SHA_LONG64 *W=in;
 465         SHA_LONG64      a,b,c,d,e,f,g,h,s0,s1,T1,T2;
 466         SHA_LONG64      X[16];
 467         int i;
 468 
 469                         while (num--) {
 470 
 471         a = ctx->h[0];       b = ctx->h[1];       c = ctx->h[2];       d = ctx->h[3];
 472         e = ctx->h[4];       f = ctx->h[5];       g = ctx->h[6];       h = ctx->h[7];
 473 
 474         for (i=0;i<16;i++)
 475                 {
 476 #ifdef B_ENDIAN
 477                 T1 = X[i] = W[i];
 478 #else
 479                 T1 = X[i] = PULL64(W[i]);
 480 #endif
 481                 T1 += h + Sigma1(e) + Ch(e,f,g) + K512[i];
 482                 T2 = Sigma0(a) + Maj(a,b,c);
 483                 h = g;  g = f;  f = e;  e = d + T1;
 484                 d = c;  c = b;  b = a;  a = T1 + T2;
 485                 }
 486 
 487         for (;i<80;i++)
 488                 {
 489                 s0 = X[(i+1)&0x0f]; s0 = sigma0(s0);
 490                 s1 = X[(i+14)&0x0f];        s1 = sigma1(s1);
 491 
 492                 T1 = X[i&0xf] += s0 + s1 + X[(i+9)&0xf];
 493                 T1 += h + Sigma1(e) + Ch(e,f,g) + K512[i];
 494                 T2 = Sigma0(a) + Maj(a,b,c);
 495                 h = g;  g = f;  f = e;  e = d + T1;
 496                 d = c;  c = b;  b = a;  a = T1 + T2;
 497                 }
 498 
 499         ctx->h[0] += a;      ctx->h[1] += b;      ctx->h[2] += c;      ctx->h[3] += d;
 500         ctx->h[4] += e;      ctx->h[5] += f;      ctx->h[6] += g;      ctx->h[7] += h;
 501 
 502                         W+=SHA_LBLOCK;
 503                         }
 504         }
 505 
 506 #else
 507 
 508 #define ROUND_00_15(i,a,b,c,d,e,f,g,h)          do {    \
 509         T1 += h + Sigma1(e) + Ch(e,f,g) + K512[i];      \
 510         h = Sigma0(a) + Maj(a,b,c);                     \
 511         d += T1;        h += T1;                } while (0)
 512 
 513 #define ROUND_16_80(i,j,a,b,c,d,e,f,g,h,X)      do {    \
 514         s0 = X[(j+1)&0x0f]; s0 = sigma0(s0);        \
 515         s1 = X[(j+14)&0x0f];        s1 = sigma1(s1);        \
 516         T1 = X[(j)&0x0f] += s0 + s1 + X[(j+9)&0x0f];    \
 517         ROUND_00_15(i+j,a,b,c,d,e,f,g,h);               } while (0)
 518 
 519 static void sha512_block_data_order (SHA512_CTX *ctx, const void *in, size_t num)
 520         {
 521         const SHA_LONG64 *W=in;
 522         SHA_LONG64      a,b,c,d,e,f,g,h,s0,s1,T1;
 523         SHA_LONG64      X[16];
 524         int i;
 525 
 526                         while (num--) {
 527 
 528         a = ctx->h[0];       b = ctx->h[1];       c = ctx->h[2];       d = ctx->h[3];
 529         e = ctx->h[4];       f = ctx->h[5];       g = ctx->h[6];       h = ctx->h[7];
 530 
 531 #ifdef B_ENDIAN
 532         T1 = X[0] = W[0];       ROUND_00_15(0,a,b,c,d,e,f,g,h);
 533         T1 = X[1] = W[1];       ROUND_00_15(1,h,a,b,c,d,e,f,g);
 534         T1 = X[2] = W[2];       ROUND_00_15(2,g,h,a,b,c,d,e,f);
 535         T1 = X[3] = W[3];       ROUND_00_15(3,f,g,h,a,b,c,d,e);
 536         T1 = X[4] = W[4];       ROUND_00_15(4,e,f,g,h,a,b,c,d);
 537         T1 = X[5] = W[5];       ROUND_00_15(5,d,e,f,g,h,a,b,c);
 538         T1 = X[6] = W[6];       ROUND_00_15(6,c,d,e,f,g,h,a,b);
 539         T1 = X[7] = W[7];       ROUND_00_15(7,b,c,d,e,f,g,h,a);
 540         T1 = X[8] = W[8];       ROUND_00_15(8,a,b,c,d,e,f,g,h);
 541         T1 = X[9] = W[9];       ROUND_00_15(9,h,a,b,c,d,e,f,g);
 542         T1 = X[10] = W[10];     ROUND_00_15(10,g,h,a,b,c,d,e,f);
 543         T1 = X[11] = W[11];     ROUND_00_15(11,f,g,h,a,b,c,d,e);
 544         T1 = X[12] = W[12];     ROUND_00_15(12,e,f,g,h,a,b,c,d);
 545         T1 = X[13] = W[13];     ROUND_00_15(13,d,e,f,g,h,a,b,c);
 546         T1 = X[14] = W[14];     ROUND_00_15(14,c,d,e,f,g,h,a,b);
 547         T1 = X[15] = W[15];     ROUND_00_15(15,b,c,d,e,f,g,h,a);
 548 #else
 549         T1 = X[0]  = PULL64(W[0]);      ROUND_00_15(0,a,b,c,d,e,f,g,h);
 550         T1 = X[1]  = PULL64(W[1]);      ROUND_00_15(1,h,a,b,c,d,e,f,g);
 551         T1 = X[2]  = PULL64(W[2]);      ROUND_00_15(2,g,h,a,b,c,d,e,f);
 552         T1 = X[3]  = PULL64(W[3]);      ROUND_00_15(3,f,g,h,a,b,c,d,e);
 553         T1 = X[4]  = PULL64(W[4]);      ROUND_00_15(4,e,f,g,h,a,b,c,d);
 554         T1 = X[5]  = PULL64(W[5]);      ROUND_00_15(5,d,e,f,g,h,a,b,c);
 555         T1 = X[6]  = PULL64(W[6]);      ROUND_00_15(6,c,d,e,f,g,h,a,b);
 556         T1 = X[7]  = PULL64(W[7]);      ROUND_00_15(7,b,c,d,e,f,g,h,a);
 557         T1 = X[8]  = PULL64(W[8]);      ROUND_00_15(8,a,b,c,d,e,f,g,h);
 558         T1 = X[9]  = PULL64(W[9]);      ROUND_00_15(9,h,a,b,c,d,e,f,g);
 559         T1 = X[10] = PULL64(W[10]);     ROUND_00_15(10,g,h,a,b,c,d,e,f);
 560         T1 = X[11] = PULL64(W[11]);     ROUND_00_15(11,f,g,h,a,b,c,d,e);
 561         T1 = X[12] = PULL64(W[12]);     ROUND_00_15(12,e,f,g,h,a,b,c,d);
 562         T1 = X[13] = PULL64(W[13]);     ROUND_00_15(13,d,e,f,g,h,a,b,c);
 563         T1 = X[14] = PULL64(W[14]);     ROUND_00_15(14,c,d,e,f,g,h,a,b);
 564         T1 = X[15] = PULL64(W[15]);     ROUND_00_15(15,b,c,d,e,f,g,h,a);
 565 #endif
 566 
 567         for (i=16;i<80;i+=16)
 568                 {
 569                 ROUND_16_80(i, 0,a,b,c,d,e,f,g,h,X);
 570                 ROUND_16_80(i, 1,h,a,b,c,d,e,f,g,X);
 571                 ROUND_16_80(i, 2,g,h,a,b,c,d,e,f,X);
 572                 ROUND_16_80(i, 3,f,g,h,a,b,c,d,e,X);
 573                 ROUND_16_80(i, 4,e,f,g,h,a,b,c,d,X);
 574                 ROUND_16_80(i, 5,d,e,f,g,h,a,b,c,X);
 575                 ROUND_16_80(i, 6,c,d,e,f,g,h,a,b,X);
 576                 ROUND_16_80(i, 7,b,c,d,e,f,g,h,a,X);
 577                 ROUND_16_80(i, 8,a,b,c,d,e,f,g,h,X);
 578                 ROUND_16_80(i, 9,h,a,b,c,d,e,f,g,X);
 579                 ROUND_16_80(i,10,g,h,a,b,c,d,e,f,X);
 580                 ROUND_16_80(i,11,f,g,h,a,b,c,d,e,X);
 581                 ROUND_16_80(i,12,e,f,g,h,a,b,c,d,X);
 582                 ROUND_16_80(i,13,d,e,f,g,h,a,b,c,X);
 583                 ROUND_16_80(i,14,c,d,e,f,g,h,a,b,X);
 584                 ROUND_16_80(i,15,b,c,d,e,f,g,h,a,X);
 585                 }
 586 
 587         ctx->h[0] += a;      ctx->h[1] += b;      ctx->h[2] += c;      ctx->h[3] += d;
 588         ctx->h[4] += e;      ctx->h[5] += f;      ctx->h[6] += g;      ctx->h[7] += h;
 589 
 590                         W+=SHA_LBLOCK;
 591                         }
 592         }
 593 
 594 #endif
 595 
 596 #endif /* SHA512_ASM */
 597 
 598 #else /* !OPENSSL_NO_SHA512 */
 599 
 600 #if defined(PEDANTIC) || defined(__DECC) || defined(OPENSSL_SYS_MACOSX)
 601 static void *dummy=&dummy;
 602 #endif
 603 
 604 #endif /* !OPENSSL_NO_SHA512 */