17c478bd9Sstevel@tonic-gate /* 2*8de5c4f4SDan OpenSolaris Anderson * Copyright 2009 Sun Microsystems, Inc. All rights reserved. 37c478bd9Sstevel@tonic-gate * Use is subject to license terms. 47c478bd9Sstevel@tonic-gate */ 57c478bd9Sstevel@tonic-gate 67c478bd9Sstevel@tonic-gate /* 77c478bd9Sstevel@tonic-gate * The basic framework for this code came from the reference 87c478bd9Sstevel@tonic-gate * implementation for MD5. That implementation is Copyright (C) 97c478bd9Sstevel@tonic-gate * 1991-2, RSA Data Security, Inc. Created 1991. All rights reserved. 107c478bd9Sstevel@tonic-gate * 117c478bd9Sstevel@tonic-gate * License to copy and use this software is granted provided that it 127c478bd9Sstevel@tonic-gate * is identified as the "RSA Data Security, Inc. MD5 Message-Digest 137c478bd9Sstevel@tonic-gate * Algorithm" in all material mentioning or referencing this software 147c478bd9Sstevel@tonic-gate * or this function. 157c478bd9Sstevel@tonic-gate * 167c478bd9Sstevel@tonic-gate * License is also granted to make and use derivative works provided 177c478bd9Sstevel@tonic-gate * that such works are identified as "derived from the RSA Data 187c478bd9Sstevel@tonic-gate * Security, Inc. MD5 Message-Digest Algorithm" in all material 197c478bd9Sstevel@tonic-gate * mentioning or referencing the derived work. 207c478bd9Sstevel@tonic-gate * 217c478bd9Sstevel@tonic-gate * RSA Data Security, Inc. makes no representations concerning either 227c478bd9Sstevel@tonic-gate * the merchantability of this software or the suitability of this 237c478bd9Sstevel@tonic-gate * software for any particular purpose. It is provided "as is" 247c478bd9Sstevel@tonic-gate * without express or implied warranty of any kind. 257c478bd9Sstevel@tonic-gate * 267c478bd9Sstevel@tonic-gate * These notices must be retained in any copies of any part of this 277c478bd9Sstevel@tonic-gate * documentation and/or software. 
287c478bd9Sstevel@tonic-gate * 297c478bd9Sstevel@tonic-gate * NOTE: Cleaned-up and optimized, version of SHA1, based on the FIPS 180-1 304b56a003SDaniel Anderson * standard, available at http://www.itl.nist.gov/fipspubs/fip180-1.htm 317c478bd9Sstevel@tonic-gate * Not as fast as one would like -- further optimizations are encouraged 327c478bd9Sstevel@tonic-gate * and appreciated. 337c478bd9Sstevel@tonic-gate */ 347c478bd9Sstevel@tonic-gate 35*8de5c4f4SDan OpenSolaris Anderson #ifndef _KERNEL 36*8de5c4f4SDan OpenSolaris Anderson #include <stdint.h> 37*8de5c4f4SDan OpenSolaris Anderson #include <strings.h> 38*8de5c4f4SDan OpenSolaris Anderson #include <stdlib.h> 39*8de5c4f4SDan OpenSolaris Anderson #include <errno.h> 40*8de5c4f4SDan OpenSolaris Anderson #include <sys/systeminfo.h> 41*8de5c4f4SDan OpenSolaris Anderson #endif /* !_KERNEL */ 42*8de5c4f4SDan OpenSolaris Anderson 437c478bd9Sstevel@tonic-gate #include <sys/types.h> 447c478bd9Sstevel@tonic-gate #include <sys/param.h> 457c478bd9Sstevel@tonic-gate #include <sys/systm.h> 467c478bd9Sstevel@tonic-gate #include <sys/sysmacros.h> 477c478bd9Sstevel@tonic-gate #include <sys/sha1.h> 487c478bd9Sstevel@tonic-gate #include <sys/sha1_consts.h> 497c478bd9Sstevel@tonic-gate 504b56a003SDaniel Anderson #ifdef _LITTLE_ENDIAN 514b56a003SDaniel Anderson #include <sys/byteorder.h> 524b56a003SDaniel Anderson #define HAVE_HTONL 534b56a003SDaniel Anderson #endif 544b56a003SDaniel Anderson 55734b6a94Sdarrenm static void Encode(uint8_t *, const uint32_t *, size_t); 56734b6a94Sdarrenm 57734b6a94Sdarrenm #if defined(__sparc) 58734b6a94Sdarrenm 59734b6a94Sdarrenm #define SHA1_TRANSFORM(ctx, in) \ 60734b6a94Sdarrenm SHA1Transform((ctx)->state[0], (ctx)->state[1], (ctx)->state[2], \ 61734b6a94Sdarrenm (ctx)->state[3], (ctx)->state[4], (ctx), (in)) 62734b6a94Sdarrenm 637c478bd9Sstevel@tonic-gate static void SHA1Transform(uint32_t, uint32_t, uint32_t, uint32_t, uint32_t, 647c478bd9Sstevel@tonic-gate SHA1_CTX *, const uint8_t *); 
657c478bd9Sstevel@tonic-gate 66321502cdSda73024 #elif defined(__amd64) 67321502cdSda73024 68321502cdSda73024 #define SHA1_TRANSFORM(ctx, in) sha1_block_data_order((ctx), (in), 1) 69321502cdSda73024 #define SHA1_TRANSFORM_BLOCKS(ctx, in, num) sha1_block_data_order((ctx), \ 70321502cdSda73024 (in), (num)) 71321502cdSda73024 72321502cdSda73024 void sha1_block_data_order(SHA1_CTX *ctx, const void *inpp, size_t num_blocks); 73321502cdSda73024 74734b6a94Sdarrenm #else 75734b6a94Sdarrenm 76734b6a94Sdarrenm #define SHA1_TRANSFORM(ctx, in) SHA1Transform((ctx), (in)) 77734b6a94Sdarrenm 78734b6a94Sdarrenm static void SHA1Transform(SHA1_CTX *, const uint8_t *); 79734b6a94Sdarrenm 80734b6a94Sdarrenm #endif 81734b6a94Sdarrenm 82734b6a94Sdarrenm 837c478bd9Sstevel@tonic-gate static uint8_t PADDING[64] = { 0x80, /* all zeros */ }; 847c478bd9Sstevel@tonic-gate 857c478bd9Sstevel@tonic-gate /* 867c478bd9Sstevel@tonic-gate * F, G, and H are the basic SHA1 functions. 877c478bd9Sstevel@tonic-gate */ 887c478bd9Sstevel@tonic-gate #define F(b, c, d) (((b) & (c)) | ((~b) & (d))) 897c478bd9Sstevel@tonic-gate #define G(b, c, d) ((b) ^ (c) ^ (d)) 90734b6a94Sdarrenm #define H(b, c, d) (((b) & (c)) | (((b)|(c)) & (d))) 917c478bd9Sstevel@tonic-gate 927c478bd9Sstevel@tonic-gate /* 937c478bd9Sstevel@tonic-gate * ROTATE_LEFT rotates x left n bits. 
947c478bd9Sstevel@tonic-gate */ 95734b6a94Sdarrenm 96734b6a94Sdarrenm #if defined(__GNUC__) && defined(_LP64) 97734b6a94Sdarrenm static __inline__ uint64_t 98734b6a94Sdarrenm ROTATE_LEFT(uint64_t value, uint32_t n) 99734b6a94Sdarrenm { 100734b6a94Sdarrenm uint32_t t32; 101734b6a94Sdarrenm 102734b6a94Sdarrenm t32 = (uint32_t)value; 103734b6a94Sdarrenm return ((t32 << n) | (t32 >> (32 - n))); 104734b6a94Sdarrenm } 105734b6a94Sdarrenm 106734b6a94Sdarrenm #else 107734b6a94Sdarrenm 1087c478bd9Sstevel@tonic-gate #define ROTATE_LEFT(x, n) \ 1097c478bd9Sstevel@tonic-gate (((x) << (n)) | ((x) >> ((sizeof (x) * NBBY)-(n)))) 1107c478bd9Sstevel@tonic-gate 111734b6a94Sdarrenm #endif 1127c478bd9Sstevel@tonic-gate 1137c478bd9Sstevel@tonic-gate 1147c478bd9Sstevel@tonic-gate /* 1157c478bd9Sstevel@tonic-gate * SHA1Init() 1167c478bd9Sstevel@tonic-gate * 1177c478bd9Sstevel@tonic-gate * purpose: initializes the sha1 context and begins and sha1 digest operation 1187c478bd9Sstevel@tonic-gate * input: SHA1_CTX * : the context to initializes. 1197c478bd9Sstevel@tonic-gate * output: void 1207c478bd9Sstevel@tonic-gate */ 1217c478bd9Sstevel@tonic-gate 1227c478bd9Sstevel@tonic-gate void 1237c478bd9Sstevel@tonic-gate SHA1Init(SHA1_CTX *ctx) 1247c478bd9Sstevel@tonic-gate { 1257c478bd9Sstevel@tonic-gate ctx->count[0] = ctx->count[1] = 0; 1267c478bd9Sstevel@tonic-gate 1277c478bd9Sstevel@tonic-gate /* 1287c478bd9Sstevel@tonic-gate * load magic initialization constants. Tell lint 1297c478bd9Sstevel@tonic-gate * that these constants are unsigned by using U. 
1307c478bd9Sstevel@tonic-gate */ 1317c478bd9Sstevel@tonic-gate 1327c478bd9Sstevel@tonic-gate ctx->state[0] = 0x67452301U; 1337c478bd9Sstevel@tonic-gate ctx->state[1] = 0xefcdab89U; 1347c478bd9Sstevel@tonic-gate ctx->state[2] = 0x98badcfeU; 1357c478bd9Sstevel@tonic-gate ctx->state[3] = 0x10325476U; 1367c478bd9Sstevel@tonic-gate ctx->state[4] = 0xc3d2e1f0U; 1377c478bd9Sstevel@tonic-gate } 1387c478bd9Sstevel@tonic-gate 1397c478bd9Sstevel@tonic-gate #ifdef VIS_SHA1 1407c478bd9Sstevel@tonic-gate #ifdef _KERNEL 1417c478bd9Sstevel@tonic-gate 1427c478bd9Sstevel@tonic-gate #include <sys/regset.h> 1437c478bd9Sstevel@tonic-gate #include <sys/vis.h> 14415b9cbbcSkrishna #include <sys/fpu/fpusystm.h> 1457c478bd9Sstevel@tonic-gate 1467c478bd9Sstevel@tonic-gate /* the alignment for block stores to save fp registers */ 1477c478bd9Sstevel@tonic-gate #define VIS_ALIGN (64) 1487c478bd9Sstevel@tonic-gate 1497c478bd9Sstevel@tonic-gate extern int sha1_savefp(kfpu_t *, int); 1507c478bd9Sstevel@tonic-gate extern void sha1_restorefp(kfpu_t *); 1517c478bd9Sstevel@tonic-gate 1527c478bd9Sstevel@tonic-gate uint32_t vis_sha1_svfp_threshold = 128; 1537c478bd9Sstevel@tonic-gate 1547c478bd9Sstevel@tonic-gate #endif /* _KERNEL */ 1557c478bd9Sstevel@tonic-gate 1567c478bd9Sstevel@tonic-gate /* 1577c478bd9Sstevel@tonic-gate * VIS SHA-1 consts. 
1587c478bd9Sstevel@tonic-gate */ 1597c478bd9Sstevel@tonic-gate static uint64_t VIS[] = { 1604cc1ac68Skrishna 0x8000000080000000ULL, 1614cc1ac68Skrishna 0x0002000200020002ULL, 1624cc1ac68Skrishna 0x5a8279996ed9eba1ULL, 1634cc1ac68Skrishna 0x8f1bbcdcca62c1d6ULL, 1644cc1ac68Skrishna 0x012389ab456789abULL}; 1657c478bd9Sstevel@tonic-gate 166734b6a94Sdarrenm extern void SHA1TransformVIS(uint64_t *, uint32_t *, uint32_t *, uint64_t *); 1677c478bd9Sstevel@tonic-gate 1687c478bd9Sstevel@tonic-gate 1697c478bd9Sstevel@tonic-gate /* 1707c478bd9Sstevel@tonic-gate * SHA1Update() 1717c478bd9Sstevel@tonic-gate * 1727c478bd9Sstevel@tonic-gate * purpose: continues an sha1 digest operation, using the message block 1737c478bd9Sstevel@tonic-gate * to update the context. 1747c478bd9Sstevel@tonic-gate * input: SHA1_CTX * : the context to update 175734b6a94Sdarrenm * void * : the message block 176734b6a94Sdarrenm * size_t : the length of the message block in bytes 1777c478bd9Sstevel@tonic-gate * output: void 1787c478bd9Sstevel@tonic-gate */ 1797c478bd9Sstevel@tonic-gate 1807c478bd9Sstevel@tonic-gate void 181734b6a94Sdarrenm SHA1Update(SHA1_CTX *ctx, const void *inptr, size_t input_len) 1827c478bd9Sstevel@tonic-gate { 1837c478bd9Sstevel@tonic-gate uint32_t i, buf_index, buf_len; 1847c478bd9Sstevel@tonic-gate uint64_t X0[40], input64[8]; 185734b6a94Sdarrenm const uint8_t *input = inptr; 18615b9cbbcSkrishna #ifdef _KERNEL 18715b9cbbcSkrishna int usevis = 0; 188734b6a94Sdarrenm #else 189734b6a94Sdarrenm int usevis = 1; 19015b9cbbcSkrishna #endif /* _KERNEL */ 1917c478bd9Sstevel@tonic-gate 1927c478bd9Sstevel@tonic-gate /* check for noop */ 1937c478bd9Sstevel@tonic-gate if (input_len == 0) 1947c478bd9Sstevel@tonic-gate return; 1957c478bd9Sstevel@tonic-gate 1967c478bd9Sstevel@tonic-gate /* compute number of bytes mod 64 */ 1977c478bd9Sstevel@tonic-gate buf_index = (ctx->count[1] >> 3) & 0x3F; 1987c478bd9Sstevel@tonic-gate 1997c478bd9Sstevel@tonic-gate /* update number of bits */ 
2007c478bd9Sstevel@tonic-gate if ((ctx->count[1] += (input_len << 3)) < (input_len << 3)) 2017c478bd9Sstevel@tonic-gate ctx->count[0]++; 2027c478bd9Sstevel@tonic-gate 2037c478bd9Sstevel@tonic-gate ctx->count[0] += (input_len >> 29); 2047c478bd9Sstevel@tonic-gate 2057c478bd9Sstevel@tonic-gate buf_len = 64 - buf_index; 2067c478bd9Sstevel@tonic-gate 2077c478bd9Sstevel@tonic-gate /* transform as many times as possible */ 2087c478bd9Sstevel@tonic-gate i = 0; 2097c478bd9Sstevel@tonic-gate if (input_len >= buf_len) { 2107c478bd9Sstevel@tonic-gate #ifdef _KERNEL 2117c478bd9Sstevel@tonic-gate kfpu_t *fpu; 212734b6a94Sdarrenm if (fpu_exists) { 213734b6a94Sdarrenm uint8_t fpua[sizeof (kfpu_t) + GSR_SIZE + VIS_ALIGN]; 2147c478bd9Sstevel@tonic-gate uint32_t len = (input_len + buf_index) & ~0x3f; 2157c478bd9Sstevel@tonic-gate int svfp_ok; 2167c478bd9Sstevel@tonic-gate 2177c478bd9Sstevel@tonic-gate fpu = (kfpu_t *)P2ROUNDUP((uintptr_t)fpua, 64); 2187c478bd9Sstevel@tonic-gate svfp_ok = ((len >= vis_sha1_svfp_threshold) ? 1 : 0); 21915b9cbbcSkrishna usevis = fpu_exists && sha1_savefp(fpu, svfp_ok); 220734b6a94Sdarrenm } else { 221734b6a94Sdarrenm usevis = 0; 222734b6a94Sdarrenm } 2237c478bd9Sstevel@tonic-gate #endif /* _KERNEL */ 2247c478bd9Sstevel@tonic-gate 2257c478bd9Sstevel@tonic-gate /* 2267c478bd9Sstevel@tonic-gate * general optimization: 2277c478bd9Sstevel@tonic-gate * 2287c478bd9Sstevel@tonic-gate * only do initial bcopy() and SHA1Transform() if 2297c478bd9Sstevel@tonic-gate * buf_index != 0. if buf_index == 0, we're just 2307c478bd9Sstevel@tonic-gate * wasting our time doing the bcopy() since there 2317c478bd9Sstevel@tonic-gate * wasn't any data left over from a previous call to 2327c478bd9Sstevel@tonic-gate * SHA1Update(). 
2337c478bd9Sstevel@tonic-gate */ 2347c478bd9Sstevel@tonic-gate 2357c478bd9Sstevel@tonic-gate if (buf_index) { 2367c478bd9Sstevel@tonic-gate bcopy(input, &ctx->buf_un.buf8[buf_index], buf_len); 2377c478bd9Sstevel@tonic-gate if (usevis) { 2387c478bd9Sstevel@tonic-gate SHA1TransformVIS(X0, 239734b6a94Sdarrenm ctx->buf_un.buf32, 2407c478bd9Sstevel@tonic-gate &ctx->state[0], VIS); 2417c478bd9Sstevel@tonic-gate } else { 242734b6a94Sdarrenm SHA1_TRANSFORM(ctx, ctx->buf_un.buf8); 2437c478bd9Sstevel@tonic-gate } 2447c478bd9Sstevel@tonic-gate i = buf_len; 2457c478bd9Sstevel@tonic-gate } 2467c478bd9Sstevel@tonic-gate 2477c478bd9Sstevel@tonic-gate /* 2487c478bd9Sstevel@tonic-gate * VIS SHA-1: uses the VIS 1.0 instructions to accelerate 2497c478bd9Sstevel@tonic-gate * SHA-1 processing. This is achieved by "offloading" the 2507c478bd9Sstevel@tonic-gate * computation of the message schedule (MS) to the VIS units. 2517c478bd9Sstevel@tonic-gate * This allows the VIS computation of the message schedule 2527c478bd9Sstevel@tonic-gate * to be performed in parallel with the standard integer 2537c478bd9Sstevel@tonic-gate * processing of the remainder of the SHA-1 computation. 2547c478bd9Sstevel@tonic-gate * performance by up to around 1.37X, compared to an optimized 2557c478bd9Sstevel@tonic-gate * integer-only implementation. 
2567c478bd9Sstevel@tonic-gate * 2577c478bd9Sstevel@tonic-gate * The VIS implementation of SHA1Transform has a different API 2587c478bd9Sstevel@tonic-gate * to the standard integer version: 2597c478bd9Sstevel@tonic-gate * 2607c478bd9Sstevel@tonic-gate * void SHA1TransformVIS( 2617c478bd9Sstevel@tonic-gate * uint64_t *, // Pointer to MS for ith block 262734b6a94Sdarrenm * uint32_t *, // Pointer to ith block of message data 2637c478bd9Sstevel@tonic-gate * uint32_t *, // Pointer to SHA state i.e ctx->state 2647c478bd9Sstevel@tonic-gate * uint64_t *, // Pointer to various VIS constants 2657c478bd9Sstevel@tonic-gate * ) 2667c478bd9Sstevel@tonic-gate * 2677c478bd9Sstevel@tonic-gate * Note: the message data must by 4-byte aligned. 2687c478bd9Sstevel@tonic-gate * 2697c478bd9Sstevel@tonic-gate * Function requires VIS 1.0 support. 2707c478bd9Sstevel@tonic-gate * 2717c478bd9Sstevel@tonic-gate * Handling is provided to deal with arbitrary byte alingment 2727c478bd9Sstevel@tonic-gate * of the input data but the performance gains are reduced 2737c478bd9Sstevel@tonic-gate * for alignments other than 4-bytes. 
2747c478bd9Sstevel@tonic-gate */ 2757c478bd9Sstevel@tonic-gate if (usevis) { 276734b6a94Sdarrenm if (!IS_P2ALIGNED(&input[i], sizeof (uint32_t))) { 2777c478bd9Sstevel@tonic-gate /* 2787c478bd9Sstevel@tonic-gate * Main processing loop - input misaligned 2797c478bd9Sstevel@tonic-gate */ 2807c478bd9Sstevel@tonic-gate for (; i + 63 < input_len; i += 64) { 2817c478bd9Sstevel@tonic-gate bcopy(&input[i], input64, 64); 282321502cdSda73024 SHA1TransformVIS(X0, 283321502cdSda73024 (uint32_t *)input64, 2847c478bd9Sstevel@tonic-gate &ctx->state[0], VIS); 2857c478bd9Sstevel@tonic-gate } 2867c478bd9Sstevel@tonic-gate } else { 2877c478bd9Sstevel@tonic-gate /* 2887c478bd9Sstevel@tonic-gate * Main processing loop - input 8-byte aligned 2897c478bd9Sstevel@tonic-gate */ 2907c478bd9Sstevel@tonic-gate for (; i + 63 < input_len; i += 64) { 2917c478bd9Sstevel@tonic-gate SHA1TransformVIS(X0, 292734b6a94Sdarrenm /* LINTED E_BAD_PTR_CAST_ALIGN */ 2934b56a003SDaniel Anderson (uint32_t *)&input[i], /* CSTYLED */ 2947c478bd9Sstevel@tonic-gate &ctx->state[0], VIS); 2957c478bd9Sstevel@tonic-gate } 2967c478bd9Sstevel@tonic-gate 2977c478bd9Sstevel@tonic-gate } 2987c478bd9Sstevel@tonic-gate #ifdef _KERNEL 2997c478bd9Sstevel@tonic-gate sha1_restorefp(fpu); 3007c478bd9Sstevel@tonic-gate #endif /* _KERNEL */ 3017c478bd9Sstevel@tonic-gate } else { 3027c478bd9Sstevel@tonic-gate for (; i + 63 < input_len; i += 64) { 303734b6a94Sdarrenm SHA1_TRANSFORM(ctx, &input[i]); 3047c478bd9Sstevel@tonic-gate } 3057c478bd9Sstevel@tonic-gate } 3067c478bd9Sstevel@tonic-gate 3077c478bd9Sstevel@tonic-gate /* 3087c478bd9Sstevel@tonic-gate * general optimization: 3097c478bd9Sstevel@tonic-gate * 3107c478bd9Sstevel@tonic-gate * if i and input_len are the same, return now instead 3117c478bd9Sstevel@tonic-gate * of calling bcopy(), since the bcopy() in this case 3127c478bd9Sstevel@tonic-gate * will be an expensive nop. 
3137c478bd9Sstevel@tonic-gate */ 3147c478bd9Sstevel@tonic-gate 3157c478bd9Sstevel@tonic-gate if (input_len == i) 3167c478bd9Sstevel@tonic-gate return; 3177c478bd9Sstevel@tonic-gate 3187c478bd9Sstevel@tonic-gate buf_index = 0; 3197c478bd9Sstevel@tonic-gate } 3207c478bd9Sstevel@tonic-gate 3217c478bd9Sstevel@tonic-gate /* buffer remaining input */ 3227c478bd9Sstevel@tonic-gate bcopy(&input[i], &ctx->buf_un.buf8[buf_index], input_len - i); 3237c478bd9Sstevel@tonic-gate } 3247c478bd9Sstevel@tonic-gate 3257c478bd9Sstevel@tonic-gate #else /* VIS_SHA1 */ 3267c478bd9Sstevel@tonic-gate 3277c478bd9Sstevel@tonic-gate void 328734b6a94Sdarrenm SHA1Update(SHA1_CTX *ctx, const void *inptr, size_t input_len) 3297c478bd9Sstevel@tonic-gate { 3307c478bd9Sstevel@tonic-gate uint32_t i, buf_index, buf_len; 331734b6a94Sdarrenm const uint8_t *input = inptr; 332321502cdSda73024 #if defined(__amd64) 333321502cdSda73024 uint32_t block_count; 334321502cdSda73024 #endif /* __amd64 */ 3357c478bd9Sstevel@tonic-gate 3367c478bd9Sstevel@tonic-gate /* check for noop */ 3377c478bd9Sstevel@tonic-gate if (input_len == 0) 3387c478bd9Sstevel@tonic-gate return; 3397c478bd9Sstevel@tonic-gate 3407c478bd9Sstevel@tonic-gate /* compute number of bytes mod 64 */ 3417c478bd9Sstevel@tonic-gate buf_index = (ctx->count[1] >> 3) & 0x3F; 3427c478bd9Sstevel@tonic-gate 3437c478bd9Sstevel@tonic-gate /* update number of bits */ 3447c478bd9Sstevel@tonic-gate if ((ctx->count[1] += (input_len << 3)) < (input_len << 3)) 3457c478bd9Sstevel@tonic-gate ctx->count[0]++; 3467c478bd9Sstevel@tonic-gate 3477c478bd9Sstevel@tonic-gate ctx->count[0] += (input_len >> 29); 3487c478bd9Sstevel@tonic-gate 3497c478bd9Sstevel@tonic-gate buf_len = 64 - buf_index; 3507c478bd9Sstevel@tonic-gate 3517c478bd9Sstevel@tonic-gate /* transform as many times as possible */ 3527c478bd9Sstevel@tonic-gate i = 0; 3537c478bd9Sstevel@tonic-gate if (input_len >= buf_len) { 3547c478bd9Sstevel@tonic-gate 3557c478bd9Sstevel@tonic-gate /* 
3567c478bd9Sstevel@tonic-gate * general optimization: 3577c478bd9Sstevel@tonic-gate * 3587c478bd9Sstevel@tonic-gate * only do initial bcopy() and SHA1Transform() if 3597c478bd9Sstevel@tonic-gate * buf_index != 0. if buf_index == 0, we're just 3607c478bd9Sstevel@tonic-gate * wasting our time doing the bcopy() since there 3617c478bd9Sstevel@tonic-gate * wasn't any data left over from a previous call to 3627c478bd9Sstevel@tonic-gate * SHA1Update(). 3637c478bd9Sstevel@tonic-gate */ 3647c478bd9Sstevel@tonic-gate 3657c478bd9Sstevel@tonic-gate if (buf_index) { 3667c478bd9Sstevel@tonic-gate bcopy(input, &ctx->buf_un.buf8[buf_index], buf_len); 367734b6a94Sdarrenm SHA1_TRANSFORM(ctx, ctx->buf_un.buf8); 3687c478bd9Sstevel@tonic-gate i = buf_len; 3697c478bd9Sstevel@tonic-gate } 3707c478bd9Sstevel@tonic-gate 371321502cdSda73024 #if !defined(__amd64) 3727c478bd9Sstevel@tonic-gate for (; i + 63 < input_len; i += 64) 373734b6a94Sdarrenm SHA1_TRANSFORM(ctx, &input[i]); 374321502cdSda73024 #else 375321502cdSda73024 block_count = (input_len - i) >> 6; 376321502cdSda73024 if (block_count > 0) { 377321502cdSda73024 SHA1_TRANSFORM_BLOCKS(ctx, &input[i], block_count); 378321502cdSda73024 i += block_count << 6; 379321502cdSda73024 } 380321502cdSda73024 #endif /* !__amd64 */ 3817c478bd9Sstevel@tonic-gate 3827c478bd9Sstevel@tonic-gate /* 3837c478bd9Sstevel@tonic-gate * general optimization: 3847c478bd9Sstevel@tonic-gate * 3857c478bd9Sstevel@tonic-gate * if i and input_len are the same, return now instead 3867c478bd9Sstevel@tonic-gate * of calling bcopy(), since the bcopy() in this case 3877c478bd9Sstevel@tonic-gate * will be an expensive nop. 
3887c478bd9Sstevel@tonic-gate */ 3897c478bd9Sstevel@tonic-gate 3907c478bd9Sstevel@tonic-gate if (input_len == i) 3917c478bd9Sstevel@tonic-gate return; 3927c478bd9Sstevel@tonic-gate 3937c478bd9Sstevel@tonic-gate buf_index = 0; 3947c478bd9Sstevel@tonic-gate } 3957c478bd9Sstevel@tonic-gate 3967c478bd9Sstevel@tonic-gate /* buffer remaining input */ 3977c478bd9Sstevel@tonic-gate bcopy(&input[i], &ctx->buf_un.buf8[buf_index], input_len - i); 3987c478bd9Sstevel@tonic-gate } 3997c478bd9Sstevel@tonic-gate 4007c478bd9Sstevel@tonic-gate #endif /* VIS_SHA1 */ 4017c478bd9Sstevel@tonic-gate 4027c478bd9Sstevel@tonic-gate /* 4037c478bd9Sstevel@tonic-gate * SHA1Final() 4047c478bd9Sstevel@tonic-gate * 4057c478bd9Sstevel@tonic-gate * purpose: ends an sha1 digest operation, finalizing the message digest and 4067c478bd9Sstevel@tonic-gate * zeroing the context. 407321502cdSda73024 * input: uchar_t * : A buffer to store the digest. 4085151fb12Sdarrenm * : The function actually uses void* because many 4095151fb12Sdarrenm * : callers pass things other than uchar_t here. 4107c478bd9Sstevel@tonic-gate * SHA1_CTX * : the context to finalize, save, and zero 4117c478bd9Sstevel@tonic-gate * output: void 4127c478bd9Sstevel@tonic-gate */ 4137c478bd9Sstevel@tonic-gate 4147c478bd9Sstevel@tonic-gate void 415734b6a94Sdarrenm SHA1Final(void *digest, SHA1_CTX *ctx) 4167c478bd9Sstevel@tonic-gate { 4177c478bd9Sstevel@tonic-gate uint8_t bitcount_be[sizeof (ctx->count)]; 4187c478bd9Sstevel@tonic-gate uint32_t index = (ctx->count[1] >> 3) & 0x3f; 4197c478bd9Sstevel@tonic-gate 4207c478bd9Sstevel@tonic-gate /* store bit count, big endian */ 4217c478bd9Sstevel@tonic-gate Encode(bitcount_be, ctx->count, sizeof (bitcount_be)); 4227c478bd9Sstevel@tonic-gate 4237c478bd9Sstevel@tonic-gate /* pad out to 56 mod 64 */ 4247c478bd9Sstevel@tonic-gate SHA1Update(ctx, PADDING, ((index < 56) ? 
56 : 120) - index); 4257c478bd9Sstevel@tonic-gate 4267c478bd9Sstevel@tonic-gate /* append length (before padding) */ 4277c478bd9Sstevel@tonic-gate SHA1Update(ctx, bitcount_be, sizeof (bitcount_be)); 4287c478bd9Sstevel@tonic-gate 4297c478bd9Sstevel@tonic-gate /* store state in digest */ 4307c478bd9Sstevel@tonic-gate Encode(digest, ctx->state, sizeof (ctx->state)); 431673007c6Sdarrenm 432673007c6Sdarrenm /* zeroize sensitive information */ 433673007c6Sdarrenm bzero(ctx, sizeof (*ctx)); 4347c478bd9Sstevel@tonic-gate } 4357c478bd9Sstevel@tonic-gate 436321502cdSda73024 437321502cdSda73024 #if !defined(__amd64) 438321502cdSda73024 439734b6a94Sdarrenm typedef uint32_t sha1word; 440734b6a94Sdarrenm 4417c478bd9Sstevel@tonic-gate /* 4427c478bd9Sstevel@tonic-gate * sparc optimization: 4437c478bd9Sstevel@tonic-gate * 4447c478bd9Sstevel@tonic-gate * on the sparc, we can load big endian 32-bit data easily. note that 4457c478bd9Sstevel@tonic-gate * special care must be taken to ensure the address is 32-bit aligned. 4467c478bd9Sstevel@tonic-gate * in the interest of speed, we don't check to make sure, since 4477c478bd9Sstevel@tonic-gate * careful programming can guarantee this for us. 
4487c478bd9Sstevel@tonic-gate */ 4497c478bd9Sstevel@tonic-gate 4507c478bd9Sstevel@tonic-gate #if defined(_BIG_ENDIAN) 4517c478bd9Sstevel@tonic-gate #define LOAD_BIG_32(addr) (*(uint32_t *)(addr)) 4527c478bd9Sstevel@tonic-gate 4534b56a003SDaniel Anderson #elif defined(HAVE_HTONL) 4544b56a003SDaniel Anderson #define LOAD_BIG_32(addr) htonl(*((uint32_t *)(addr))) 4557c478bd9Sstevel@tonic-gate 4564b56a003SDaniel Anderson #else 457734b6a94Sdarrenm /* little endian -- will work on big endian, but slowly */ 4587c478bd9Sstevel@tonic-gate #define LOAD_BIG_32(addr) \ 4597c478bd9Sstevel@tonic-gate (((addr)[0] << 24) | ((addr)[1] << 16) | ((addr)[2] << 8) | (addr)[3]) 4604b56a003SDaniel Anderson #endif /* _BIG_ENDIAN */ 461734b6a94Sdarrenm 462734b6a94Sdarrenm /* 463734b6a94Sdarrenm * SHA1Transform() 464734b6a94Sdarrenm */ 465734b6a94Sdarrenm #if defined(W_ARRAY) 466734b6a94Sdarrenm #define W(n) w[n] 467734b6a94Sdarrenm #else /* !defined(W_ARRAY) */ 468734b6a94Sdarrenm #define W(n) w_ ## n 469734b6a94Sdarrenm #endif /* !defined(W_ARRAY) */ 470734b6a94Sdarrenm 471734b6a94Sdarrenm 472734b6a94Sdarrenm #if defined(__sparc) 4737c478bd9Sstevel@tonic-gate 4747c478bd9Sstevel@tonic-gate /* 4757c478bd9Sstevel@tonic-gate * sparc register window optimization: 4767c478bd9Sstevel@tonic-gate * 4777c478bd9Sstevel@tonic-gate * `a', `b', `c', `d', and `e' are passed into SHA1Transform 4787c478bd9Sstevel@tonic-gate * explicitly since it increases the number of registers available to 4797c478bd9Sstevel@tonic-gate * the compiler. under this scheme, these variables can be held in 4807c478bd9Sstevel@tonic-gate * %i0 - %i4, which leaves more local and out registers available. 
4817c478bd9Sstevel@tonic-gate * 4827c478bd9Sstevel@tonic-gate * purpose: sha1 transformation -- updates the digest based on `block' 4837c478bd9Sstevel@tonic-gate * input: uint32_t : bytes 1 - 4 of the digest 4847c478bd9Sstevel@tonic-gate * uint32_t : bytes 5 - 8 of the digest 4857c478bd9Sstevel@tonic-gate * uint32_t : bytes 9 - 12 of the digest 4867c478bd9Sstevel@tonic-gate * uint32_t : bytes 12 - 16 of the digest 4877c478bd9Sstevel@tonic-gate * uint32_t : bytes 16 - 20 of the digest 4887c478bd9Sstevel@tonic-gate * SHA1_CTX * : the context to update 4897c478bd9Sstevel@tonic-gate * uint8_t [64]: the block to use to update the digest 4907c478bd9Sstevel@tonic-gate * output: void 4917c478bd9Sstevel@tonic-gate */ 4927c478bd9Sstevel@tonic-gate 4937c478bd9Sstevel@tonic-gate void 4947c478bd9Sstevel@tonic-gate SHA1Transform(uint32_t a, uint32_t b, uint32_t c, uint32_t d, uint32_t e, 4957c478bd9Sstevel@tonic-gate SHA1_CTX *ctx, const uint8_t blk[64]) 4967c478bd9Sstevel@tonic-gate { 4977c478bd9Sstevel@tonic-gate /* 4987c478bd9Sstevel@tonic-gate * sparc optimization: 4997c478bd9Sstevel@tonic-gate * 5007c478bd9Sstevel@tonic-gate * while it is somewhat counter-intuitive, on sparc, it is 5017c478bd9Sstevel@tonic-gate * more efficient to place all the constants used in this 5027c478bd9Sstevel@tonic-gate * function in an array and load the values out of the array 5037c478bd9Sstevel@tonic-gate * than to manually load the constants. this is because 5047c478bd9Sstevel@tonic-gate * setting a register to a 32-bit value takes two ops in most 5057c478bd9Sstevel@tonic-gate * cases: a `sethi' and an `or', but loading a 32-bit value 5067c478bd9Sstevel@tonic-gate * from memory only takes one `ld' (or `lduw' on v9). while 5077c478bd9Sstevel@tonic-gate * this increases memory usage, the compiler can find enough 5087c478bd9Sstevel@tonic-gate * other things to do while waiting to keep the pipeline does 5097c478bd9Sstevel@tonic-gate * not stall. 
additionally, it is likely that many of these 5107c478bd9Sstevel@tonic-gate * constants are cached so that later accesses do not even go 5117c478bd9Sstevel@tonic-gate * out to the bus. 5127c478bd9Sstevel@tonic-gate * 5137c478bd9Sstevel@tonic-gate * this array is declared `static' to keep the compiler from 5147c478bd9Sstevel@tonic-gate * having to bcopy() this array onto the stack frame of 5157c478bd9Sstevel@tonic-gate * SHA1Transform() each time it is called -- which is 5167c478bd9Sstevel@tonic-gate * unacceptably expensive. 5177c478bd9Sstevel@tonic-gate * 5187c478bd9Sstevel@tonic-gate * the `const' is to ensure that callers are good citizens and 5197c478bd9Sstevel@tonic-gate * do not try to munge the array. since these routines are 5207c478bd9Sstevel@tonic-gate * going to be called from inside multithreaded kernelland, 5217c478bd9Sstevel@tonic-gate * this is a good safety check. -- `sha1_consts' will end up in 5227c478bd9Sstevel@tonic-gate * .rodata. 5237c478bd9Sstevel@tonic-gate * 5247c478bd9Sstevel@tonic-gate * unfortunately, loading from an array in this manner hurts 5254b56a003SDaniel Anderson * performance under Intel. So, there is a macro, 5267c478bd9Sstevel@tonic-gate * SHA1_CONST(), used in SHA1Transform(), that either expands to 5277c478bd9Sstevel@tonic-gate * a reference to this array, or to the actual constant, 5287c478bd9Sstevel@tonic-gate * depending on what platform this code is compiled for. 5297c478bd9Sstevel@tonic-gate */ 5307c478bd9Sstevel@tonic-gate 5317c478bd9Sstevel@tonic-gate static const uint32_t sha1_consts[] = { 5324b56a003SDaniel Anderson SHA1_CONST_0, SHA1_CONST_1, SHA1_CONST_2, SHA1_CONST_3 5337c478bd9Sstevel@tonic-gate }; 5347c478bd9Sstevel@tonic-gate 5357c478bd9Sstevel@tonic-gate /* 5367c478bd9Sstevel@tonic-gate * general optimization: 5377c478bd9Sstevel@tonic-gate * 5387c478bd9Sstevel@tonic-gate * use individual integers instead of using an array. 
this is a 5397c478bd9Sstevel@tonic-gate * win, although the amount it wins by seems to vary quite a bit. 5407c478bd9Sstevel@tonic-gate */ 5417c478bd9Sstevel@tonic-gate 5427c478bd9Sstevel@tonic-gate uint32_t w_0, w_1, w_2, w_3, w_4, w_5, w_6, w_7; 5437c478bd9Sstevel@tonic-gate uint32_t w_8, w_9, w_10, w_11, w_12, w_13, w_14, w_15; 5447c478bd9Sstevel@tonic-gate 5457c478bd9Sstevel@tonic-gate /* 5467c478bd9Sstevel@tonic-gate * sparc optimization: 5477c478bd9Sstevel@tonic-gate * 5487c478bd9Sstevel@tonic-gate * if `block' is already aligned on a 4-byte boundary, use 5497c478bd9Sstevel@tonic-gate * LOAD_BIG_32() directly. otherwise, bcopy() into a 5507c478bd9Sstevel@tonic-gate * buffer that *is* aligned on a 4-byte boundary and then do 5517c478bd9Sstevel@tonic-gate * the LOAD_BIG_32() on that buffer. benchmarks have shown 5527c478bd9Sstevel@tonic-gate * that using the bcopy() is better than loading the bytes 5537c478bd9Sstevel@tonic-gate * individually and doing the endian-swap by hand. 5547c478bd9Sstevel@tonic-gate * 5557c478bd9Sstevel@tonic-gate * even though it's quite tempting to assign to do: 5567c478bd9Sstevel@tonic-gate * 5577c478bd9Sstevel@tonic-gate * blk = bcopy(ctx->buf_un.buf32, blk, sizeof (ctx->buf_un.buf32)); 5587c478bd9Sstevel@tonic-gate * 5597c478bd9Sstevel@tonic-gate * and only have one set of LOAD_BIG_32()'s, the compiler 5607c478bd9Sstevel@tonic-gate * *does not* like that, so please resist the urge. 5617c478bd9Sstevel@tonic-gate */ 5627c478bd9Sstevel@tonic-gate 5637c478bd9Sstevel@tonic-gate if ((uintptr_t)blk & 0x3) { /* not 4-byte aligned? 
*/ 5647c478bd9Sstevel@tonic-gate bcopy(blk, ctx->buf_un.buf32, sizeof (ctx->buf_un.buf32)); 5657c478bd9Sstevel@tonic-gate w_15 = LOAD_BIG_32(ctx->buf_un.buf32 + 15); 5667c478bd9Sstevel@tonic-gate w_14 = LOAD_BIG_32(ctx->buf_un.buf32 + 14); 5677c478bd9Sstevel@tonic-gate w_13 = LOAD_BIG_32(ctx->buf_un.buf32 + 13); 5687c478bd9Sstevel@tonic-gate w_12 = LOAD_BIG_32(ctx->buf_un.buf32 + 12); 5697c478bd9Sstevel@tonic-gate w_11 = LOAD_BIG_32(ctx->buf_un.buf32 + 11); 5707c478bd9Sstevel@tonic-gate w_10 = LOAD_BIG_32(ctx->buf_un.buf32 + 10); 5717c478bd9Sstevel@tonic-gate w_9 = LOAD_BIG_32(ctx->buf_un.buf32 + 9); 5727c478bd9Sstevel@tonic-gate w_8 = LOAD_BIG_32(ctx->buf_un.buf32 + 8); 5737c478bd9Sstevel@tonic-gate w_7 = LOAD_BIG_32(ctx->buf_un.buf32 + 7); 5747c478bd9Sstevel@tonic-gate w_6 = LOAD_BIG_32(ctx->buf_un.buf32 + 6); 5757c478bd9Sstevel@tonic-gate w_5 = LOAD_BIG_32(ctx->buf_un.buf32 + 5); 5767c478bd9Sstevel@tonic-gate w_4 = LOAD_BIG_32(ctx->buf_un.buf32 + 4); 5777c478bd9Sstevel@tonic-gate w_3 = LOAD_BIG_32(ctx->buf_un.buf32 + 3); 5787c478bd9Sstevel@tonic-gate w_2 = LOAD_BIG_32(ctx->buf_un.buf32 + 2); 5797c478bd9Sstevel@tonic-gate w_1 = LOAD_BIG_32(ctx->buf_un.buf32 + 1); 5807c478bd9Sstevel@tonic-gate w_0 = LOAD_BIG_32(ctx->buf_un.buf32 + 0); 5817c478bd9Sstevel@tonic-gate } else { 582*8de5c4f4SDan OpenSolaris Anderson /* LINTED E_BAD_PTR_CAST_ALIGN */ 5837c478bd9Sstevel@tonic-gate w_15 = LOAD_BIG_32(blk + 60); 584*8de5c4f4SDan OpenSolaris Anderson /* LINTED E_BAD_PTR_CAST_ALIGN */ 5857c478bd9Sstevel@tonic-gate w_14 = LOAD_BIG_32(blk + 56); 586*8de5c4f4SDan OpenSolaris Anderson /* LINTED E_BAD_PTR_CAST_ALIGN */ 5877c478bd9Sstevel@tonic-gate w_13 = LOAD_BIG_32(blk + 52); 588*8de5c4f4SDan OpenSolaris Anderson /* LINTED E_BAD_PTR_CAST_ALIGN */ 5897c478bd9Sstevel@tonic-gate w_12 = LOAD_BIG_32(blk + 48); 590*8de5c4f4SDan OpenSolaris Anderson /* LINTED E_BAD_PTR_CAST_ALIGN */ 5917c478bd9Sstevel@tonic-gate w_11 = LOAD_BIG_32(blk + 44); 592*8de5c4f4SDan OpenSolaris Anderson /* 
LINTED E_BAD_PTR_CAST_ALIGN */ 5937c478bd9Sstevel@tonic-gate w_10 = LOAD_BIG_32(blk + 40); 594*8de5c4f4SDan OpenSolaris Anderson /* LINTED E_BAD_PTR_CAST_ALIGN */ 5957c478bd9Sstevel@tonic-gate w_9 = LOAD_BIG_32(blk + 36); 596*8de5c4f4SDan OpenSolaris Anderson /* LINTED E_BAD_PTR_CAST_ALIGN */ 5977c478bd9Sstevel@tonic-gate w_8 = LOAD_BIG_32(blk + 32); 598*8de5c4f4SDan OpenSolaris Anderson /* LINTED E_BAD_PTR_CAST_ALIGN */ 5997c478bd9Sstevel@tonic-gate w_7 = LOAD_BIG_32(blk + 28); 600*8de5c4f4SDan OpenSolaris Anderson /* LINTED E_BAD_PTR_CAST_ALIGN */ 6017c478bd9Sstevel@tonic-gate w_6 = LOAD_BIG_32(blk + 24); 602*8de5c4f4SDan OpenSolaris Anderson /* LINTED E_BAD_PTR_CAST_ALIGN */ 6037c478bd9Sstevel@tonic-gate w_5 = LOAD_BIG_32(blk + 20); 604*8de5c4f4SDan OpenSolaris Anderson /* LINTED E_BAD_PTR_CAST_ALIGN */ 6057c478bd9Sstevel@tonic-gate w_4 = LOAD_BIG_32(blk + 16); 606*8de5c4f4SDan OpenSolaris Anderson /* LINTED E_BAD_PTR_CAST_ALIGN */ 6077c478bd9Sstevel@tonic-gate w_3 = LOAD_BIG_32(blk + 12); 608*8de5c4f4SDan OpenSolaris Anderson /* LINTED E_BAD_PTR_CAST_ALIGN */ 6097c478bd9Sstevel@tonic-gate w_2 = LOAD_BIG_32(blk + 8); 610*8de5c4f4SDan OpenSolaris Anderson /* LINTED E_BAD_PTR_CAST_ALIGN */ 6117c478bd9Sstevel@tonic-gate w_1 = LOAD_BIG_32(blk + 4); 612*8de5c4f4SDan OpenSolaris Anderson /* LINTED E_BAD_PTR_CAST_ALIGN */ 6137c478bd9Sstevel@tonic-gate w_0 = LOAD_BIG_32(blk + 0); 6147c478bd9Sstevel@tonic-gate } 615734b6a94Sdarrenm #else /* !defined(__sparc) */ 616734b6a94Sdarrenm 6174b56a003SDaniel Anderson void /* CSTYLED */ 618734b6a94Sdarrenm SHA1Transform(SHA1_CTX *ctx, const uint8_t blk[64]) 619734b6a94Sdarrenm { 6204b56a003SDaniel Anderson /* CSTYLED */ 621734b6a94Sdarrenm sha1word a = ctx->state[0]; 622734b6a94Sdarrenm sha1word b = ctx->state[1]; 623734b6a94Sdarrenm sha1word c = ctx->state[2]; 624734b6a94Sdarrenm sha1word d = ctx->state[3]; 625734b6a94Sdarrenm sha1word e = ctx->state[4]; 626734b6a94Sdarrenm 627734b6a94Sdarrenm #if defined(W_ARRAY) 
628734b6a94Sdarrenm sha1word w[16]; 629734b6a94Sdarrenm #else /* !defined(W_ARRAY) */ 630734b6a94Sdarrenm sha1word w_0, w_1, w_2, w_3, w_4, w_5, w_6, w_7; 631734b6a94Sdarrenm sha1word w_8, w_9, w_10, w_11, w_12, w_13, w_14, w_15; 632734b6a94Sdarrenm #endif /* !defined(W_ARRAY) */ 633734b6a94Sdarrenm 63425cc6a40SDaniel Anderson W(0) = LOAD_BIG_32((void *)(blk + 0)); 63525cc6a40SDaniel Anderson W(1) = LOAD_BIG_32((void *)(blk + 4)); 63625cc6a40SDaniel Anderson W(2) = LOAD_BIG_32((void *)(blk + 8)); 63725cc6a40SDaniel Anderson W(3) = LOAD_BIG_32((void *)(blk + 12)); 63825cc6a40SDaniel Anderson W(4) = LOAD_BIG_32((void *)(blk + 16)); 63925cc6a40SDaniel Anderson W(5) = LOAD_BIG_32((void *)(blk + 20)); 64025cc6a40SDaniel Anderson W(6) = LOAD_BIG_32((void *)(blk + 24)); 64125cc6a40SDaniel Anderson W(7) = LOAD_BIG_32((void *)(blk + 28)); 64225cc6a40SDaniel Anderson W(8) = LOAD_BIG_32((void *)(blk + 32)); 64325cc6a40SDaniel Anderson W(9) = LOAD_BIG_32((void *)(blk + 36)); 64425cc6a40SDaniel Anderson W(10) = LOAD_BIG_32((void *)(blk + 40)); 64525cc6a40SDaniel Anderson W(11) = LOAD_BIG_32((void *)(blk + 44)); 64625cc6a40SDaniel Anderson W(12) = LOAD_BIG_32((void *)(blk + 48)); 64725cc6a40SDaniel Anderson W(13) = LOAD_BIG_32((void *)(blk + 52)); 64825cc6a40SDaniel Anderson W(14) = LOAD_BIG_32((void *)(blk + 56)); 64925cc6a40SDaniel Anderson W(15) = LOAD_BIG_32((void *)(blk + 60)); 650734b6a94Sdarrenm 651734b6a94Sdarrenm #endif /* !defined(__sparc) */ 652734b6a94Sdarrenm 6537c478bd9Sstevel@tonic-gate /* 6547c478bd9Sstevel@tonic-gate * general optimization: 6557c478bd9Sstevel@tonic-gate * 6567c478bd9Sstevel@tonic-gate * even though this approach is described in the standard as 6577c478bd9Sstevel@tonic-gate * being slower algorithmically, it is 30-40% faster than the 6587c478bd9Sstevel@tonic-gate * "faster" version under SPARC, because this version has more 6597c478bd9Sstevel@tonic-gate * of the constraints specified at compile-time and uses fewer 6607c478bd9Sstevel@tonic-gate * 
variables (and therefore has better register utilization) 6617c478bd9Sstevel@tonic-gate * than its "speedier" brother. (i've tried both, trust me) 6627c478bd9Sstevel@tonic-gate * 6637c478bd9Sstevel@tonic-gate * for either method given in the spec, there is an "assignment" 6647c478bd9Sstevel@tonic-gate * phase where the following takes place: 6657c478bd9Sstevel@tonic-gate * 6667c478bd9Sstevel@tonic-gate * tmp = (main_computation); 6677c478bd9Sstevel@tonic-gate * e = d; d = c; c = rotate_left(b, 30); b = a; a = tmp; 6687c478bd9Sstevel@tonic-gate * 6697c478bd9Sstevel@tonic-gate * we can make the algorithm go faster by not doing this work, 6707c478bd9Sstevel@tonic-gate * but just pretending that `d' is now `e', etc. this works 6717c478bd9Sstevel@tonic-gate * really well and obviates the need for a temporary variable. 672321502cdSda73024 * however, we still explicitly perform the rotate action, 6737c478bd9Sstevel@tonic-gate * since it is cheaper on SPARC to do it once than to have to 6747c478bd9Sstevel@tonic-gate * do it over and over again. 
6757c478bd9Sstevel@tonic-gate */ 6767c478bd9Sstevel@tonic-gate 6777c478bd9Sstevel@tonic-gate /* round 1 */ 678734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + F(b, c, d) + e + W(0) + SHA1_CONST(0); /* 0 */ 6797c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 6807c478bd9Sstevel@tonic-gate 681734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + F(a, b, c) + d + W(1) + SHA1_CONST(0); /* 1 */ 6827c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 6837c478bd9Sstevel@tonic-gate 684734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + F(e, a, b) + c + W(2) + SHA1_CONST(0); /* 2 */ 6857c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 6867c478bd9Sstevel@tonic-gate 687734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + F(d, e, a) + b + W(3) + SHA1_CONST(0); /* 3 */ 6887c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 6897c478bd9Sstevel@tonic-gate 690734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + F(c, d, e) + a + W(4) + SHA1_CONST(0); /* 4 */ 6917c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 6927c478bd9Sstevel@tonic-gate 693734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + F(b, c, d) + e + W(5) + SHA1_CONST(0); /* 5 */ 6947c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 6957c478bd9Sstevel@tonic-gate 696734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + F(a, b, c) + d + W(6) + SHA1_CONST(0); /* 6 */ 6977c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 6987c478bd9Sstevel@tonic-gate 699734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + F(e, a, b) + c + W(7) + SHA1_CONST(0); /* 7 */ 7007c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7017c478bd9Sstevel@tonic-gate 702734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + F(d, e, a) + b + W(8) + SHA1_CONST(0); /* 8 */ 7037c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7047c478bd9Sstevel@tonic-gate 705734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + F(c, d, e) + a + W(9) + SHA1_CONST(0); /* 9 */ 7067c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 7077c478bd9Sstevel@tonic-gate 708734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + F(b, c, d) + e + W(10) + SHA1_CONST(0); /* 10 */ 7097c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 
30); 7107c478bd9Sstevel@tonic-gate 711734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + F(a, b, c) + d + W(11) + SHA1_CONST(0); /* 11 */ 7127c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 7137c478bd9Sstevel@tonic-gate 714734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + F(e, a, b) + c + W(12) + SHA1_CONST(0); /* 12 */ 7157c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7167c478bd9Sstevel@tonic-gate 717734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + F(d, e, a) + b + W(13) + SHA1_CONST(0); /* 13 */ 7187c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7197c478bd9Sstevel@tonic-gate 720734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + F(c, d, e) + a + W(14) + SHA1_CONST(0); /* 14 */ 7217c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 7227c478bd9Sstevel@tonic-gate 723734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + F(b, c, d) + e + W(15) + SHA1_CONST(0); /* 15 */ 7247c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 7257c478bd9Sstevel@tonic-gate 726734b6a94Sdarrenm W(0) = ROTATE_LEFT((W(13) ^ W(8) ^ W(2) ^ W(0)), 1); /* 16 */ 727734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + F(a, b, c) + d + W(0) + SHA1_CONST(0); 7287c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 7297c478bd9Sstevel@tonic-gate 730734b6a94Sdarrenm W(1) = ROTATE_LEFT((W(14) ^ W(9) ^ W(3) ^ W(1)), 1); /* 17 */ 731734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + F(e, a, b) + c + W(1) + SHA1_CONST(0); 7327c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7337c478bd9Sstevel@tonic-gate 734734b6a94Sdarrenm W(2) = ROTATE_LEFT((W(15) ^ W(10) ^ W(4) ^ W(2)), 1); /* 18 */ 735734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + F(d, e, a) + b + W(2) + SHA1_CONST(0); 7367c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7377c478bd9Sstevel@tonic-gate 738734b6a94Sdarrenm W(3) = ROTATE_LEFT((W(0) ^ W(11) ^ W(5) ^ W(3)), 1); /* 19 */ 739734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + F(c, d, e) + a + W(3) + SHA1_CONST(0); 7407c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 7417c478bd9Sstevel@tonic-gate 7427c478bd9Sstevel@tonic-gate /* round 2 */ 743734b6a94Sdarrenm W(4) = 
ROTATE_LEFT((W(1) ^ W(12) ^ W(6) ^ W(4)), 1); /* 20 */ 744734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(4) + SHA1_CONST(1); 7457c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 7467c478bd9Sstevel@tonic-gate 747734b6a94Sdarrenm W(5) = ROTATE_LEFT((W(2) ^ W(13) ^ W(7) ^ W(5)), 1); /* 21 */ 748734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(5) + SHA1_CONST(1); 7497c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 7507c478bd9Sstevel@tonic-gate 751734b6a94Sdarrenm W(6) = ROTATE_LEFT((W(3) ^ W(14) ^ W(8) ^ W(6)), 1); /* 22 */ 752734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(6) + SHA1_CONST(1); 7537c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7547c478bd9Sstevel@tonic-gate 755734b6a94Sdarrenm W(7) = ROTATE_LEFT((W(4) ^ W(15) ^ W(9) ^ W(7)), 1); /* 23 */ 756734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(7) + SHA1_CONST(1); 7577c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7587c478bd9Sstevel@tonic-gate 759734b6a94Sdarrenm W(8) = ROTATE_LEFT((W(5) ^ W(0) ^ W(10) ^ W(8)), 1); /* 24 */ 760734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(8) + SHA1_CONST(1); 7617c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 7627c478bd9Sstevel@tonic-gate 763734b6a94Sdarrenm W(9) = ROTATE_LEFT((W(6) ^ W(1) ^ W(11) ^ W(9)), 1); /* 25 */ 764734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(9) + SHA1_CONST(1); 7657c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 7667c478bd9Sstevel@tonic-gate 767734b6a94Sdarrenm W(10) = ROTATE_LEFT((W(7) ^ W(2) ^ W(12) ^ W(10)), 1); /* 26 */ 768734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(10) + SHA1_CONST(1); 7697c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 7707c478bd9Sstevel@tonic-gate 771734b6a94Sdarrenm W(11) = ROTATE_LEFT((W(8) ^ W(3) ^ W(13) ^ W(11)), 1); /* 27 */ 772734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(11) + SHA1_CONST(1); 7737c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7747c478bd9Sstevel@tonic-gate 775734b6a94Sdarrenm W(12) = 
ROTATE_LEFT((W(9) ^ W(4) ^ W(14) ^ W(12)), 1); /* 28 */ 776734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(12) + SHA1_CONST(1); 7777c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7787c478bd9Sstevel@tonic-gate 779734b6a94Sdarrenm W(13) = ROTATE_LEFT((W(10) ^ W(5) ^ W(15) ^ W(13)), 1); /* 29 */ 780734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(13) + SHA1_CONST(1); 7817c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 7827c478bd9Sstevel@tonic-gate 783734b6a94Sdarrenm W(14) = ROTATE_LEFT((W(11) ^ W(6) ^ W(0) ^ W(14)), 1); /* 30 */ 784734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(14) + SHA1_CONST(1); 7857c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 7867c478bd9Sstevel@tonic-gate 787734b6a94Sdarrenm W(15) = ROTATE_LEFT((W(12) ^ W(7) ^ W(1) ^ W(15)), 1); /* 31 */ 788734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(15) + SHA1_CONST(1); 7897c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 7907c478bd9Sstevel@tonic-gate 791734b6a94Sdarrenm W(0) = ROTATE_LEFT((W(13) ^ W(8) ^ W(2) ^ W(0)), 1); /* 32 */ 792734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(0) + SHA1_CONST(1); 7937c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7947c478bd9Sstevel@tonic-gate 795734b6a94Sdarrenm W(1) = ROTATE_LEFT((W(14) ^ W(9) ^ W(3) ^ W(1)), 1); /* 33 */ 796734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(1) + SHA1_CONST(1); 7977c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7987c478bd9Sstevel@tonic-gate 799734b6a94Sdarrenm W(2) = ROTATE_LEFT((W(15) ^ W(10) ^ W(4) ^ W(2)), 1); /* 34 */ 800734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(2) + SHA1_CONST(1); 8017c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 8027c478bd9Sstevel@tonic-gate 803734b6a94Sdarrenm W(3) = ROTATE_LEFT((W(0) ^ W(11) ^ W(5) ^ W(3)), 1); /* 35 */ 804734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(3) + SHA1_CONST(1); 8057c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 8067c478bd9Sstevel@tonic-gate 807734b6a94Sdarrenm 
W(4) = ROTATE_LEFT((W(1) ^ W(12) ^ W(6) ^ W(4)), 1); /* 36 */ 808734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(4) + SHA1_CONST(1); 8097c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 8107c478bd9Sstevel@tonic-gate 811734b6a94Sdarrenm W(5) = ROTATE_LEFT((W(2) ^ W(13) ^ W(7) ^ W(5)), 1); /* 37 */ 812734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(5) + SHA1_CONST(1); 8137c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 8147c478bd9Sstevel@tonic-gate 815734b6a94Sdarrenm W(6) = ROTATE_LEFT((W(3) ^ W(14) ^ W(8) ^ W(6)), 1); /* 38 */ 816734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(6) + SHA1_CONST(1); 8177c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 8187c478bd9Sstevel@tonic-gate 819734b6a94Sdarrenm W(7) = ROTATE_LEFT((W(4) ^ W(15) ^ W(9) ^ W(7)), 1); /* 39 */ 820734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(7) + SHA1_CONST(1); 8217c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 8227c478bd9Sstevel@tonic-gate 8237c478bd9Sstevel@tonic-gate /* round 3 */ 824734b6a94Sdarrenm W(8) = ROTATE_LEFT((W(5) ^ W(0) ^ W(10) ^ W(8)), 1); /* 40 */ 825734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + H(b, c, d) + e + W(8) + SHA1_CONST(2); 8267c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 8277c478bd9Sstevel@tonic-gate 828734b6a94Sdarrenm W(9) = ROTATE_LEFT((W(6) ^ W(1) ^ W(11) ^ W(9)), 1); /* 41 */ 829734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + H(a, b, c) + d + W(9) + SHA1_CONST(2); 8307c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 8317c478bd9Sstevel@tonic-gate 832734b6a94Sdarrenm W(10) = ROTATE_LEFT((W(7) ^ W(2) ^ W(12) ^ W(10)), 1); /* 42 */ 833734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + H(e, a, b) + c + W(10) + SHA1_CONST(2); 8347c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 8357c478bd9Sstevel@tonic-gate 836734b6a94Sdarrenm W(11) = ROTATE_LEFT((W(8) ^ W(3) ^ W(13) ^ W(11)), 1); /* 43 */ 837734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + H(d, e, a) + b + W(11) + SHA1_CONST(2); 8387c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 
8397c478bd9Sstevel@tonic-gate 840734b6a94Sdarrenm W(12) = ROTATE_LEFT((W(9) ^ W(4) ^ W(14) ^ W(12)), 1); /* 44 */ 841734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + H(c, d, e) + a + W(12) + SHA1_CONST(2); 8427c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 8437c478bd9Sstevel@tonic-gate 844734b6a94Sdarrenm W(13) = ROTATE_LEFT((W(10) ^ W(5) ^ W(15) ^ W(13)), 1); /* 45 */ 845734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + H(b, c, d) + e + W(13) + SHA1_CONST(2); 8467c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 8477c478bd9Sstevel@tonic-gate 848734b6a94Sdarrenm W(14) = ROTATE_LEFT((W(11) ^ W(6) ^ W(0) ^ W(14)), 1); /* 46 */ 849734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + H(a, b, c) + d + W(14) + SHA1_CONST(2); 8507c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 8517c478bd9Sstevel@tonic-gate 852734b6a94Sdarrenm W(15) = ROTATE_LEFT((W(12) ^ W(7) ^ W(1) ^ W(15)), 1); /* 47 */ 853734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + H(e, a, b) + c + W(15) + SHA1_CONST(2); 8547c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 8557c478bd9Sstevel@tonic-gate 856734b6a94Sdarrenm W(0) = ROTATE_LEFT((W(13) ^ W(8) ^ W(2) ^ W(0)), 1); /* 48 */ 857734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + H(d, e, a) + b + W(0) + SHA1_CONST(2); 8587c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 8597c478bd9Sstevel@tonic-gate 860734b6a94Sdarrenm W(1) = ROTATE_LEFT((W(14) ^ W(9) ^ W(3) ^ W(1)), 1); /* 49 */ 861734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + H(c, d, e) + a + W(1) + SHA1_CONST(2); 8627c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 8637c478bd9Sstevel@tonic-gate 864734b6a94Sdarrenm W(2) = ROTATE_LEFT((W(15) ^ W(10) ^ W(4) ^ W(2)), 1); /* 50 */ 865734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + H(b, c, d) + e + W(2) + SHA1_CONST(2); 8667c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 8677c478bd9Sstevel@tonic-gate 868734b6a94Sdarrenm W(3) = ROTATE_LEFT((W(0) ^ W(11) ^ W(5) ^ W(3)), 1); /* 51 */ 869734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + H(a, b, c) + d + W(3) + SHA1_CONST(2); 8707c478bd9Sstevel@tonic-gate a = 
ROTATE_LEFT(a, 30); 8717c478bd9Sstevel@tonic-gate 872734b6a94Sdarrenm W(4) = ROTATE_LEFT((W(1) ^ W(12) ^ W(6) ^ W(4)), 1); /* 52 */ 873734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + H(e, a, b) + c + W(4) + SHA1_CONST(2); 8747c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 8757c478bd9Sstevel@tonic-gate 876734b6a94Sdarrenm W(5) = ROTATE_LEFT((W(2) ^ W(13) ^ W(7) ^ W(5)), 1); /* 53 */ 877734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + H(d, e, a) + b + W(5) + SHA1_CONST(2); 8787c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 8797c478bd9Sstevel@tonic-gate 880734b6a94Sdarrenm W(6) = ROTATE_LEFT((W(3) ^ W(14) ^ W(8) ^ W(6)), 1); /* 54 */ 881734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + H(c, d, e) + a + W(6) + SHA1_CONST(2); 8827c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 8837c478bd9Sstevel@tonic-gate 884734b6a94Sdarrenm W(7) = ROTATE_LEFT((W(4) ^ W(15) ^ W(9) ^ W(7)), 1); /* 55 */ 885734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + H(b, c, d) + e + W(7) + SHA1_CONST(2); 8867c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 8877c478bd9Sstevel@tonic-gate 888734b6a94Sdarrenm W(8) = ROTATE_LEFT((W(5) ^ W(0) ^ W(10) ^ W(8)), 1); /* 56 */ 889734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + H(a, b, c) + d + W(8) + SHA1_CONST(2); 8907c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 8917c478bd9Sstevel@tonic-gate 892734b6a94Sdarrenm W(9) = ROTATE_LEFT((W(6) ^ W(1) ^ W(11) ^ W(9)), 1); /* 57 */ 893734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + H(e, a, b) + c + W(9) + SHA1_CONST(2); 8947c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 8957c478bd9Sstevel@tonic-gate 896734b6a94Sdarrenm W(10) = ROTATE_LEFT((W(7) ^ W(2) ^ W(12) ^ W(10)), 1); /* 58 */ 897734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + H(d, e, a) + b + W(10) + SHA1_CONST(2); 8987c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 8997c478bd9Sstevel@tonic-gate 900734b6a94Sdarrenm W(11) = ROTATE_LEFT((W(8) ^ W(3) ^ W(13) ^ W(11)), 1); /* 59 */ 901734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + H(c, d, e) + a + W(11) + SHA1_CONST(2); 9027c478bd9Sstevel@tonic-gate c = 
ROTATE_LEFT(c, 30); 9037c478bd9Sstevel@tonic-gate 9047c478bd9Sstevel@tonic-gate /* round 4 */ 905734b6a94Sdarrenm W(12) = ROTATE_LEFT((W(9) ^ W(4) ^ W(14) ^ W(12)), 1); /* 60 */ 906734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(12) + SHA1_CONST(3); 9077c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 9087c478bd9Sstevel@tonic-gate 909734b6a94Sdarrenm W(13) = ROTATE_LEFT((W(10) ^ W(5) ^ W(15) ^ W(13)), 1); /* 61 */ 910734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(13) + SHA1_CONST(3); 9117c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 9127c478bd9Sstevel@tonic-gate 913734b6a94Sdarrenm W(14) = ROTATE_LEFT((W(11) ^ W(6) ^ W(0) ^ W(14)), 1); /* 62 */ 914734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(14) + SHA1_CONST(3); 9157c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 9167c478bd9Sstevel@tonic-gate 917734b6a94Sdarrenm W(15) = ROTATE_LEFT((W(12) ^ W(7) ^ W(1) ^ W(15)), 1); /* 63 */ 918734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(15) + SHA1_CONST(3); 9197c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 9207c478bd9Sstevel@tonic-gate 921734b6a94Sdarrenm W(0) = ROTATE_LEFT((W(13) ^ W(8) ^ W(2) ^ W(0)), 1); /* 64 */ 922734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(0) + SHA1_CONST(3); 9237c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 9247c478bd9Sstevel@tonic-gate 925734b6a94Sdarrenm W(1) = ROTATE_LEFT((W(14) ^ W(9) ^ W(3) ^ W(1)), 1); /* 65 */ 926734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(1) + SHA1_CONST(3); 9277c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 9287c478bd9Sstevel@tonic-gate 929734b6a94Sdarrenm W(2) = ROTATE_LEFT((W(15) ^ W(10) ^ W(4) ^ W(2)), 1); /* 66 */ 930734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(2) + SHA1_CONST(3); 9317c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 9327c478bd9Sstevel@tonic-gate 933734b6a94Sdarrenm W(3) = ROTATE_LEFT((W(0) ^ W(11) ^ W(5) ^ W(3)), 1); /* 67 */ 934734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(3) 
+ SHA1_CONST(3); 9357c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 9367c478bd9Sstevel@tonic-gate 937734b6a94Sdarrenm W(4) = ROTATE_LEFT((W(1) ^ W(12) ^ W(6) ^ W(4)), 1); /* 68 */ 938734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(4) + SHA1_CONST(3); 9397c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 9407c478bd9Sstevel@tonic-gate 941734b6a94Sdarrenm W(5) = ROTATE_LEFT((W(2) ^ W(13) ^ W(7) ^ W(5)), 1); /* 69 */ 942734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(5) + SHA1_CONST(3); 9437c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 9447c478bd9Sstevel@tonic-gate 945734b6a94Sdarrenm W(6) = ROTATE_LEFT((W(3) ^ W(14) ^ W(8) ^ W(6)), 1); /* 70 */ 946734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(6) + SHA1_CONST(3); 9477c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 9487c478bd9Sstevel@tonic-gate 949734b6a94Sdarrenm W(7) = ROTATE_LEFT((W(4) ^ W(15) ^ W(9) ^ W(7)), 1); /* 71 */ 950734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(7) + SHA1_CONST(3); 9517c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 9527c478bd9Sstevel@tonic-gate 953734b6a94Sdarrenm W(8) = ROTATE_LEFT((W(5) ^ W(0) ^ W(10) ^ W(8)), 1); /* 72 */ 954734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(8) + SHA1_CONST(3); 9557c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 9567c478bd9Sstevel@tonic-gate 957734b6a94Sdarrenm W(9) = ROTATE_LEFT((W(6) ^ W(1) ^ W(11) ^ W(9)), 1); /* 73 */ 958734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(9) + SHA1_CONST(3); 9597c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 9607c478bd9Sstevel@tonic-gate 961734b6a94Sdarrenm W(10) = ROTATE_LEFT((W(7) ^ W(2) ^ W(12) ^ W(10)), 1); /* 74 */ 962734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(10) + SHA1_CONST(3); 9637c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 9647c478bd9Sstevel@tonic-gate 965734b6a94Sdarrenm W(11) = ROTATE_LEFT((W(8) ^ W(3) ^ W(13) ^ W(11)), 1); /* 75 */ 966734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(11) + 
SHA1_CONST(3); 9677c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 9687c478bd9Sstevel@tonic-gate 969734b6a94Sdarrenm W(12) = ROTATE_LEFT((W(9) ^ W(4) ^ W(14) ^ W(12)), 1); /* 76 */ 970734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(12) + SHA1_CONST(3); 9717c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 9727c478bd9Sstevel@tonic-gate 973734b6a94Sdarrenm W(13) = ROTATE_LEFT((W(10) ^ W(5) ^ W(15) ^ W(13)), 1); /* 77 */ 974734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(13) + SHA1_CONST(3); 9757c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 9767c478bd9Sstevel@tonic-gate 977734b6a94Sdarrenm W(14) = ROTATE_LEFT((W(11) ^ W(6) ^ W(0) ^ W(14)), 1); /* 78 */ 978734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(14) + SHA1_CONST(3); 9797c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 9807c478bd9Sstevel@tonic-gate 981734b6a94Sdarrenm W(15) = ROTATE_LEFT((W(12) ^ W(7) ^ W(1) ^ W(15)), 1); /* 79 */ 9827c478bd9Sstevel@tonic-gate 983734b6a94Sdarrenm ctx->state[0] += ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(15) + 9847c478bd9Sstevel@tonic-gate SHA1_CONST(3); 9857c478bd9Sstevel@tonic-gate ctx->state[1] += b; 9867c478bd9Sstevel@tonic-gate ctx->state[2] += ROTATE_LEFT(c, 30); 9877c478bd9Sstevel@tonic-gate ctx->state[3] += d; 9887c478bd9Sstevel@tonic-gate ctx->state[4] += e; 9897c478bd9Sstevel@tonic-gate 9907c478bd9Sstevel@tonic-gate /* zeroize sensitive information */ 991734b6a94Sdarrenm W(0) = W(1) = W(2) = W(3) = W(4) = W(5) = W(6) = W(7) = W(8) = 0; 992734b6a94Sdarrenm W(9) = W(10) = W(11) = W(12) = W(13) = W(14) = W(15) = 0; 9937c478bd9Sstevel@tonic-gate } 994321502cdSda73024 #endif /* !__amd64 */ 995321502cdSda73024 9967c478bd9Sstevel@tonic-gate 9977c478bd9Sstevel@tonic-gate /* 9987c478bd9Sstevel@tonic-gate * Encode() 9997c478bd9Sstevel@tonic-gate * 10007c478bd9Sstevel@tonic-gate * purpose: to convert a list of numbers from little endian to big endian 10017c478bd9Sstevel@tonic-gate * input: uint8_t * : place to store the converted big endian 
/*
 * Encode()
 *
 * purpose: to serialize an array of 32-bit words (host byte order) into a
 *          big endian byte stream
 *   input: uint8_t *	: place to store the converted big endian numbers
 *          uint32_t *	: place to get numbers to convert from
 *          size_t	: the length of the input in bytes
 *  output: void
 *
 * Exactly `len' bytes are stored into the output buffer.  When `len' is
 * not a multiple of sizeof (uint32_t), the trailing bytes are the most
 * significant bytes of the next input word, so that word is read in
 * full and must be present in the input array.
 */

static void
Encode(uint8_t *_RESTRICT_KYWD output, const uint32_t *_RESTRICT_KYWD input,
    size_t len)
{
	size_t		nwords = len / sizeof (uint32_t);
	size_t		ntail = len % sizeof (uint32_t);
	size_t		i, j;
	uint32_t	word;

#if	defined(__sparc)
	if (IS_P2ALIGNED(output, sizeof (uint32_t))) {
		/*
		 * SPARC is big endian, so an aligned word store already
		 * produces the required byte order.
		 */
		for (i = 0, j = 0; i < nwords; i++, j += 4) {
			/* LINTED E_BAD_PTR_CAST_ALIGN */
			*((uint32_t *)(output + j)) = input[i];
		}
	} else
#endif	/* little endian -- will work on big endian, but slowly */
	{
		for (i = 0, j = 0; i < nwords; i++, j += 4) {
			word = input[i];
			output[j]	= (word >> 24) & 0xff;
			output[j + 1]	= (word >> 16) & 0xff;
			output[j + 2]	= (word >>  8) & 0xff;
			output[j + 3]	= word & 0xff;
		}
	}

	/*
	 * Partial trailing word: emit only its leading (most significant)
	 * bytes so that nothing is stored at or beyond output[len].
	 */
	if (ntail != 0) {
		word = input[nwords];
		for (i = 0; i < ntail; i++)
			output[j + i] = (word >> (24 - 8 * i)) & 0xff;
	}
}