17c478bd9Sstevel@tonic-gate /* 2321502cdSda73024 * Copyright 2008 Sun Microsystems, Inc. All rights reserved. 37c478bd9Sstevel@tonic-gate * Use is subject to license terms. 47c478bd9Sstevel@tonic-gate */ 57c478bd9Sstevel@tonic-gate 67c478bd9Sstevel@tonic-gate /* 77c478bd9Sstevel@tonic-gate * The basic framework for this code came from the reference 87c478bd9Sstevel@tonic-gate * implementation for MD5. That implementation is Copyright (C) 97c478bd9Sstevel@tonic-gate * 1991-2, RSA Data Security, Inc. Created 1991. All rights reserved. 107c478bd9Sstevel@tonic-gate * 117c478bd9Sstevel@tonic-gate * License to copy and use this software is granted provided that it 127c478bd9Sstevel@tonic-gate * is identified as the "RSA Data Security, Inc. MD5 Message-Digest 137c478bd9Sstevel@tonic-gate * Algorithm" in all material mentioning or referencing this software 147c478bd9Sstevel@tonic-gate * or this function. 157c478bd9Sstevel@tonic-gate * 167c478bd9Sstevel@tonic-gate * License is also granted to make and use derivative works provided 177c478bd9Sstevel@tonic-gate * that such works are identified as "derived from the RSA Data 187c478bd9Sstevel@tonic-gate * Security, Inc. MD5 Message-Digest Algorithm" in all material 197c478bd9Sstevel@tonic-gate * mentioning or referencing the derived work. 207c478bd9Sstevel@tonic-gate * 217c478bd9Sstevel@tonic-gate * RSA Data Security, Inc. makes no representations concerning either 227c478bd9Sstevel@tonic-gate * the merchantability of this software or the suitability of this 237c478bd9Sstevel@tonic-gate * software for any particular purpose. It is provided "as is" 247c478bd9Sstevel@tonic-gate * without express or implied warranty of any kind. 257c478bd9Sstevel@tonic-gate * 267c478bd9Sstevel@tonic-gate * These notices must be retained in any copies of any part of this 277c478bd9Sstevel@tonic-gate * documentation and/or software. 287c478bd9Sstevel@tonic-gate * 297c478bd9Sstevel@tonic-gate * NOTE: Cleaned-up and optimized, version of SHA1, based on the FIPS 180-1 30*4b56a003SDaniel Anderson * standard, available at http://www.itl.nist.gov/fipspubs/fip180-1.htm 317c478bd9Sstevel@tonic-gate * Not as fast as one would like -- further optimizations are encouraged 327c478bd9Sstevel@tonic-gate * and appreciated. 337c478bd9Sstevel@tonic-gate */ 347c478bd9Sstevel@tonic-gate 357c478bd9Sstevel@tonic-gate #include <sys/types.h> 367c478bd9Sstevel@tonic-gate #include <sys/param.h> 377c478bd9Sstevel@tonic-gate #include <sys/systm.h> 387c478bd9Sstevel@tonic-gate #include <sys/sysmacros.h> 397c478bd9Sstevel@tonic-gate #include <sys/sha1.h> 407c478bd9Sstevel@tonic-gate #include <sys/sha1_consts.h> 417c478bd9Sstevel@tonic-gate 427c478bd9Sstevel@tonic-gate #ifndef _KERNEL 437c478bd9Sstevel@tonic-gate #include <strings.h> 447c478bd9Sstevel@tonic-gate #include <stdlib.h> 457c478bd9Sstevel@tonic-gate #include <errno.h> 467c478bd9Sstevel@tonic-gate #include <sys/systeminfo.h> 477c478bd9Sstevel@tonic-gate #endif /* !_KERNEL */ 487c478bd9Sstevel@tonic-gate 49*4b56a003SDaniel Anderson #ifdef _LITTLE_ENDIAN 50*4b56a003SDaniel Anderson #include <sys/byteorder.h> 51*4b56a003SDaniel Anderson #define HAVE_HTONL 52*4b56a003SDaniel Anderson #endif 53*4b56a003SDaniel Anderson 54734b6a94Sdarrenm static void Encode(uint8_t *, const uint32_t *, size_t); 55734b6a94Sdarrenm 56734b6a94Sdarrenm #if defined(__sparc) 57734b6a94Sdarrenm 58734b6a94Sdarrenm #define SHA1_TRANSFORM(ctx, in) \ 59734b6a94Sdarrenm SHA1Transform((ctx)->state[0], (ctx)->state[1], (ctx)->state[2], \ 60734b6a94Sdarrenm (ctx)->state[3], (ctx)->state[4], (ctx), (in)) 61734b6a94Sdarrenm 627c478bd9Sstevel@tonic-gate static void SHA1Transform(uint32_t, uint32_t, uint32_t, uint32_t, uint32_t, 637c478bd9Sstevel@tonic-gate SHA1_CTX *, const uint8_t *); 647c478bd9Sstevel@tonic-gate 65321502cdSda73024 #elif defined(__amd64) 66321502cdSda73024 67321502cdSda73024 #define SHA1_TRANSFORM(ctx, in) sha1_block_data_order((ctx), (in), 1) 68321502cdSda73024 #define SHA1_TRANSFORM_BLOCKS(ctx, in, num) sha1_block_data_order((ctx), \ 69321502cdSda73024 (in), (num)) 70321502cdSda73024 71321502cdSda73024 void sha1_block_data_order(SHA1_CTX *ctx, const void *inpp, size_t num_blocks); 72321502cdSda73024 73734b6a94Sdarrenm #else 74734b6a94Sdarrenm 75734b6a94Sdarrenm #define SHA1_TRANSFORM(ctx, in) SHA1Transform((ctx), (in)) 76734b6a94Sdarrenm 77734b6a94Sdarrenm static void SHA1Transform(SHA1_CTX *, const uint8_t *); 78734b6a94Sdarrenm 79734b6a94Sdarrenm #endif 80734b6a94Sdarrenm 81734b6a94Sdarrenm 827c478bd9Sstevel@tonic-gate static uint8_t PADDING[64] = { 0x80, /* all zeros */ }; 837c478bd9Sstevel@tonic-gate 847c478bd9Sstevel@tonic-gate /* 857c478bd9Sstevel@tonic-gate * F, G, and H are the basic SHA1 functions. 867c478bd9Sstevel@tonic-gate */ 877c478bd9Sstevel@tonic-gate #define F(b, c, d) (((b) & (c)) | ((~b) & (d))) 887c478bd9Sstevel@tonic-gate #define G(b, c, d) ((b) ^ (c) ^ (d)) 89734b6a94Sdarrenm #define H(b, c, d) (((b) & (c)) | (((b)|(c)) & (d))) 907c478bd9Sstevel@tonic-gate 917c478bd9Sstevel@tonic-gate /* 927c478bd9Sstevel@tonic-gate * ROTATE_LEFT rotates x left n bits. 937c478bd9Sstevel@tonic-gate */ 94734b6a94Sdarrenm 95734b6a94Sdarrenm #if defined(__GNUC__) && defined(_LP64) 96734b6a94Sdarrenm static __inline__ uint64_t 97734b6a94Sdarrenm ROTATE_LEFT(uint64_t value, uint32_t n) 98734b6a94Sdarrenm { 99734b6a94Sdarrenm uint32_t t32; 100734b6a94Sdarrenm 101734b6a94Sdarrenm t32 = (uint32_t)value; 102734b6a94Sdarrenm return ((t32 << n) | (t32 >> (32 - n))); 103734b6a94Sdarrenm } 104734b6a94Sdarrenm 105734b6a94Sdarrenm #else 106734b6a94Sdarrenm 1077c478bd9Sstevel@tonic-gate #define ROTATE_LEFT(x, n) \ 1087c478bd9Sstevel@tonic-gate (((x) << (n)) | ((x) >> ((sizeof (x) * NBBY)-(n)))) 1097c478bd9Sstevel@tonic-gate 110734b6a94Sdarrenm #endif 1117c478bd9Sstevel@tonic-gate 1127c478bd9Sstevel@tonic-gate 1137c478bd9Sstevel@tonic-gate /* 1147c478bd9Sstevel@tonic-gate * SHA1Init() 1157c478bd9Sstevel@tonic-gate * 1167c478bd9Sstevel@tonic-gate * purpose: initializes the sha1 context and begins and sha1 digest operation 1177c478bd9Sstevel@tonic-gate * input: SHA1_CTX * : the context to initializes. 1187c478bd9Sstevel@tonic-gate * output: void 1197c478bd9Sstevel@tonic-gate */ 1207c478bd9Sstevel@tonic-gate 1217c478bd9Sstevel@tonic-gate void 1227c478bd9Sstevel@tonic-gate SHA1Init(SHA1_CTX *ctx) 1237c478bd9Sstevel@tonic-gate { 1247c478bd9Sstevel@tonic-gate ctx->count[0] = ctx->count[1] = 0; 1257c478bd9Sstevel@tonic-gate 1267c478bd9Sstevel@tonic-gate /* 1277c478bd9Sstevel@tonic-gate * load magic initialization constants. Tell lint 1287c478bd9Sstevel@tonic-gate * that these constants are unsigned by using U. 1297c478bd9Sstevel@tonic-gate */ 1307c478bd9Sstevel@tonic-gate 1317c478bd9Sstevel@tonic-gate ctx->state[0] = 0x67452301U; 1327c478bd9Sstevel@tonic-gate ctx->state[1] = 0xefcdab89U; 1337c478bd9Sstevel@tonic-gate ctx->state[2] = 0x98badcfeU; 1347c478bd9Sstevel@tonic-gate ctx->state[3] = 0x10325476U; 1357c478bd9Sstevel@tonic-gate ctx->state[4] = 0xc3d2e1f0U; 1367c478bd9Sstevel@tonic-gate } 1377c478bd9Sstevel@tonic-gate 1387c478bd9Sstevel@tonic-gate #ifdef VIS_SHA1 1397c478bd9Sstevel@tonic-gate #ifdef _KERNEL 1407c478bd9Sstevel@tonic-gate 1417c478bd9Sstevel@tonic-gate #include <sys/regset.h> 1427c478bd9Sstevel@tonic-gate #include <sys/vis.h> 14315b9cbbcSkrishna #include <sys/fpu/fpusystm.h> 1447c478bd9Sstevel@tonic-gate 1457c478bd9Sstevel@tonic-gate /* the alignment for block stores to save fp registers */ 1467c478bd9Sstevel@tonic-gate #define VIS_ALIGN (64) 1477c478bd9Sstevel@tonic-gate 1487c478bd9Sstevel@tonic-gate extern int sha1_savefp(kfpu_t *, int); 1497c478bd9Sstevel@tonic-gate extern void sha1_restorefp(kfpu_t *); 1507c478bd9Sstevel@tonic-gate 1517c478bd9Sstevel@tonic-gate uint32_t vis_sha1_svfp_threshold = 128; 1527c478bd9Sstevel@tonic-gate 1537c478bd9Sstevel@tonic-gate #endif /* _KERNEL */ 1547c478bd9Sstevel@tonic-gate 1557c478bd9Sstevel@tonic-gate /* 1567c478bd9Sstevel@tonic-gate * VIS SHA-1 consts. 1577c478bd9Sstevel@tonic-gate */ 1587c478bd9Sstevel@tonic-gate static uint64_t VIS[] = { 1594cc1ac68Skrishna 0x8000000080000000ULL, 1604cc1ac68Skrishna 0x0002000200020002ULL, 1614cc1ac68Skrishna 0x5a8279996ed9eba1ULL, 1624cc1ac68Skrishna 0x8f1bbcdcca62c1d6ULL, 1634cc1ac68Skrishna 0x012389ab456789abULL}; 1647c478bd9Sstevel@tonic-gate 165734b6a94Sdarrenm extern void SHA1TransformVIS(uint64_t *, uint32_t *, uint32_t *, uint64_t *); 1667c478bd9Sstevel@tonic-gate 1677c478bd9Sstevel@tonic-gate 1687c478bd9Sstevel@tonic-gate /* 1697c478bd9Sstevel@tonic-gate * SHA1Update() 1707c478bd9Sstevel@tonic-gate * 1717c478bd9Sstevel@tonic-gate * purpose: continues an sha1 digest operation, using the message block 1727c478bd9Sstevel@tonic-gate * to update the context. 1737c478bd9Sstevel@tonic-gate * input: SHA1_CTX * : the context to update 174734b6a94Sdarrenm * void * : the message block 175734b6a94Sdarrenm * size_t : the length of the message block in bytes 1767c478bd9Sstevel@tonic-gate * output: void 1777c478bd9Sstevel@tonic-gate */ 1787c478bd9Sstevel@tonic-gate 1797c478bd9Sstevel@tonic-gate void 180734b6a94Sdarrenm SHA1Update(SHA1_CTX *ctx, const void *inptr, size_t input_len) 1817c478bd9Sstevel@tonic-gate { 1827c478bd9Sstevel@tonic-gate uint32_t i, buf_index, buf_len; 1837c478bd9Sstevel@tonic-gate uint64_t X0[40], input64[8]; 184734b6a94Sdarrenm const uint8_t *input = inptr; 18515b9cbbcSkrishna #ifdef _KERNEL 18615b9cbbcSkrishna int usevis = 0; 187734b6a94Sdarrenm #else 188734b6a94Sdarrenm int usevis = 1; 18915b9cbbcSkrishna #endif /* _KERNEL */ 1907c478bd9Sstevel@tonic-gate 1917c478bd9Sstevel@tonic-gate /* check for noop */ 1927c478bd9Sstevel@tonic-gate if (input_len == 0) 1937c478bd9Sstevel@tonic-gate return; 1947c478bd9Sstevel@tonic-gate 1957c478bd9Sstevel@tonic-gate /* compute number of bytes mod 64 */ 1967c478bd9Sstevel@tonic-gate buf_index = (ctx->count[1] >> 3) & 0x3F; 1977c478bd9Sstevel@tonic-gate 1987c478bd9Sstevel@tonic-gate /* update number of bits */ 1997c478bd9Sstevel@tonic-gate if ((ctx->count[1] += (input_len << 3)) < (input_len << 3)) 2007c478bd9Sstevel@tonic-gate ctx->count[0]++; 2017c478bd9Sstevel@tonic-gate 2027c478bd9Sstevel@tonic-gate ctx->count[0] += (input_len >> 29); 2037c478bd9Sstevel@tonic-gate 2047c478bd9Sstevel@tonic-gate buf_len = 64 - buf_index; 2057c478bd9Sstevel@tonic-gate 2067c478bd9Sstevel@tonic-gate /* transform as many times as possible */ 2077c478bd9Sstevel@tonic-gate i = 0; 2087c478bd9Sstevel@tonic-gate if (input_len >= buf_len) { 2097c478bd9Sstevel@tonic-gate #ifdef _KERNEL 2107c478bd9Sstevel@tonic-gate kfpu_t *fpu; 211734b6a94Sdarrenm if (fpu_exists) { 212734b6a94Sdarrenm uint8_t fpua[sizeof (kfpu_t) + GSR_SIZE + VIS_ALIGN]; 2137c478bd9Sstevel@tonic-gate uint32_t len = (input_len + buf_index) & ~0x3f; 2147c478bd9Sstevel@tonic-gate int svfp_ok; 2157c478bd9Sstevel@tonic-gate 2167c478bd9Sstevel@tonic-gate fpu = (kfpu_t *)P2ROUNDUP((uintptr_t)fpua, 64); 2177c478bd9Sstevel@tonic-gate svfp_ok = ((len >= vis_sha1_svfp_threshold) ? 1 : 0); 21815b9cbbcSkrishna usevis = fpu_exists && sha1_savefp(fpu, svfp_ok); 219734b6a94Sdarrenm } else { 220734b6a94Sdarrenm usevis = 0; 221734b6a94Sdarrenm } 2227c478bd9Sstevel@tonic-gate #endif /* _KERNEL */ 2237c478bd9Sstevel@tonic-gate 2247c478bd9Sstevel@tonic-gate /* 2257c478bd9Sstevel@tonic-gate * general optimization: 2267c478bd9Sstevel@tonic-gate * 2277c478bd9Sstevel@tonic-gate * only do initial bcopy() and SHA1Transform() if 2287c478bd9Sstevel@tonic-gate * buf_index != 0. if buf_index == 0, we're just 2297c478bd9Sstevel@tonic-gate * wasting our time doing the bcopy() since there 2307c478bd9Sstevel@tonic-gate * wasn't any data left over from a previous call to 2317c478bd9Sstevel@tonic-gate * SHA1Update(). 2327c478bd9Sstevel@tonic-gate */ 2337c478bd9Sstevel@tonic-gate 2347c478bd9Sstevel@tonic-gate if (buf_index) { 2357c478bd9Sstevel@tonic-gate bcopy(input, &ctx->buf_un.buf8[buf_index], buf_len); 2367c478bd9Sstevel@tonic-gate if (usevis) { 2377c478bd9Sstevel@tonic-gate SHA1TransformVIS(X0, 238734b6a94Sdarrenm ctx->buf_un.buf32, 2397c478bd9Sstevel@tonic-gate &ctx->state[0], VIS); 2407c478bd9Sstevel@tonic-gate } else { 241734b6a94Sdarrenm SHA1_TRANSFORM(ctx, ctx->buf_un.buf8); 2427c478bd9Sstevel@tonic-gate } 2437c478bd9Sstevel@tonic-gate i = buf_len; 2447c478bd9Sstevel@tonic-gate } 2457c478bd9Sstevel@tonic-gate 2467c478bd9Sstevel@tonic-gate /* 2477c478bd9Sstevel@tonic-gate * VIS SHA-1: uses the VIS 1.0 instructions to accelerate 2487c478bd9Sstevel@tonic-gate * SHA-1 processing. This is achieved by "offloading" the 2497c478bd9Sstevel@tonic-gate * computation of the message schedule (MS) to the VIS units. 2507c478bd9Sstevel@tonic-gate * This allows the VIS computation of the message schedule 2517c478bd9Sstevel@tonic-gate * to be performed in parallel with the standard integer 2527c478bd9Sstevel@tonic-gate * processing of the remainder of the SHA-1 computation. 2537c478bd9Sstevel@tonic-gate * performance by up to around 1.37X, compared to an optimized 2547c478bd9Sstevel@tonic-gate * integer-only implementation. 2557c478bd9Sstevel@tonic-gate * 2567c478bd9Sstevel@tonic-gate * The VIS implementation of SHA1Transform has a different API 2577c478bd9Sstevel@tonic-gate * to the standard integer version: 2587c478bd9Sstevel@tonic-gate * 2597c478bd9Sstevel@tonic-gate * void SHA1TransformVIS( 2607c478bd9Sstevel@tonic-gate * uint64_t *, // Pointer to MS for ith block 261734b6a94Sdarrenm * uint32_t *, // Pointer to ith block of message data 2627c478bd9Sstevel@tonic-gate * uint32_t *, // Pointer to SHA state i.e ctx->state 2637c478bd9Sstevel@tonic-gate * uint64_t *, // Pointer to various VIS constants 2647c478bd9Sstevel@tonic-gate * ) 2657c478bd9Sstevel@tonic-gate * 2667c478bd9Sstevel@tonic-gate * Note: the message data must by 4-byte aligned. 2677c478bd9Sstevel@tonic-gate * 2687c478bd9Sstevel@tonic-gate * Function requires VIS 1.0 support. 2697c478bd9Sstevel@tonic-gate * 2707c478bd9Sstevel@tonic-gate * Handling is provided to deal with arbitrary byte alingment 2717c478bd9Sstevel@tonic-gate * of the input data but the performance gains are reduced 2727c478bd9Sstevel@tonic-gate * for alignments other than 4-bytes. 2737c478bd9Sstevel@tonic-gate */ 2747c478bd9Sstevel@tonic-gate if (usevis) { 275734b6a94Sdarrenm if (!IS_P2ALIGNED(&input[i], sizeof (uint32_t))) { 2767c478bd9Sstevel@tonic-gate /* 2777c478bd9Sstevel@tonic-gate * Main processing loop - input misaligned 2787c478bd9Sstevel@tonic-gate */ 2797c478bd9Sstevel@tonic-gate for (; i + 63 < input_len; i += 64) { 2807c478bd9Sstevel@tonic-gate bcopy(&input[i], input64, 64); 281321502cdSda73024 SHA1TransformVIS(X0, 282321502cdSda73024 (uint32_t *)input64, 2837c478bd9Sstevel@tonic-gate &ctx->state[0], VIS); 2847c478bd9Sstevel@tonic-gate } 2857c478bd9Sstevel@tonic-gate } else { 2867c478bd9Sstevel@tonic-gate /* 2877c478bd9Sstevel@tonic-gate * Main processing loop - input 8-byte aligned 2887c478bd9Sstevel@tonic-gate */ 2897c478bd9Sstevel@tonic-gate for (; i + 63 < input_len; i += 64) { 2907c478bd9Sstevel@tonic-gate SHA1TransformVIS(X0, 291734b6a94Sdarrenm /* LINTED E_BAD_PTR_CAST_ALIGN */ 292*4b56a003SDaniel Anderson (uint32_t *)&input[i], /* CSTYLED */ 2937c478bd9Sstevel@tonic-gate &ctx->state[0], VIS); 2947c478bd9Sstevel@tonic-gate } 2957c478bd9Sstevel@tonic-gate 2967c478bd9Sstevel@tonic-gate } 2977c478bd9Sstevel@tonic-gate #ifdef _KERNEL 2987c478bd9Sstevel@tonic-gate sha1_restorefp(fpu); 2997c478bd9Sstevel@tonic-gate #endif /* _KERNEL */ 3007c478bd9Sstevel@tonic-gate } else { 3017c478bd9Sstevel@tonic-gate for (; i + 63 < input_len; i += 64) { 302734b6a94Sdarrenm SHA1_TRANSFORM(ctx, &input[i]); 3037c478bd9Sstevel@tonic-gate } 3047c478bd9Sstevel@tonic-gate } 3057c478bd9Sstevel@tonic-gate 3067c478bd9Sstevel@tonic-gate /* 3077c478bd9Sstevel@tonic-gate * general optimization: 3087c478bd9Sstevel@tonic-gate * 3097c478bd9Sstevel@tonic-gate * if i and input_len are the same, return now instead 3107c478bd9Sstevel@tonic-gate * of calling bcopy(), since the bcopy() in this case 3117c478bd9Sstevel@tonic-gate * will be an expensive nop. 3127c478bd9Sstevel@tonic-gate */ 3137c478bd9Sstevel@tonic-gate 3147c478bd9Sstevel@tonic-gate if (input_len == i) 3157c478bd9Sstevel@tonic-gate return; 3167c478bd9Sstevel@tonic-gate 3177c478bd9Sstevel@tonic-gate buf_index = 0; 3187c478bd9Sstevel@tonic-gate } 3197c478bd9Sstevel@tonic-gate 3207c478bd9Sstevel@tonic-gate /* buffer remaining input */ 3217c478bd9Sstevel@tonic-gate bcopy(&input[i], &ctx->buf_un.buf8[buf_index], input_len - i); 3227c478bd9Sstevel@tonic-gate } 3237c478bd9Sstevel@tonic-gate 3247c478bd9Sstevel@tonic-gate #else /* VIS_SHA1 */ 3257c478bd9Sstevel@tonic-gate 3267c478bd9Sstevel@tonic-gate void 327734b6a94Sdarrenm SHA1Update(SHA1_CTX *ctx, const void *inptr, size_t input_len) 3287c478bd9Sstevel@tonic-gate { 3297c478bd9Sstevel@tonic-gate uint32_t i, buf_index, buf_len; 330734b6a94Sdarrenm const uint8_t *input = inptr; 331321502cdSda73024 #if defined(__amd64) 332321502cdSda73024 uint32_t block_count; 333321502cdSda73024 #endif /* __amd64 */ 3347c478bd9Sstevel@tonic-gate 3357c478bd9Sstevel@tonic-gate /* check for noop */ 3367c478bd9Sstevel@tonic-gate if (input_len == 0) 3377c478bd9Sstevel@tonic-gate return; 3387c478bd9Sstevel@tonic-gate 3397c478bd9Sstevel@tonic-gate /* compute number of bytes mod 64 */ 3407c478bd9Sstevel@tonic-gate buf_index = (ctx->count[1] >> 3) & 0x3F; 3417c478bd9Sstevel@tonic-gate 3427c478bd9Sstevel@tonic-gate /* update number of bits */ 3437c478bd9Sstevel@tonic-gate if ((ctx->count[1] += (input_len << 3)) < (input_len << 3)) 3447c478bd9Sstevel@tonic-gate ctx->count[0]++; 3457c478bd9Sstevel@tonic-gate 3467c478bd9Sstevel@tonic-gate ctx->count[0] += (input_len >> 29); 3477c478bd9Sstevel@tonic-gate 3487c478bd9Sstevel@tonic-gate buf_len = 64 - buf_index; 3497c478bd9Sstevel@tonic-gate 3507c478bd9Sstevel@tonic-gate /* transform as many times as possible */ 3517c478bd9Sstevel@tonic-gate i = 0; 3527c478bd9Sstevel@tonic-gate if (input_len >= buf_len) { 3537c478bd9Sstevel@tonic-gate 3547c478bd9Sstevel@tonic-gate /* 3557c478bd9Sstevel@tonic-gate * general optimization: 3567c478bd9Sstevel@tonic-gate * 3577c478bd9Sstevel@tonic-gate * only do initial bcopy() and SHA1Transform() if 3587c478bd9Sstevel@tonic-gate * buf_index != 0. if buf_index == 0, we're just 3597c478bd9Sstevel@tonic-gate * wasting our time doing the bcopy() since there 3607c478bd9Sstevel@tonic-gate * wasn't any data left over from a previous call to 3617c478bd9Sstevel@tonic-gate * SHA1Update(). 3627c478bd9Sstevel@tonic-gate */ 3637c478bd9Sstevel@tonic-gate 3647c478bd9Sstevel@tonic-gate if (buf_index) { 3657c478bd9Sstevel@tonic-gate bcopy(input, &ctx->buf_un.buf8[buf_index], buf_len); 366734b6a94Sdarrenm SHA1_TRANSFORM(ctx, ctx->buf_un.buf8); 3677c478bd9Sstevel@tonic-gate i = buf_len; 3687c478bd9Sstevel@tonic-gate } 3697c478bd9Sstevel@tonic-gate 370321502cdSda73024 #if !defined(__amd64) 3717c478bd9Sstevel@tonic-gate for (; i + 63 < input_len; i += 64) 372734b6a94Sdarrenm SHA1_TRANSFORM(ctx, &input[i]); 373321502cdSda73024 #else 374321502cdSda73024 block_count = (input_len - i) >> 6; 375321502cdSda73024 if (block_count > 0) { 376321502cdSda73024 SHA1_TRANSFORM_BLOCKS(ctx, &input[i], block_count); 377321502cdSda73024 i += block_count << 6; 378321502cdSda73024 } 379321502cdSda73024 #endif /* !__amd64 */ 3807c478bd9Sstevel@tonic-gate 3817c478bd9Sstevel@tonic-gate /* 3827c478bd9Sstevel@tonic-gate * general optimization: 3837c478bd9Sstevel@tonic-gate * 3847c478bd9Sstevel@tonic-gate * if i and input_len are the same, return now instead 3857c478bd9Sstevel@tonic-gate * of calling bcopy(), since the bcopy() in this case 3867c478bd9Sstevel@tonic-gate * will be an expensive nop. 3877c478bd9Sstevel@tonic-gate */ 3887c478bd9Sstevel@tonic-gate 3897c478bd9Sstevel@tonic-gate if (input_len == i) 3907c478bd9Sstevel@tonic-gate return; 3917c478bd9Sstevel@tonic-gate 3927c478bd9Sstevel@tonic-gate buf_index = 0; 3937c478bd9Sstevel@tonic-gate } 3947c478bd9Sstevel@tonic-gate 3957c478bd9Sstevel@tonic-gate /* buffer remaining input */ 3967c478bd9Sstevel@tonic-gate bcopy(&input[i], &ctx->buf_un.buf8[buf_index], input_len - i); 3977c478bd9Sstevel@tonic-gate } 3987c478bd9Sstevel@tonic-gate 3997c478bd9Sstevel@tonic-gate #endif /* VIS_SHA1 */ 4007c478bd9Sstevel@tonic-gate 4017c478bd9Sstevel@tonic-gate /* 4027c478bd9Sstevel@tonic-gate * SHA1Final() 4037c478bd9Sstevel@tonic-gate * 4047c478bd9Sstevel@tonic-gate * purpose: ends an sha1 digest operation, finalizing the message digest and 4057c478bd9Sstevel@tonic-gate * zeroing the context. 406321502cdSda73024 * input: uchar_t * : A buffer to store the digest. 4075151fb12Sdarrenm * : The function actually uses void* because many 4085151fb12Sdarrenm * : callers pass things other than uchar_t here. 4097c478bd9Sstevel@tonic-gate * SHA1_CTX * : the context to finalize, save, and zero 4107c478bd9Sstevel@tonic-gate * output: void 4117c478bd9Sstevel@tonic-gate */ 4127c478bd9Sstevel@tonic-gate 4137c478bd9Sstevel@tonic-gate void 414734b6a94Sdarrenm SHA1Final(void *digest, SHA1_CTX *ctx) 4157c478bd9Sstevel@tonic-gate { 4167c478bd9Sstevel@tonic-gate uint8_t bitcount_be[sizeof (ctx->count)]; 4177c478bd9Sstevel@tonic-gate uint32_t index = (ctx->count[1] >> 3) & 0x3f; 4187c478bd9Sstevel@tonic-gate 4197c478bd9Sstevel@tonic-gate /* store bit count, big endian */ 4207c478bd9Sstevel@tonic-gate Encode(bitcount_be, ctx->count, sizeof (bitcount_be)); 4217c478bd9Sstevel@tonic-gate 4227c478bd9Sstevel@tonic-gate /* pad out to 56 mod 64 */ 4237c478bd9Sstevel@tonic-gate SHA1Update(ctx, PADDING, ((index < 56) ? 56 : 120) - index); 4247c478bd9Sstevel@tonic-gate 4257c478bd9Sstevel@tonic-gate /* append length (before padding) */ 4267c478bd9Sstevel@tonic-gate SHA1Update(ctx, bitcount_be, sizeof (bitcount_be)); 4277c478bd9Sstevel@tonic-gate 4287c478bd9Sstevel@tonic-gate /* store state in digest */ 4297c478bd9Sstevel@tonic-gate Encode(digest, ctx->state, sizeof (ctx->state)); 430673007c6Sdarrenm 431673007c6Sdarrenm /* zeroize sensitive information */ 432673007c6Sdarrenm bzero(ctx, sizeof (*ctx)); 4337c478bd9Sstevel@tonic-gate } 4347c478bd9Sstevel@tonic-gate 435321502cdSda73024 436321502cdSda73024 #if !defined(__amd64) 437321502cdSda73024 438734b6a94Sdarrenm typedef uint32_t sha1word; 439734b6a94Sdarrenm 4407c478bd9Sstevel@tonic-gate /* 4417c478bd9Sstevel@tonic-gate * sparc optimization: 4427c478bd9Sstevel@tonic-gate * 4437c478bd9Sstevel@tonic-gate * on the sparc, we can load big endian 32-bit data easily. note that 4447c478bd9Sstevel@tonic-gate * special care must be taken to ensure the address is 32-bit aligned. 4457c478bd9Sstevel@tonic-gate * in the interest of speed, we don't check to make sure, since 4467c478bd9Sstevel@tonic-gate * careful programming can guarantee this for us. 4477c478bd9Sstevel@tonic-gate */ 4487c478bd9Sstevel@tonic-gate 4497c478bd9Sstevel@tonic-gate #if defined(_BIG_ENDIAN) 4507c478bd9Sstevel@tonic-gate #define LOAD_BIG_32(addr) (*(uint32_t *)(addr)) 4517c478bd9Sstevel@tonic-gate 452*4b56a003SDaniel Anderson #elif defined(HAVE_HTONL) 453*4b56a003SDaniel Anderson #define LOAD_BIG_32(addr) htonl(*((uint32_t *)(addr))) 4547c478bd9Sstevel@tonic-gate 455*4b56a003SDaniel Anderson #else 456734b6a94Sdarrenm /* little endian -- will work on big endian, but slowly */ 4577c478bd9Sstevel@tonic-gate #define LOAD_BIG_32(addr) \ 4587c478bd9Sstevel@tonic-gate (((addr)[0] << 24) | ((addr)[1] << 16) | ((addr)[2] << 8) | (addr)[3]) 459*4b56a003SDaniel Anderson #endif /* _BIG_ENDIAN */ 460734b6a94Sdarrenm 461734b6a94Sdarrenm /* 462734b6a94Sdarrenm * SHA1Transform() 463734b6a94Sdarrenm */ 464734b6a94Sdarrenm #if defined(W_ARRAY) 465734b6a94Sdarrenm #define W(n) w[n] 466734b6a94Sdarrenm #else /* !defined(W_ARRAY) */ 467734b6a94Sdarrenm #define W(n) w_ ## n 468734b6a94Sdarrenm #endif /* !defined(W_ARRAY) */ 469734b6a94Sdarrenm 470734b6a94Sdarrenm 471734b6a94Sdarrenm #if defined(__sparc) 4727c478bd9Sstevel@tonic-gate 4737c478bd9Sstevel@tonic-gate /* 4747c478bd9Sstevel@tonic-gate * sparc register window optimization: 4757c478bd9Sstevel@tonic-gate * 4767c478bd9Sstevel@tonic-gate * `a', `b', `c', `d', and `e' are passed into SHA1Transform 4777c478bd9Sstevel@tonic-gate * explicitly since it increases the number of registers available to 4787c478bd9Sstevel@tonic-gate * the compiler. under this scheme, these variables can be held in 4797c478bd9Sstevel@tonic-gate * %i0 - %i4, which leaves more local and out registers available. 4807c478bd9Sstevel@tonic-gate * 4817c478bd9Sstevel@tonic-gate * purpose: sha1 transformation -- updates the digest based on `block' 4827c478bd9Sstevel@tonic-gate * input: uint32_t : bytes 1 - 4 of the digest 4837c478bd9Sstevel@tonic-gate * uint32_t : bytes 5 - 8 of the digest 4847c478bd9Sstevel@tonic-gate * uint32_t : bytes 9 - 12 of the digest 4857c478bd9Sstevel@tonic-gate * uint32_t : bytes 12 - 16 of the digest 4867c478bd9Sstevel@tonic-gate * uint32_t : bytes 16 - 20 of the digest 4877c478bd9Sstevel@tonic-gate * SHA1_CTX * : the context to update 4887c478bd9Sstevel@tonic-gate * uint8_t [64]: the block to use to update the digest 4897c478bd9Sstevel@tonic-gate * output: void 4907c478bd9Sstevel@tonic-gate */ 4917c478bd9Sstevel@tonic-gate 4927c478bd9Sstevel@tonic-gate void 4937c478bd9Sstevel@tonic-gate SHA1Transform(uint32_t a, uint32_t b, uint32_t c, uint32_t d, uint32_t e, 4947c478bd9Sstevel@tonic-gate SHA1_CTX *ctx, const uint8_t blk[64]) 4957c478bd9Sstevel@tonic-gate { 4967c478bd9Sstevel@tonic-gate /* 4977c478bd9Sstevel@tonic-gate * sparc optimization: 4987c478bd9Sstevel@tonic-gate * 4997c478bd9Sstevel@tonic-gate * while it is somewhat counter-intuitive, on sparc, it is 5007c478bd9Sstevel@tonic-gate * more efficient to place all the constants used in this 5017c478bd9Sstevel@tonic-gate * function in an array and load the values out of the array 5027c478bd9Sstevel@tonic-gate * than to manually load the constants. this is because 5037c478bd9Sstevel@tonic-gate * setting a register to a 32-bit value takes two ops in most 5047c478bd9Sstevel@tonic-gate * cases: a `sethi' and an `or', but loading a 32-bit value 5057c478bd9Sstevel@tonic-gate * from memory only takes one `ld' (or `lduw' on v9). while 5067c478bd9Sstevel@tonic-gate * this increases memory usage, the compiler can find enough 5077c478bd9Sstevel@tonic-gate * other things to do while waiting to keep the pipeline does 5087c478bd9Sstevel@tonic-gate * not stall. additionally, it is likely that many of these 5097c478bd9Sstevel@tonic-gate * constants are cached so that later accesses do not even go 5107c478bd9Sstevel@tonic-gate * out to the bus. 5117c478bd9Sstevel@tonic-gate * 5127c478bd9Sstevel@tonic-gate * this array is declared `static' to keep the compiler from 5137c478bd9Sstevel@tonic-gate * having to bcopy() this array onto the stack frame of 5147c478bd9Sstevel@tonic-gate * SHA1Transform() each time it is called -- which is 5157c478bd9Sstevel@tonic-gate * unacceptably expensive. 5167c478bd9Sstevel@tonic-gate * 5177c478bd9Sstevel@tonic-gate * the `const' is to ensure that callers are good citizens and 5187c478bd9Sstevel@tonic-gate * do not try to munge the array. since these routines are 5197c478bd9Sstevel@tonic-gate * going to be called from inside multithreaded kernelland, 5207c478bd9Sstevel@tonic-gate * this is a good safety check. -- `sha1_consts' will end up in 5217c478bd9Sstevel@tonic-gate * .rodata. 5227c478bd9Sstevel@tonic-gate * 5237c478bd9Sstevel@tonic-gate * unfortunately, loading from an array in this manner hurts 524*4b56a003SDaniel Anderson * performance under Intel. So, there is a macro, 5257c478bd9Sstevel@tonic-gate * SHA1_CONST(), used in SHA1Transform(), that either expands to 5267c478bd9Sstevel@tonic-gate * a reference to this array, or to the actual constant, 5277c478bd9Sstevel@tonic-gate * depending on what platform this code is compiled for. 5287c478bd9Sstevel@tonic-gate */ 5297c478bd9Sstevel@tonic-gate 5307c478bd9Sstevel@tonic-gate static const uint32_t sha1_consts[] = { 531*4b56a003SDaniel Anderson SHA1_CONST_0, SHA1_CONST_1, SHA1_CONST_2, SHA1_CONST_3 5327c478bd9Sstevel@tonic-gate }; 5337c478bd9Sstevel@tonic-gate 5347c478bd9Sstevel@tonic-gate /* 5357c478bd9Sstevel@tonic-gate * general optimization: 5367c478bd9Sstevel@tonic-gate * 5377c478bd9Sstevel@tonic-gate * use individual integers instead of using an array. this is a 5387c478bd9Sstevel@tonic-gate * win, although the amount it wins by seems to vary quite a bit. 5397c478bd9Sstevel@tonic-gate */ 5407c478bd9Sstevel@tonic-gate 5417c478bd9Sstevel@tonic-gate uint32_t w_0, w_1, w_2, w_3, w_4, w_5, w_6, w_7; 5427c478bd9Sstevel@tonic-gate uint32_t w_8, w_9, w_10, w_11, w_12, w_13, w_14, w_15; 5437c478bd9Sstevel@tonic-gate 5447c478bd9Sstevel@tonic-gate /* 5457c478bd9Sstevel@tonic-gate * sparc optimization: 5467c478bd9Sstevel@tonic-gate * 5477c478bd9Sstevel@tonic-gate * if `block' is already aligned on a 4-byte boundary, use 5487c478bd9Sstevel@tonic-gate * LOAD_BIG_32() directly. otherwise, bcopy() into a 5497c478bd9Sstevel@tonic-gate * buffer that *is* aligned on a 4-byte boundary and then do 5507c478bd9Sstevel@tonic-gate * the LOAD_BIG_32() on that buffer. benchmarks have shown 5517c478bd9Sstevel@tonic-gate * that using the bcopy() is better than loading the bytes 5527c478bd9Sstevel@tonic-gate * individually and doing the endian-swap by hand. 5537c478bd9Sstevel@tonic-gate * 5547c478bd9Sstevel@tonic-gate * even though it's quite tempting to assign to do: 5557c478bd9Sstevel@tonic-gate * 5567c478bd9Sstevel@tonic-gate * blk = bcopy(ctx->buf_un.buf32, blk, sizeof (ctx->buf_un.buf32)); 5577c478bd9Sstevel@tonic-gate * 5587c478bd9Sstevel@tonic-gate * and only have one set of LOAD_BIG_32()'s, the compiler 5597c478bd9Sstevel@tonic-gate * *does not* like that, so please resist the urge. 5607c478bd9Sstevel@tonic-gate */ 5617c478bd9Sstevel@tonic-gate 5627c478bd9Sstevel@tonic-gate if ((uintptr_t)blk & 0x3) { /* not 4-byte aligned? */ 5637c478bd9Sstevel@tonic-gate bcopy(blk, ctx->buf_un.buf32, sizeof (ctx->buf_un.buf32)); 5647c478bd9Sstevel@tonic-gate w_15 = LOAD_BIG_32(ctx->buf_un.buf32 + 15); 5657c478bd9Sstevel@tonic-gate w_14 = LOAD_BIG_32(ctx->buf_un.buf32 + 14); 5667c478bd9Sstevel@tonic-gate w_13 = LOAD_BIG_32(ctx->buf_un.buf32 + 13); 5677c478bd9Sstevel@tonic-gate w_12 = LOAD_BIG_32(ctx->buf_un.buf32 + 12); 5687c478bd9Sstevel@tonic-gate w_11 = LOAD_BIG_32(ctx->buf_un.buf32 + 11); 5697c478bd9Sstevel@tonic-gate w_10 = LOAD_BIG_32(ctx->buf_un.buf32 + 10); 5707c478bd9Sstevel@tonic-gate w_9 = LOAD_BIG_32(ctx->buf_un.buf32 + 9); 5717c478bd9Sstevel@tonic-gate w_8 = LOAD_BIG_32(ctx->buf_un.buf32 + 8); 5727c478bd9Sstevel@tonic-gate w_7 = LOAD_BIG_32(ctx->buf_un.buf32 + 7); 5737c478bd9Sstevel@tonic-gate w_6 = LOAD_BIG_32(ctx->buf_un.buf32 + 6); 5747c478bd9Sstevel@tonic-gate w_5 = LOAD_BIG_32(ctx->buf_un.buf32 + 5); 5757c478bd9Sstevel@tonic-gate w_4 = LOAD_BIG_32(ctx->buf_un.buf32 + 4); 5767c478bd9Sstevel@tonic-gate w_3 = LOAD_BIG_32(ctx->buf_un.buf32 + 3); 5777c478bd9Sstevel@tonic-gate w_2 = LOAD_BIG_32(ctx->buf_un.buf32 + 2); 5787c478bd9Sstevel@tonic-gate w_1 = LOAD_BIG_32(ctx->buf_un.buf32 + 1); 5797c478bd9Sstevel@tonic-gate w_0 = LOAD_BIG_32(ctx->buf_un.buf32 + 0); 5807c478bd9Sstevel@tonic-gate } else { 5817c478bd9Sstevel@tonic-gate /*LINTED*/ 5827c478bd9Sstevel@tonic-gate w_15 = LOAD_BIG_32(blk + 60); 5837c478bd9Sstevel@tonic-gate /*LINTED*/ 5847c478bd9Sstevel@tonic-gate w_14 = LOAD_BIG_32(blk + 56); 5857c478bd9Sstevel@tonic-gate /*LINTED*/ 5867c478bd9Sstevel@tonic-gate w_13 = LOAD_BIG_32(blk + 52); 5877c478bd9Sstevel@tonic-gate /*LINTED*/ 5887c478bd9Sstevel@tonic-gate w_12 = LOAD_BIG_32(blk + 48); 5897c478bd9Sstevel@tonic-gate /*LINTED*/ 5907c478bd9Sstevel@tonic-gate w_11 = LOAD_BIG_32(blk + 44); 5917c478bd9Sstevel@tonic-gate /*LINTED*/ 5927c478bd9Sstevel@tonic-gate w_10 = LOAD_BIG_32(blk + 40); 5937c478bd9Sstevel@tonic-gate /*LINTED*/ 5947c478bd9Sstevel@tonic-gate w_9 = LOAD_BIG_32(blk + 36); 5957c478bd9Sstevel@tonic-gate /*LINTED*/ 5967c478bd9Sstevel@tonic-gate w_8 = LOAD_BIG_32(blk + 32); 5977c478bd9Sstevel@tonic-gate /*LINTED*/ 5987c478bd9Sstevel@tonic-gate w_7 = LOAD_BIG_32(blk + 28); 5997c478bd9Sstevel@tonic-gate /*LINTED*/ 6007c478bd9Sstevel@tonic-gate w_6 = LOAD_BIG_32(blk + 24); 6017c478bd9Sstevel@tonic-gate /*LINTED*/ 6027c478bd9Sstevel@tonic-gate w_5 = LOAD_BIG_32(blk + 20); 6037c478bd9Sstevel@tonic-gate /*LINTED*/ 6047c478bd9Sstevel@tonic-gate w_4 = LOAD_BIG_32(blk + 16); 6057c478bd9Sstevel@tonic-gate /*LINTED*/ 6067c478bd9Sstevel@tonic-gate w_3 = LOAD_BIG_32(blk + 12); 6077c478bd9Sstevel@tonic-gate /*LINTED*/ 6087c478bd9Sstevel@tonic-gate w_2 = LOAD_BIG_32(blk + 8); 6097c478bd9Sstevel@tonic-gate /*LINTED*/ 6107c478bd9Sstevel@tonic-gate w_1 = LOAD_BIG_32(blk + 4); 6117c478bd9Sstevel@tonic-gate /*LINTED*/ 6127c478bd9Sstevel@tonic-gate w_0 = LOAD_BIG_32(blk + 0); 6137c478bd9Sstevel@tonic-gate } 614734b6a94Sdarrenm #else /* !defined(__sparc) */ 615734b6a94Sdarrenm 616*4b56a003SDaniel Anderson void /* CSTYLED */ 617734b6a94Sdarrenm SHA1Transform(SHA1_CTX *ctx, const uint8_t blk[64]) 618734b6a94Sdarrenm { 619*4b56a003SDaniel Anderson /* CSTYLED */ 620734b6a94Sdarrenm sha1word a = ctx->state[0]; 621734b6a94Sdarrenm sha1word b = ctx->state[1]; 622734b6a94Sdarrenm sha1word c = ctx->state[2]; 623734b6a94Sdarrenm sha1word d = ctx->state[3]; 624734b6a94Sdarrenm sha1word e = ctx->state[4]; 625734b6a94Sdarrenm 626734b6a94Sdarrenm #if defined(W_ARRAY) 627734b6a94Sdarrenm sha1word w[16]; 628734b6a94Sdarrenm #else /* !defined(W_ARRAY) */ 629734b6a94Sdarrenm sha1word w_0, w_1, w_2, w_3, w_4, w_5, w_6, w_7; 630734b6a94Sdarrenm sha1word w_8, w_9, w_10, w_11, w_12, w_13, w_14, w_15; 631734b6a94Sdarrenm #endif /* !defined(W_ARRAY) */ 632734b6a94Sdarrenm 633734b6a94Sdarrenm W(0) = LOAD_BIG_32(blk + 0); 634734b6a94Sdarrenm W(1) = LOAD_BIG_32(blk + 4); 635734b6a94Sdarrenm W(2) = LOAD_BIG_32(blk + 8); 636734b6a94Sdarrenm W(3) = LOAD_BIG_32(blk + 12); 637734b6a94Sdarrenm W(4) = LOAD_BIG_32(blk + 16); 638734b6a94Sdarrenm W(5) = LOAD_BIG_32(blk + 20); 639734b6a94Sdarrenm W(6) = LOAD_BIG_32(blk + 24); 640734b6a94Sdarrenm W(7) = LOAD_BIG_32(blk + 28); 641734b6a94Sdarrenm W(8) = LOAD_BIG_32(blk + 32); 642734b6a94Sdarrenm W(9) = LOAD_BIG_32(blk + 36); 643734b6a94Sdarrenm W(10) = LOAD_BIG_32(blk + 40); 644734b6a94Sdarrenm W(11) = LOAD_BIG_32(blk + 44); 645734b6a94Sdarrenm W(12) = LOAD_BIG_32(blk + 48); 646734b6a94Sdarrenm W(13) = LOAD_BIG_32(blk + 52); 647734b6a94Sdarrenm W(14) = LOAD_BIG_32(blk + 56); 648734b6a94Sdarrenm W(15) = LOAD_BIG_32(blk + 60); 649734b6a94Sdarrenm 650734b6a94Sdarrenm #endif /* !defined(__sparc) */ 651734b6a94Sdarrenm 6527c478bd9Sstevel@tonic-gate /* 6537c478bd9Sstevel@tonic-gate * general optimization: 6547c478bd9Sstevel@tonic-gate * 6557c478bd9Sstevel@tonic-gate * even though this approach is described in the standard as 6567c478bd9Sstevel@tonic-gate * being slower algorithmically, it is 30-40% faster than the 6577c478bd9Sstevel@tonic-gate * "faster" version under SPARC, because this version has more 6587c478bd9Sstevel@tonic-gate * of the constraints specified at compile-time and uses fewer 6597c478bd9Sstevel@tonic-gate * variables (and therefore has better register utilization) 6607c478bd9Sstevel@tonic-gate * than its "speedier" brother. (i've tried both, trust me) 6617c478bd9Sstevel@tonic-gate * 6627c478bd9Sstevel@tonic-gate * for either method given in the spec, there is an "assignment" 6637c478bd9Sstevel@tonic-gate * phase where the following takes place: 6647c478bd9Sstevel@tonic-gate * 6657c478bd9Sstevel@tonic-gate * tmp = (main_computation); 6667c478bd9Sstevel@tonic-gate * e = d; d = c; c = rotate_left(b, 30); b = a; a = tmp; 6677c478bd9Sstevel@tonic-gate * 6687c478bd9Sstevel@tonic-gate * we can make the algorithm go faster by not doing this work, 6697c478bd9Sstevel@tonic-gate * but just pretending that `d' is now `e', etc. this works 6707c478bd9Sstevel@tonic-gate * really well and obviates the need for a temporary variable. 671321502cdSda73024 * however, we still explicitly perform the rotate action, 6727c478bd9Sstevel@tonic-gate * since it is cheaper on SPARC to do it once than to have to 6737c478bd9Sstevel@tonic-gate * do it over and over again. 6747c478bd9Sstevel@tonic-gate */ 6757c478bd9Sstevel@tonic-gate 6767c478bd9Sstevel@tonic-gate /* round 1 */ 677734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + F(b, c, d) + e + W(0) + SHA1_CONST(0); /* 0 */ 6787c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 6797c478bd9Sstevel@tonic-gate 680734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + F(a, b, c) + d + W(1) + SHA1_CONST(0); /* 1 */ 6817c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 6827c478bd9Sstevel@tonic-gate 683734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + F(e, a, b) + c + W(2) + SHA1_CONST(0); /* 2 */ 6847c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 6857c478bd9Sstevel@tonic-gate 686734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + F(d, e, a) + b + W(3) + SHA1_CONST(0); /* 3 */ 6877c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 6887c478bd9Sstevel@tonic-gate 689734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + F(c, d, e) + a + W(4) + SHA1_CONST(0); /* 4 */ 6907c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 6917c478bd9Sstevel@tonic-gate 692734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + F(b, c, d) + e + W(5) + SHA1_CONST(0); /* 5 */ 6937c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 6947c478bd9Sstevel@tonic-gate 695734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + F(a, b, c) + d + W(6) + SHA1_CONST(0); /* 6 */ 6967c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 6977c478bd9Sstevel@tonic-gate 698734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + F(e, a, b) + c + W(7) + SHA1_CONST(0); /* 7 */ 6997c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7007c478bd9Sstevel@tonic-gate 701734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + F(d, e, a) + b + W(8) + SHA1_CONST(0); /* 8 */ 7027c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7037c478bd9Sstevel@tonic-gate 704734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + F(c, d, e) + a + W(9) + SHA1_CONST(0); /* 9 */ 7057c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 7067c478bd9Sstevel@tonic-gate 707734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + F(b, c, d) + e + W(10) + SHA1_CONST(0); /* 10 */ 7087c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 7097c478bd9Sstevel@tonic-gate 710734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + F(a, b, c) + d + W(11) + SHA1_CONST(0); /* 11 */ 7117c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 7127c478bd9Sstevel@tonic-gate 713734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + F(e, a, b) + c + W(12) + SHA1_CONST(0); /* 12 */ 7147c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7157c478bd9Sstevel@tonic-gate 716734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + F(d, e, a) + b + W(13) + SHA1_CONST(0); /* 13 */ 7177c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7187c478bd9Sstevel@tonic-gate 719734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + F(c, d, e) + a + W(14) + SHA1_CONST(0); /* 14 */ 7207c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 7217c478bd9Sstevel@tonic-gate 722734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + F(b, c, d) + e + W(15) + SHA1_CONST(0); /* 15 */ 7237c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 7247c478bd9Sstevel@tonic-gate 725734b6a94Sdarrenm W(0) = ROTATE_LEFT((W(13) ^ W(8) ^ W(2) ^ W(0)), 1); /* 16 */ 726734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + F(a, b, c) + d + W(0) + SHA1_CONST(0); 7277c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 7287c478bd9Sstevel@tonic-gate 729734b6a94Sdarrenm W(1) = ROTATE_LEFT((W(14) ^ W(9) ^ W(3) ^ W(1)), 1); /* 17 */ 730734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + F(e, a, b) + c + W(1) + SHA1_CONST(0); 7317c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7327c478bd9Sstevel@tonic-gate 733734b6a94Sdarrenm W(2) = ROTATE_LEFT((W(15) ^ W(10) ^ W(4) ^ W(2)), 1); /* 18 */ 734734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + F(d, e, a) + b + W(2) + SHA1_CONST(0); 7357c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7367c478bd9Sstevel@tonic-gate 737734b6a94Sdarrenm W(3) = ROTATE_LEFT((W(0) ^ W(11) ^ W(5) ^ W(3)), 1); /* 19 */ 738734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + F(c, d, e) + a + W(3) + SHA1_CONST(0); 7397c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 7407c478bd9Sstevel@tonic-gate 7417c478bd9Sstevel@tonic-gate /* round 2 */ 742734b6a94Sdarrenm W(4) = ROTATE_LEFT((W(1) ^ W(12) ^ W(6) ^ W(4)), 1); /* 20 */ 743734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(4) + SHA1_CONST(1); 7447c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 7457c478bd9Sstevel@tonic-gate 746734b6a94Sdarrenm W(5) = ROTATE_LEFT((W(2) ^ W(13) ^ W(7) ^ W(5)), 1); /* 21 */ 747734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(5) + SHA1_CONST(1); 7487c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 7497c478bd9Sstevel@tonic-gate 750734b6a94Sdarrenm W(6) = ROTATE_LEFT((W(3) ^ W(14) ^ W(8) ^ W(6)), 1); /* 22 */ 751734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(6) + SHA1_CONST(1); 7527c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7537c478bd9Sstevel@tonic-gate 754734b6a94Sdarrenm W(7) = ROTATE_LEFT((W(4) ^ W(15) ^ W(9) ^ W(7)), 1); /* 23 */ 755734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(7) + SHA1_CONST(1); 7567c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7577c478bd9Sstevel@tonic-gate 758734b6a94Sdarrenm W(8) = ROTATE_LEFT((W(5) ^ W(0) ^ W(10) ^ W(8)), 1); /* 24 */ 759734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(8) + SHA1_CONST(1); 7607c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 7617c478bd9Sstevel@tonic-gate 762734b6a94Sdarrenm W(9) = ROTATE_LEFT((W(6) ^ W(1) ^ W(11) ^ W(9)), 1); /* 25 */ 763734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(9) + SHA1_CONST(1); 7647c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 7657c478bd9Sstevel@tonic-gate 766734b6a94Sdarrenm W(10) = ROTATE_LEFT((W(7) ^ W(2) ^ W(12) ^ W(10)), 1); /* 26 */ 767734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(10) + SHA1_CONST(1); 7687c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 7697c478bd9Sstevel@tonic-gate 770734b6a94Sdarrenm W(11) = ROTATE_LEFT((W(8) ^ W(3) ^ W(13) ^ W(11)), 1); /* 27 */ 771734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(11) + SHA1_CONST(1); 7727c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7737c478bd9Sstevel@tonic-gate 774734b6a94Sdarrenm W(12) = ROTATE_LEFT((W(9) ^ W(4) ^ W(14) ^ W(12)), 1); /* 28 */ 775734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(12) + SHA1_CONST(1); 7767c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7777c478bd9Sstevel@tonic-gate 778734b6a94Sdarrenm W(13) = ROTATE_LEFT((W(10) ^ W(5) ^ W(15) ^ W(13)), 1); /* 29 */ 779734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(13) + SHA1_CONST(1); 7807c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 7817c478bd9Sstevel@tonic-gate 782734b6a94Sdarrenm W(14) = ROTATE_LEFT((W(11) ^ W(6) ^ W(0) ^ W(14)), 1); /* 30 */ 783734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(14) + SHA1_CONST(1); 7847c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 7857c478bd9Sstevel@tonic-gate 786734b6a94Sdarrenm W(15) = ROTATE_LEFT((W(12) ^ W(7) ^ W(1) ^ W(15)), 1); /* 31 */ 787734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(15) + SHA1_CONST(1); 7887c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 7897c478bd9Sstevel@tonic-gate 790734b6a94Sdarrenm W(0) = ROTATE_LEFT((W(13) ^ W(8) ^ W(2) ^ W(0)), 1); /* 32 */ 791734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(0) + SHA1_CONST(1); 7927c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7937c478bd9Sstevel@tonic-gate 794734b6a94Sdarrenm W(1) = ROTATE_LEFT((W(14) ^ W(9) ^ W(3) ^ W(1)), 1); /* 33 */ 795734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(1) + SHA1_CONST(1); 7967c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7977c478bd9Sstevel@tonic-gate 798734b6a94Sdarrenm W(2) = ROTATE_LEFT((W(15) ^ W(10) ^ W(4) ^ W(2)), 1); /* 34 */ 799734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(2) + SHA1_CONST(1); 8007c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 8017c478bd9Sstevel@tonic-gate 802734b6a94Sdarrenm W(3) = ROTATE_LEFT((W(0) ^ W(11) ^ W(5) ^ W(3)), 1); /* 35 */ 803734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(3) + SHA1_CONST(1); 8047c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 8057c478bd9Sstevel@tonic-gate 806734b6a94Sdarrenm W(4) = ROTATE_LEFT((W(1) ^ W(12) ^ W(6) ^ W(4)), 1); /* 36 */ 807734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(4) + SHA1_CONST(1); 8087c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 8097c478bd9Sstevel@tonic-gate 810734b6a94Sdarrenm W(5) = ROTATE_LEFT((W(2) ^ W(13) ^ W(7) ^ W(5)), 1); /* 37 */ 811734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(5) + SHA1_CONST(1); 8127c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 8137c478bd9Sstevel@tonic-gate 814734b6a94Sdarrenm W(6) = ROTATE_LEFT((W(3) ^ W(14) ^ W(8) ^ W(6)), 1); /* 38 */ 815734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(6) + SHA1_CONST(1); 8167c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 8177c478bd9Sstevel@tonic-gate 818734b6a94Sdarrenm W(7) = ROTATE_LEFT((W(4) ^ W(15) ^ W(9) ^ W(7)), 1); /* 39 */ 819734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(7) + SHA1_CONST(1); 8207c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 8217c478bd9Sstevel@tonic-gate 8227c478bd9Sstevel@tonic-gate /* round 3 */ 823734b6a94Sdarrenm W(8) = ROTATE_LEFT((W(5) ^ W(0) ^ W(10) ^ W(8)), 1); /* 40 */ 824734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + H(b, c, d) + e + W(8) + SHA1_CONST(2); 8257c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 8267c478bd9Sstevel@tonic-gate 827734b6a94Sdarrenm W(9) = ROTATE_LEFT((W(6) ^ W(1) ^ W(11) ^ W(9)), 1); /* 41 */ 828734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + H(a, b, c) + d + W(9) + SHA1_CONST(2); 8297c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 8307c478bd9Sstevel@tonic-gate 831734b6a94Sdarrenm W(10) = ROTATE_LEFT((W(7) ^ W(2) ^ W(12) ^ W(10)), 1); /* 42 */ 832734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + H(e, a, b) + c + W(10) + SHA1_CONST(2); 8337c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 8347c478bd9Sstevel@tonic-gate 835734b6a94Sdarrenm W(11) = ROTATE_LEFT((W(8) ^ W(3) ^ W(13) ^ W(11)), 1); /* 43 */ 836734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + H(d, e, a) + b + W(11) + SHA1_CONST(2); 8377c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 8387c478bd9Sstevel@tonic-gate 839734b6a94Sdarrenm W(12) = ROTATE_LEFT((W(9) ^ W(4) ^ W(14) ^ W(12)), 1); /* 44 */ 840734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + H(c, d, e) + a + W(12) + SHA1_CONST(2); 8417c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 8427c478bd9Sstevel@tonic-gate 843734b6a94Sdarrenm W(13) = ROTATE_LEFT((W(10) ^ W(5) ^ W(15) ^ W(13)), 1); /* 45 */ 844734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + H(b, c, d) + e + W(13) + SHA1_CONST(2); 8457c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 8467c478bd9Sstevel@tonic-gate 847734b6a94Sdarrenm W(14) = ROTATE_LEFT((W(11) ^ W(6) ^ W(0) ^ W(14)), 1); /* 46 */ 848734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + H(a, b, c) + d + W(14) + SHA1_CONST(2); 8497c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 8507c478bd9Sstevel@tonic-gate 851734b6a94Sdarrenm W(15) = ROTATE_LEFT((W(12) ^ W(7) ^ W(1) ^ W(15)), 1); /* 47 */ 852734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + H(e, a, b) + c + W(15) + SHA1_CONST(2); 8537c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 8547c478bd9Sstevel@tonic-gate 855734b6a94Sdarrenm W(0) = ROTATE_LEFT((W(13) ^ W(8) ^ W(2) ^ W(0)), 1); /* 48 */ 856734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + H(d, e, a) + b + W(0) + SHA1_CONST(2); 8577c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 8587c478bd9Sstevel@tonic-gate 859734b6a94Sdarrenm W(1) = ROTATE_LEFT((W(14) ^ W(9) ^ W(3) ^ W(1)), 1); /* 49 */ 860734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + H(c, d, e) + a + W(1) + SHA1_CONST(2); 8617c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 8627c478bd9Sstevel@tonic-gate 863734b6a94Sdarrenm W(2) = ROTATE_LEFT((W(15) ^ W(10) ^ W(4) ^ W(2)), 1); /* 50 */ 864734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + H(b, c, d) + e + W(2) + SHA1_CONST(2); 8657c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 8667c478bd9Sstevel@tonic-gate 867734b6a94Sdarrenm W(3) = ROTATE_LEFT((W(0) ^ W(11) ^ W(5) ^ W(3)), 1); /* 51 */ 868734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + H(a, b, c) + d + W(3) + SHA1_CONST(2); 8697c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 8707c478bd9Sstevel@tonic-gate 871734b6a94Sdarrenm W(4) = ROTATE_LEFT((W(1) ^ W(12) ^ W(6) ^ W(4)), 1); /* 52 */ 872734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + H(e, a, b) + c + W(4) + SHA1_CONST(2); 8737c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 8747c478bd9Sstevel@tonic-gate 875734b6a94Sdarrenm W(5) = ROTATE_LEFT((W(2) ^ W(13) ^ W(7) ^ W(5)), 1); /* 53 */ 876734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + H(d, e, a) + b + W(5) + SHA1_CONST(2); 8777c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 8787c478bd9Sstevel@tonic-gate 879734b6a94Sdarrenm W(6) = ROTATE_LEFT((W(3) ^ W(14) ^ W(8) ^ W(6)), 1); /* 54 */ 880734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + H(c, d, e) + a + W(6) + SHA1_CONST(2); 8817c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 8827c478bd9Sstevel@tonic-gate 883734b6a94Sdarrenm W(7) = ROTATE_LEFT((W(4) ^ W(15) ^ W(9) ^ W(7)), 1); /* 55 */ 884734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + H(b, c, d) + e + W(7) + SHA1_CONST(2); 8857c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 8867c478bd9Sstevel@tonic-gate 887734b6a94Sdarrenm W(8) = ROTATE_LEFT((W(5) ^ W(0) ^ W(10) ^ W(8)), 1); /* 56 */ 888734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + H(a, b, c) + d + W(8) + SHA1_CONST(2); 8897c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 8907c478bd9Sstevel@tonic-gate 891734b6a94Sdarrenm W(9) = ROTATE_LEFT((W(6) ^ W(1) ^ W(11) ^ W(9)), 1); /* 57 */ 892734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + H(e, a, b) + c + W(9) + SHA1_CONST(2); 8937c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 8947c478bd9Sstevel@tonic-gate 895734b6a94Sdarrenm W(10) = ROTATE_LEFT((W(7) ^ W(2) ^ W(12) ^ W(10)), 1); /* 58 */ 896734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + H(d, e, a) + b + W(10) + SHA1_CONST(2); 8977c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 8987c478bd9Sstevel@tonic-gate 899734b6a94Sdarrenm W(11) = ROTATE_LEFT((W(8) ^ W(3) ^ W(13) ^ W(11)), 1); /* 59 */ 900734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + H(c, d, e) + a + W(11) + SHA1_CONST(2); 9017c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 9027c478bd9Sstevel@tonic-gate 9037c478bd9Sstevel@tonic-gate /* round 4 */ 904734b6a94Sdarrenm W(12) = ROTATE_LEFT((W(9) ^ W(4) ^ W(14) ^ W(12)), 1); /* 60 */ 905734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(12) + SHA1_CONST(3); 9067c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 9077c478bd9Sstevel@tonic-gate 908734b6a94Sdarrenm W(13) = ROTATE_LEFT((W(10) ^ W(5) ^ W(15) ^ W(13)), 1); /* 61 */ 909734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(13) + SHA1_CONST(3); 9107c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 9117c478bd9Sstevel@tonic-gate 912734b6a94Sdarrenm W(14) = ROTATE_LEFT((W(11) ^ W(6) ^ W(0) ^ W(14)), 1); /* 62 */ 913734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(14) + SHA1_CONST(3); 9147c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 9157c478bd9Sstevel@tonic-gate 916734b6a94Sdarrenm W(15) = ROTATE_LEFT((W(12) ^ W(7) ^ W(1) ^ W(15)), 1); /* 63 */ 917734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(15) + SHA1_CONST(3); 9187c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 9197c478bd9Sstevel@tonic-gate 920734b6a94Sdarrenm W(0) = ROTATE_LEFT((W(13) ^ W(8) ^ W(2) ^ W(0)), 1); /* 64 */ 921734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(0) + SHA1_CONST(3); 9227c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 9237c478bd9Sstevel@tonic-gate 924734b6a94Sdarrenm W(1) = ROTATE_LEFT((W(14) ^ W(9) ^ W(3) ^ W(1)), 1); /* 65 */ 925734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(1) + SHA1_CONST(3); 9267c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 9277c478bd9Sstevel@tonic-gate 928734b6a94Sdarrenm W(2) = ROTATE_LEFT((W(15) ^ W(10) ^ W(4) ^ W(2)), 1); /* 66 */ 929734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(2) + SHA1_CONST(3); 9307c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 9317c478bd9Sstevel@tonic-gate 932734b6a94Sdarrenm W(3) = ROTATE_LEFT((W(0) ^ W(11) ^ W(5) ^ W(3)), 1); /* 67 */ 933734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(3) + SHA1_CONST(3); 9347c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 9357c478bd9Sstevel@tonic-gate 936734b6a94Sdarrenm W(4) = ROTATE_LEFT((W(1) ^ W(12) ^ W(6) ^ W(4)), 1); /* 68 */ 937734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(4) + SHA1_CONST(3); 9387c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 9397c478bd9Sstevel@tonic-gate 940734b6a94Sdarrenm W(5) = ROTATE_LEFT((W(2) ^ W(13) ^ W(7) ^ W(5)), 1); /* 69 */ 941734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(5) + SHA1_CONST(3); 9427c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 9437c478bd9Sstevel@tonic-gate 944734b6a94Sdarrenm W(6) = ROTATE_LEFT((W(3) ^ W(14) ^ W(8) ^ W(6)), 1); /* 70 */ 945734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(6) + SHA1_CONST(3); 9467c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 9477c478bd9Sstevel@tonic-gate 948734b6a94Sdarrenm W(7) = ROTATE_LEFT((W(4) ^ W(15) ^ W(9) ^ W(7)), 1); /* 71 */ 949734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(7) + SHA1_CONST(3); 9507c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 9517c478bd9Sstevel@tonic-gate 952734b6a94Sdarrenm W(8) = ROTATE_LEFT((W(5) ^ W(0) ^ W(10) ^ W(8)), 1); /* 72 */ 953734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(8) + SHA1_CONST(3); 9547c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 9557c478bd9Sstevel@tonic-gate 956734b6a94Sdarrenm W(9) = ROTATE_LEFT((W(6) ^ W(1) ^ W(11) ^ W(9)), 1); /* 73 */ 957734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(9) + SHA1_CONST(3); 9587c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 9597c478bd9Sstevel@tonic-gate 960734b6a94Sdarrenm W(10) = ROTATE_LEFT((W(7) ^ W(2) ^ W(12) ^ W(10)), 1); /* 74 */ 961734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(10) + SHA1_CONST(3); 9627c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 9637c478bd9Sstevel@tonic-gate 964734b6a94Sdarrenm W(11) = ROTATE_LEFT((W(8) ^ W(3) ^ W(13) ^ W(11)), 1); /* 75 */ 965734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(11) + SHA1_CONST(3); 9667c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 9677c478bd9Sstevel@tonic-gate 968734b6a94Sdarrenm W(12) = ROTATE_LEFT((W(9) ^ W(4) ^ W(14) ^ W(12)), 1); /* 76 */ 969734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(12) + SHA1_CONST(3); 9707c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 9717c478bd9Sstevel@tonic-gate 972734b6a94Sdarrenm W(13) = ROTATE_LEFT((W(10) ^ W(5) ^ W(15) ^ W(13)), 1); /* 77 */ 973734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(13) + SHA1_CONST(3); 9747c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 9757c478bd9Sstevel@tonic-gate 976734b6a94Sdarrenm W(14) = ROTATE_LEFT((W(11) ^ W(6) ^ W(0) ^ W(14)), 1); /* 78 */ 977734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(14) + SHA1_CONST(3); 9787c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 9797c478bd9Sstevel@tonic-gate 980734b6a94Sdarrenm W(15) = ROTATE_LEFT((W(12) ^ W(7) ^ W(1) ^ W(15)), 1); /* 79 */ 9817c478bd9Sstevel@tonic-gate 982734b6a94Sdarrenm ctx->state[0] += ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(15) + 9837c478bd9Sstevel@tonic-gate SHA1_CONST(3); 9847c478bd9Sstevel@tonic-gate ctx->state[1] += b; 9857c478bd9Sstevel@tonic-gate ctx->state[2] += ROTATE_LEFT(c, 30); 9867c478bd9Sstevel@tonic-gate ctx->state[3] += d; 9877c478bd9Sstevel@tonic-gate ctx->state[4] += e; 9887c478bd9Sstevel@tonic-gate 9897c478bd9Sstevel@tonic-gate /* zeroize sensitive information */ 990734b6a94Sdarrenm W(0) = W(1) = W(2) = W(3) = W(4) = W(5) = W(6) = W(7) = W(8) = 0; 991734b6a94Sdarrenm W(9) = W(10) = W(11) = W(12) = W(13) = W(14) = W(15) = 0; 9927c478bd9Sstevel@tonic-gate } 993321502cdSda73024 #endif /* !__amd64 */ 994321502cdSda73024 9957c478bd9Sstevel@tonic-gate 9967c478bd9Sstevel@tonic-gate /* 9977c478bd9Sstevel@tonic-gate * Encode() 9987c478bd9Sstevel@tonic-gate * 9997c478bd9Sstevel@tonic-gate * purpose: to convert a list of numbers from little endian to big endian 10007c478bd9Sstevel@tonic-gate * input: uint8_t * : place to store the converted big endian numbers 10017c478bd9Sstevel@tonic-gate * uint32_t * : place to get numbers to convert from 10027c478bd9Sstevel@tonic-gate * size_t : the length of the input in bytes 10037c478bd9Sstevel@tonic-gate * output: void 10047c478bd9Sstevel@tonic-gate */ 10057c478bd9Sstevel@tonic-gate 10067c478bd9Sstevel@tonic-gate static void 1007734b6a94Sdarrenm Encode(uint8_t *_RESTRICT_KYWD output, const uint32_t *_RESTRICT_KYWD input, 1008734b6a94Sdarrenm size_t len) 10097c478bd9Sstevel@tonic-gate { 10107c478bd9Sstevel@tonic-gate size_t i, j; 10117c478bd9Sstevel@tonic-gate 10127c478bd9Sstevel@tonic-gate #if defined(__sparc) 10137c478bd9Sstevel@tonic-gate if (IS_P2ALIGNED(output, sizeof (uint32_t))) { 10147c478bd9Sstevel@tonic-gate for (i = 0, j = 0; j < len; i++, j += 4) { 10157c478bd9Sstevel@tonic-gate /* LINTED: pointer alignment */ 10167c478bd9Sstevel@tonic-gate *((uint32_t *)(output + j)) = input[i]; 10177c478bd9Sstevel@tonic-gate } 10187c478bd9Sstevel@tonic-gate } else { 10197c478bd9Sstevel@tonic-gate #endif /* little endian -- will work on big endian, but slowly */ 10207c478bd9Sstevel@tonic-gate for (i = 0, j = 0; j < len; i++, j += 4) { 10217c478bd9Sstevel@tonic-gate output[j] = (input[i] >> 24) & 0xff; 10227c478bd9Sstevel@tonic-gate output[j + 1] = (input[i] >> 16) & 0xff; 10237c478bd9Sstevel@tonic-gate output[j + 2] = (input[i] >> 8) & 0xff; 10247c478bd9Sstevel@tonic-gate output[j + 3] = input[i] & 0xff; 10257c478bd9Sstevel@tonic-gate } 10267c478bd9Sstevel@tonic-gate #if defined(__sparc) 10277c478bd9Sstevel@tonic-gate } 10287c478bd9Sstevel@tonic-gate #endif 10297c478bd9Sstevel@tonic-gate } 1030