/*
 * Copyright 2007 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
 */

#pragma ident "%Z%%M% %I% %E% SMI"

/*
 * The basic framework for this code came from the reference
 * implementation for MD5.  That implementation is Copyright (C)
 * 1991-2, RSA Data Security, Inc. Created 1991. All rights reserved.
 *
 * License to copy and use this software is granted provided that it
 * is identified as the "RSA Data Security, Inc. MD5 Message-Digest
 * Algorithm" in all material mentioning or referencing this software
 * or this function.
 *
 * License is also granted to make and use derivative works provided
 * that such works are identified as "derived from the RSA Data
 * Security, Inc. MD5 Message-Digest Algorithm" in all material
 * mentioning or referencing the derived work.
 *
 * RSA Data Security, Inc. makes no representations concerning either
 * the merchantability of this software or the suitability of this
 * software for any particular purpose. It is provided "as is"
 * without express or implied warranty of any kind.
 *
 * These notices must be retained in any copies of any part of this
 * documentation and/or software.
 *
 * NOTE: Cleaned-up and optimized version of SHA1, based on the FIPS 180-1
 * standard, available at http://www.itl.nist.gov/div897/pubs/fip180-1.htm
 * Not as fast as one would like -- further optimizations are encouraged
 * and appreciated.
 */

#include <sys/types.h>
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/sysmacros.h>
#include <sys/sha1.h>
#include <sys/sha1_consts.h>

/* userland builds additionally need the libc declarations below */
#ifndef _KERNEL
#include <strings.h>
#include <stdlib.h>
#include <errno.h>
#include <sys/systeminfo.h>
#endif	/* !_KERNEL */

/*
 * Encode() is file-local (static); it is called by SHA1Final() and its
 * definition appears elsewhere in this translation unit.
 */
static void Encode(uint8_t *, const uint32_t *, size_t);

/*
 * SHA1_TRANSFORM(ctx, in) hides the two calling conventions used for
 * SHA1Transform():
 *
 *   - on sparc the five words of ctx->state are passed as separate
 *     leading arguments, followed by the context and the input block;
 *   - everywhere else only the context and the input block are passed.
 *
 * Callers should always go through the macro rather than calling
 * SHA1Transform() directly.
 */
#if	defined(__sparc)

#define	SHA1_TRANSFORM(ctx, in) \
	SHA1Transform((ctx)->state[0], (ctx)->state[1], (ctx)->state[2], \
		(ctx)->state[3], (ctx)->state[4], (ctx), (in))

static void SHA1Transform(uint32_t, uint32_t, uint32_t, uint32_t, uint32_t,
    SHA1_CTX *, const uint8_t *);

#else

#define	SHA1_TRANSFORM(ctx, in) SHA1Transform((ctx), (in))

static void SHA1Transform(SHA1_CTX *, const uint8_t *);

#endif

717c478bd9Sstevel@tonic-gate static uint8_t PADDING[64] = { 0x80, /* all zeros */ }; 727c478bd9Sstevel@tonic-gate 737c478bd9Sstevel@tonic-gate /* 747c478bd9Sstevel@tonic-gate * F, G, and H are the basic SHA1 functions. 757c478bd9Sstevel@tonic-gate */ 767c478bd9Sstevel@tonic-gate #define F(b, c, d) (((b) & (c)) | ((~b) & (d))) 777c478bd9Sstevel@tonic-gate #define G(b, c, d) ((b) ^ (c) ^ (d)) 78734b6a94Sdarrenm #define H(b, c, d) (((b) & (c)) | (((b)|(c)) & (d))) 797c478bd9Sstevel@tonic-gate 807c478bd9Sstevel@tonic-gate /* 817c478bd9Sstevel@tonic-gate * ROTATE_LEFT rotates x left n bits. 827c478bd9Sstevel@tonic-gate */ 83734b6a94Sdarrenm 84734b6a94Sdarrenm #if defined(__GNUC__) && defined(_LP64) 85734b6a94Sdarrenm static __inline__ uint64_t 86734b6a94Sdarrenm ROTATE_LEFT(uint64_t value, uint32_t n) 87734b6a94Sdarrenm { 88734b6a94Sdarrenm uint32_t t32; 89734b6a94Sdarrenm 90734b6a94Sdarrenm t32 = (uint32_t)value; 91734b6a94Sdarrenm return ((t32 << n) | (t32 >> (32 - n))); 92734b6a94Sdarrenm } 93734b6a94Sdarrenm 94734b6a94Sdarrenm #else 95734b6a94Sdarrenm 967c478bd9Sstevel@tonic-gate #define ROTATE_LEFT(x, n) \ 977c478bd9Sstevel@tonic-gate (((x) << (n)) | ((x) >> ((sizeof (x) * NBBY)-(n)))) 987c478bd9Sstevel@tonic-gate 99734b6a94Sdarrenm #endif 1007c478bd9Sstevel@tonic-gate 101734b6a94Sdarrenm #if defined(__GNUC__) && (defined(__i386) || defined(__amd64)) 1027c478bd9Sstevel@tonic-gate 103734b6a94Sdarrenm #define HAVE_BSWAP 1047c478bd9Sstevel@tonic-gate 105734b6a94Sdarrenm extern __inline__ uint32_t bswap(uint32_t value) 1067c478bd9Sstevel@tonic-gate { 107734b6a94Sdarrenm __asm__("bswap %0" : "+r" (value)); 108734b6a94Sdarrenm return (value); 1097c478bd9Sstevel@tonic-gate } 1107c478bd9Sstevel@tonic-gate 111734b6a94Sdarrenm #endif 1127c478bd9Sstevel@tonic-gate 1137c478bd9Sstevel@tonic-gate /* 1147c478bd9Sstevel@tonic-gate * SHA1Init() 1157c478bd9Sstevel@tonic-gate * 1167c478bd9Sstevel@tonic-gate * purpose: initializes the sha1 context and begins and sha1 digest operation 
1177c478bd9Sstevel@tonic-gate * input: SHA1_CTX * : the context to initializes. 1187c478bd9Sstevel@tonic-gate * output: void 1197c478bd9Sstevel@tonic-gate */ 1207c478bd9Sstevel@tonic-gate 1217c478bd9Sstevel@tonic-gate void 1227c478bd9Sstevel@tonic-gate SHA1Init(SHA1_CTX *ctx) 1237c478bd9Sstevel@tonic-gate { 1247c478bd9Sstevel@tonic-gate ctx->count[0] = ctx->count[1] = 0; 1257c478bd9Sstevel@tonic-gate 1267c478bd9Sstevel@tonic-gate /* 1277c478bd9Sstevel@tonic-gate * load magic initialization constants. Tell lint 1287c478bd9Sstevel@tonic-gate * that these constants are unsigned by using U. 1297c478bd9Sstevel@tonic-gate */ 1307c478bd9Sstevel@tonic-gate 1317c478bd9Sstevel@tonic-gate ctx->state[0] = 0x67452301U; 1327c478bd9Sstevel@tonic-gate ctx->state[1] = 0xefcdab89U; 1337c478bd9Sstevel@tonic-gate ctx->state[2] = 0x98badcfeU; 1347c478bd9Sstevel@tonic-gate ctx->state[3] = 0x10325476U; 1357c478bd9Sstevel@tonic-gate ctx->state[4] = 0xc3d2e1f0U; 1367c478bd9Sstevel@tonic-gate } 1377c478bd9Sstevel@tonic-gate 1387c478bd9Sstevel@tonic-gate #ifdef VIS_SHA1 1397c478bd9Sstevel@tonic-gate #ifdef _KERNEL 1407c478bd9Sstevel@tonic-gate 1417c478bd9Sstevel@tonic-gate #include <sys/regset.h> 1427c478bd9Sstevel@tonic-gate #include <sys/vis.h> 14315b9cbbcSkrishna #include <sys/fpu/fpusystm.h> 1447c478bd9Sstevel@tonic-gate 1457c478bd9Sstevel@tonic-gate /* the alignment for block stores to save fp registers */ 1467c478bd9Sstevel@tonic-gate #define VIS_ALIGN (64) 1477c478bd9Sstevel@tonic-gate 1487c478bd9Sstevel@tonic-gate extern int sha1_savefp(kfpu_t *, int); 1497c478bd9Sstevel@tonic-gate extern void sha1_restorefp(kfpu_t *); 1507c478bd9Sstevel@tonic-gate 1517c478bd9Sstevel@tonic-gate uint32_t vis_sha1_svfp_threshold = 128; 1527c478bd9Sstevel@tonic-gate 1537c478bd9Sstevel@tonic-gate #endif /* _KERNEL */ 1547c478bd9Sstevel@tonic-gate 1557c478bd9Sstevel@tonic-gate /* 1567c478bd9Sstevel@tonic-gate * VIS SHA-1 consts. 
1577c478bd9Sstevel@tonic-gate */ 1587c478bd9Sstevel@tonic-gate static uint64_t VIS[] = { 1594cc1ac68Skrishna 0x8000000080000000ULL, 1604cc1ac68Skrishna 0x0002000200020002ULL, 1614cc1ac68Skrishna 0x5a8279996ed9eba1ULL, 1624cc1ac68Skrishna 0x8f1bbcdcca62c1d6ULL, 1634cc1ac68Skrishna 0x012389ab456789abULL}; 1647c478bd9Sstevel@tonic-gate 165734b6a94Sdarrenm extern void SHA1TransformVIS(uint64_t *, uint32_t *, uint32_t *, uint64_t *); 1667c478bd9Sstevel@tonic-gate 1677c478bd9Sstevel@tonic-gate 1687c478bd9Sstevel@tonic-gate /* 1697c478bd9Sstevel@tonic-gate * SHA1Update() 1707c478bd9Sstevel@tonic-gate * 1717c478bd9Sstevel@tonic-gate * purpose: continues an sha1 digest operation, using the message block 1727c478bd9Sstevel@tonic-gate * to update the context. 1737c478bd9Sstevel@tonic-gate * input: SHA1_CTX * : the context to update 174734b6a94Sdarrenm * void * : the message block 175734b6a94Sdarrenm * size_t : the length of the message block in bytes 1767c478bd9Sstevel@tonic-gate * output: void 1777c478bd9Sstevel@tonic-gate */ 1787c478bd9Sstevel@tonic-gate 1797c478bd9Sstevel@tonic-gate void 180734b6a94Sdarrenm SHA1Update(SHA1_CTX *ctx, const void *inptr, size_t input_len) 1817c478bd9Sstevel@tonic-gate { 1827c478bd9Sstevel@tonic-gate uint32_t i, buf_index, buf_len; 1837c478bd9Sstevel@tonic-gate uint64_t X0[40], input64[8]; 184734b6a94Sdarrenm const uint8_t *input = inptr; 18515b9cbbcSkrishna #ifdef _KERNEL 18615b9cbbcSkrishna int usevis = 0; 187734b6a94Sdarrenm #else 188734b6a94Sdarrenm int usevis = 1; 18915b9cbbcSkrishna #endif /* _KERNEL */ 1907c478bd9Sstevel@tonic-gate 1917c478bd9Sstevel@tonic-gate /* check for noop */ 1927c478bd9Sstevel@tonic-gate if (input_len == 0) 1937c478bd9Sstevel@tonic-gate return; 1947c478bd9Sstevel@tonic-gate 1957c478bd9Sstevel@tonic-gate /* compute number of bytes mod 64 */ 1967c478bd9Sstevel@tonic-gate buf_index = (ctx->count[1] >> 3) & 0x3F; 1977c478bd9Sstevel@tonic-gate 1987c478bd9Sstevel@tonic-gate /* update number of bits */ 
1997c478bd9Sstevel@tonic-gate if ((ctx->count[1] += (input_len << 3)) < (input_len << 3)) 2007c478bd9Sstevel@tonic-gate ctx->count[0]++; 2017c478bd9Sstevel@tonic-gate 2027c478bd9Sstevel@tonic-gate ctx->count[0] += (input_len >> 29); 2037c478bd9Sstevel@tonic-gate 2047c478bd9Sstevel@tonic-gate buf_len = 64 - buf_index; 2057c478bd9Sstevel@tonic-gate 2067c478bd9Sstevel@tonic-gate /* transform as many times as possible */ 2077c478bd9Sstevel@tonic-gate i = 0; 2087c478bd9Sstevel@tonic-gate if (input_len >= buf_len) { 2097c478bd9Sstevel@tonic-gate #ifdef _KERNEL 2107c478bd9Sstevel@tonic-gate kfpu_t *fpu; 211734b6a94Sdarrenm if (fpu_exists) { 212734b6a94Sdarrenm uint8_t fpua[sizeof (kfpu_t) + GSR_SIZE + VIS_ALIGN]; 2137c478bd9Sstevel@tonic-gate uint32_t len = (input_len + buf_index) & ~0x3f; 2147c478bd9Sstevel@tonic-gate int svfp_ok; 2157c478bd9Sstevel@tonic-gate 2167c478bd9Sstevel@tonic-gate fpu = (kfpu_t *)P2ROUNDUP((uintptr_t)fpua, 64); 2177c478bd9Sstevel@tonic-gate svfp_ok = ((len >= vis_sha1_svfp_threshold) ? 1 : 0); 21815b9cbbcSkrishna usevis = fpu_exists && sha1_savefp(fpu, svfp_ok); 219734b6a94Sdarrenm } else { 220734b6a94Sdarrenm usevis = 0; 221734b6a94Sdarrenm } 2227c478bd9Sstevel@tonic-gate #endif /* _KERNEL */ 2237c478bd9Sstevel@tonic-gate 2247c478bd9Sstevel@tonic-gate /* 2257c478bd9Sstevel@tonic-gate * general optimization: 2267c478bd9Sstevel@tonic-gate * 2277c478bd9Sstevel@tonic-gate * only do initial bcopy() and SHA1Transform() if 2287c478bd9Sstevel@tonic-gate * buf_index != 0. if buf_index == 0, we're just 2297c478bd9Sstevel@tonic-gate * wasting our time doing the bcopy() since there 2307c478bd9Sstevel@tonic-gate * wasn't any data left over from a previous call to 2317c478bd9Sstevel@tonic-gate * SHA1Update(). 
2327c478bd9Sstevel@tonic-gate */ 2337c478bd9Sstevel@tonic-gate 2347c478bd9Sstevel@tonic-gate if (buf_index) { 2357c478bd9Sstevel@tonic-gate bcopy(input, &ctx->buf_un.buf8[buf_index], buf_len); 2367c478bd9Sstevel@tonic-gate if (usevis) { 2377c478bd9Sstevel@tonic-gate SHA1TransformVIS(X0, 238734b6a94Sdarrenm ctx->buf_un.buf32, 2397c478bd9Sstevel@tonic-gate &ctx->state[0], VIS); 2407c478bd9Sstevel@tonic-gate } else { 241734b6a94Sdarrenm SHA1_TRANSFORM(ctx, ctx->buf_un.buf8); 2427c478bd9Sstevel@tonic-gate } 2437c478bd9Sstevel@tonic-gate i = buf_len; 2447c478bd9Sstevel@tonic-gate } 2457c478bd9Sstevel@tonic-gate 2467c478bd9Sstevel@tonic-gate /* 2477c478bd9Sstevel@tonic-gate * VIS SHA-1: uses the VIS 1.0 instructions to accelerate 2487c478bd9Sstevel@tonic-gate * SHA-1 processing. This is achieved by "offloading" the 2497c478bd9Sstevel@tonic-gate * computation of the message schedule (MS) to the VIS units. 2507c478bd9Sstevel@tonic-gate * This allows the VIS computation of the message schedule 2517c478bd9Sstevel@tonic-gate * to be performed in parallel with the standard integer 2527c478bd9Sstevel@tonic-gate * processing of the remainder of the SHA-1 computation. 2537c478bd9Sstevel@tonic-gate * performance by up to around 1.37X, compared to an optimized 2547c478bd9Sstevel@tonic-gate * integer-only implementation. 
2557c478bd9Sstevel@tonic-gate * 2567c478bd9Sstevel@tonic-gate * The VIS implementation of SHA1Transform has a different API 2577c478bd9Sstevel@tonic-gate * to the standard integer version: 2587c478bd9Sstevel@tonic-gate * 2597c478bd9Sstevel@tonic-gate * void SHA1TransformVIS( 2607c478bd9Sstevel@tonic-gate * uint64_t *, // Pointer to MS for ith block 261734b6a94Sdarrenm * uint32_t *, // Pointer to ith block of message data 2627c478bd9Sstevel@tonic-gate * uint32_t *, // Pointer to SHA state i.e ctx->state 2637c478bd9Sstevel@tonic-gate * uint64_t *, // Pointer to various VIS constants 2647c478bd9Sstevel@tonic-gate * ) 2657c478bd9Sstevel@tonic-gate * 2667c478bd9Sstevel@tonic-gate * Note: the message data must by 4-byte aligned. 2677c478bd9Sstevel@tonic-gate * 2687c478bd9Sstevel@tonic-gate * Function requires VIS 1.0 support. 2697c478bd9Sstevel@tonic-gate * 2707c478bd9Sstevel@tonic-gate * Handling is provided to deal with arbitrary byte alingment 2717c478bd9Sstevel@tonic-gate * of the input data but the performance gains are reduced 2727c478bd9Sstevel@tonic-gate * for alignments other than 4-bytes. 
2737c478bd9Sstevel@tonic-gate */ 2747c478bd9Sstevel@tonic-gate if (usevis) { 275734b6a94Sdarrenm if (!IS_P2ALIGNED(&input[i], sizeof (uint32_t))) { 2767c478bd9Sstevel@tonic-gate /* 2777c478bd9Sstevel@tonic-gate * Main processing loop - input misaligned 2787c478bd9Sstevel@tonic-gate */ 2797c478bd9Sstevel@tonic-gate for (; i + 63 < input_len; i += 64) { 2807c478bd9Sstevel@tonic-gate bcopy(&input[i], input64, 64); 281734b6a94Sdarrenm SHA1TransformVIS(X0, (uint32_t *)input64, 2827c478bd9Sstevel@tonic-gate &ctx->state[0], VIS); 2837c478bd9Sstevel@tonic-gate } 2847c478bd9Sstevel@tonic-gate } else { 2857c478bd9Sstevel@tonic-gate /* 2867c478bd9Sstevel@tonic-gate * Main processing loop - input 8-byte aligned 2877c478bd9Sstevel@tonic-gate */ 2887c478bd9Sstevel@tonic-gate for (; i + 63 < input_len; i += 64) { 2897c478bd9Sstevel@tonic-gate SHA1TransformVIS(X0, 290734b6a94Sdarrenm /* LINTED E_BAD_PTR_CAST_ALIGN */ 291734b6a94Sdarrenm (uint32_t *)&input[i], 2927c478bd9Sstevel@tonic-gate &ctx->state[0], VIS); 2937c478bd9Sstevel@tonic-gate } 2947c478bd9Sstevel@tonic-gate 2957c478bd9Sstevel@tonic-gate } 2967c478bd9Sstevel@tonic-gate #ifdef _KERNEL 2977c478bd9Sstevel@tonic-gate sha1_restorefp(fpu); 2987c478bd9Sstevel@tonic-gate #endif /* _KERNEL */ 2997c478bd9Sstevel@tonic-gate } else { 3007c478bd9Sstevel@tonic-gate for (; i + 63 < input_len; i += 64) { 301734b6a94Sdarrenm SHA1_TRANSFORM(ctx, &input[i]); 3027c478bd9Sstevel@tonic-gate } 3037c478bd9Sstevel@tonic-gate } 3047c478bd9Sstevel@tonic-gate 3057c478bd9Sstevel@tonic-gate /* 3067c478bd9Sstevel@tonic-gate * general optimization: 3077c478bd9Sstevel@tonic-gate * 3087c478bd9Sstevel@tonic-gate * if i and input_len are the same, return now instead 3097c478bd9Sstevel@tonic-gate * of calling bcopy(), since the bcopy() in this case 3107c478bd9Sstevel@tonic-gate * will be an expensive nop. 
3117c478bd9Sstevel@tonic-gate */ 3127c478bd9Sstevel@tonic-gate 3137c478bd9Sstevel@tonic-gate if (input_len == i) 3147c478bd9Sstevel@tonic-gate return; 3157c478bd9Sstevel@tonic-gate 3167c478bd9Sstevel@tonic-gate buf_index = 0; 3177c478bd9Sstevel@tonic-gate } 3187c478bd9Sstevel@tonic-gate 3197c478bd9Sstevel@tonic-gate /* buffer remaining input */ 3207c478bd9Sstevel@tonic-gate bcopy(&input[i], &ctx->buf_un.buf8[buf_index], input_len - i); 3217c478bd9Sstevel@tonic-gate } 3227c478bd9Sstevel@tonic-gate 3237c478bd9Sstevel@tonic-gate #else /* VIS_SHA1 */ 3247c478bd9Sstevel@tonic-gate 3257c478bd9Sstevel@tonic-gate void 326734b6a94Sdarrenm SHA1Update(SHA1_CTX *ctx, const void *inptr, size_t input_len) 3277c478bd9Sstevel@tonic-gate { 3287c478bd9Sstevel@tonic-gate uint32_t i, buf_index, buf_len; 329734b6a94Sdarrenm const uint8_t *input = inptr; 3307c478bd9Sstevel@tonic-gate 3317c478bd9Sstevel@tonic-gate /* check for noop */ 3327c478bd9Sstevel@tonic-gate if (input_len == 0) 3337c478bd9Sstevel@tonic-gate return; 3347c478bd9Sstevel@tonic-gate 3357c478bd9Sstevel@tonic-gate /* compute number of bytes mod 64 */ 3367c478bd9Sstevel@tonic-gate buf_index = (ctx->count[1] >> 3) & 0x3F; 3377c478bd9Sstevel@tonic-gate 3387c478bd9Sstevel@tonic-gate /* update number of bits */ 3397c478bd9Sstevel@tonic-gate if ((ctx->count[1] += (input_len << 3)) < (input_len << 3)) 3407c478bd9Sstevel@tonic-gate ctx->count[0]++; 3417c478bd9Sstevel@tonic-gate 3427c478bd9Sstevel@tonic-gate ctx->count[0] += (input_len >> 29); 3437c478bd9Sstevel@tonic-gate 3447c478bd9Sstevel@tonic-gate buf_len = 64 - buf_index; 3457c478bd9Sstevel@tonic-gate 3467c478bd9Sstevel@tonic-gate /* transform as many times as possible */ 3477c478bd9Sstevel@tonic-gate i = 0; 3487c478bd9Sstevel@tonic-gate if (input_len >= buf_len) { 3497c478bd9Sstevel@tonic-gate 3507c478bd9Sstevel@tonic-gate /* 3517c478bd9Sstevel@tonic-gate * general optimization: 3527c478bd9Sstevel@tonic-gate * 3537c478bd9Sstevel@tonic-gate * only do initial bcopy() and 
SHA1Transform() if 3547c478bd9Sstevel@tonic-gate * buf_index != 0. if buf_index == 0, we're just 3557c478bd9Sstevel@tonic-gate * wasting our time doing the bcopy() since there 3567c478bd9Sstevel@tonic-gate * wasn't any data left over from a previous call to 3577c478bd9Sstevel@tonic-gate * SHA1Update(). 3587c478bd9Sstevel@tonic-gate */ 3597c478bd9Sstevel@tonic-gate 3607c478bd9Sstevel@tonic-gate if (buf_index) { 3617c478bd9Sstevel@tonic-gate bcopy(input, &ctx->buf_un.buf8[buf_index], buf_len); 362734b6a94Sdarrenm SHA1_TRANSFORM(ctx, ctx->buf_un.buf8); 3637c478bd9Sstevel@tonic-gate i = buf_len; 3647c478bd9Sstevel@tonic-gate } 3657c478bd9Sstevel@tonic-gate 3667c478bd9Sstevel@tonic-gate for (; i + 63 < input_len; i += 64) 367734b6a94Sdarrenm SHA1_TRANSFORM(ctx, &input[i]); 3687c478bd9Sstevel@tonic-gate 3697c478bd9Sstevel@tonic-gate /* 3707c478bd9Sstevel@tonic-gate * general optimization: 3717c478bd9Sstevel@tonic-gate * 3727c478bd9Sstevel@tonic-gate * if i and input_len are the same, return now instead 3737c478bd9Sstevel@tonic-gate * of calling bcopy(), since the bcopy() in this case 3747c478bd9Sstevel@tonic-gate * will be an expensive nop. 
3757c478bd9Sstevel@tonic-gate */ 3767c478bd9Sstevel@tonic-gate 3777c478bd9Sstevel@tonic-gate if (input_len == i) 3787c478bd9Sstevel@tonic-gate return; 3797c478bd9Sstevel@tonic-gate 3807c478bd9Sstevel@tonic-gate buf_index = 0; 3817c478bd9Sstevel@tonic-gate } 3827c478bd9Sstevel@tonic-gate 3837c478bd9Sstevel@tonic-gate /* buffer remaining input */ 3847c478bd9Sstevel@tonic-gate bcopy(&input[i], &ctx->buf_un.buf8[buf_index], input_len - i); 3857c478bd9Sstevel@tonic-gate } 3867c478bd9Sstevel@tonic-gate 3877c478bd9Sstevel@tonic-gate #endif /* VIS_SHA1 */ 3887c478bd9Sstevel@tonic-gate 3897c478bd9Sstevel@tonic-gate /* 3907c478bd9Sstevel@tonic-gate * SHA1Final() 3917c478bd9Sstevel@tonic-gate * 3927c478bd9Sstevel@tonic-gate * purpose: ends an sha1 digest operation, finalizing the message digest and 3937c478bd9Sstevel@tonic-gate * zeroing the context. 394*5151fb12Sdarrenm * input: uchar_t * : a buffer to store the digest in 395*5151fb12Sdarrenm * : The function actually uses void* because many 396*5151fb12Sdarrenm * : callers pass things other than uchar_t here. 3977c478bd9Sstevel@tonic-gate * SHA1_CTX * : the context to finalize, save, and zero 3987c478bd9Sstevel@tonic-gate * output: void 3997c478bd9Sstevel@tonic-gate */ 4007c478bd9Sstevel@tonic-gate 4017c478bd9Sstevel@tonic-gate void 402734b6a94Sdarrenm SHA1Final(void *digest, SHA1_CTX *ctx) 4037c478bd9Sstevel@tonic-gate { 4047c478bd9Sstevel@tonic-gate uint8_t bitcount_be[sizeof (ctx->count)]; 4057c478bd9Sstevel@tonic-gate uint32_t index = (ctx->count[1] >> 3) & 0x3f; 4067c478bd9Sstevel@tonic-gate 4077c478bd9Sstevel@tonic-gate /* store bit count, big endian */ 4087c478bd9Sstevel@tonic-gate Encode(bitcount_be, ctx->count, sizeof (bitcount_be)); 4097c478bd9Sstevel@tonic-gate 4107c478bd9Sstevel@tonic-gate /* pad out to 56 mod 64 */ 4117c478bd9Sstevel@tonic-gate SHA1Update(ctx, PADDING, ((index < 56) ? 
56 : 120) - index); 4127c478bd9Sstevel@tonic-gate 4137c478bd9Sstevel@tonic-gate /* append length (before padding) */ 4147c478bd9Sstevel@tonic-gate SHA1Update(ctx, bitcount_be, sizeof (bitcount_be)); 4157c478bd9Sstevel@tonic-gate 4167c478bd9Sstevel@tonic-gate /* store state in digest */ 4177c478bd9Sstevel@tonic-gate Encode(digest, ctx->state, sizeof (ctx->state)); 418673007c6Sdarrenm 419673007c6Sdarrenm /* zeroize sensitive information */ 420673007c6Sdarrenm bzero(ctx, sizeof (*ctx)); 4217c478bd9Sstevel@tonic-gate } 4227c478bd9Sstevel@tonic-gate 423734b6a94Sdarrenm typedef uint32_t sha1word; 424734b6a94Sdarrenm 4257c478bd9Sstevel@tonic-gate /* 4267c478bd9Sstevel@tonic-gate * sparc optimization: 4277c478bd9Sstevel@tonic-gate * 4287c478bd9Sstevel@tonic-gate * on the sparc, we can load big endian 32-bit data easily. note that 4297c478bd9Sstevel@tonic-gate * special care must be taken to ensure the address is 32-bit aligned. 4307c478bd9Sstevel@tonic-gate * in the interest of speed, we don't check to make sure, since 4317c478bd9Sstevel@tonic-gate * careful programming can guarantee this for us. 
4327c478bd9Sstevel@tonic-gate */ 4337c478bd9Sstevel@tonic-gate 4347c478bd9Sstevel@tonic-gate #if defined(_BIG_ENDIAN) 4357c478bd9Sstevel@tonic-gate 4367c478bd9Sstevel@tonic-gate #define LOAD_BIG_32(addr) (*(uint32_t *)(addr)) 4377c478bd9Sstevel@tonic-gate 438734b6a94Sdarrenm #else /* !defined(_BIG_ENDIAN) */ 4397c478bd9Sstevel@tonic-gate 440734b6a94Sdarrenm #if defined(HAVE_BSWAP) 441734b6a94Sdarrenm 442734b6a94Sdarrenm #define LOAD_BIG_32(addr) bswap(*((uint32_t *)(addr))) 443734b6a94Sdarrenm 444734b6a94Sdarrenm #else /* !defined(HAVE_BSWAP) */ 445734b6a94Sdarrenm 446734b6a94Sdarrenm /* little endian -- will work on big endian, but slowly */ 4477c478bd9Sstevel@tonic-gate #define LOAD_BIG_32(addr) \ 4487c478bd9Sstevel@tonic-gate (((addr)[0] << 24) | ((addr)[1] << 16) | ((addr)[2] << 8) | (addr)[3]) 449734b6a94Sdarrenm 450734b6a94Sdarrenm #endif /* !defined(HAVE_BSWAP) */ 451734b6a94Sdarrenm 452734b6a94Sdarrenm #endif /* !defined(_BIG_ENDIAN) */ 453734b6a94Sdarrenm 454734b6a94Sdarrenm /* 455734b6a94Sdarrenm * SHA1Transform() 456734b6a94Sdarrenm */ 457734b6a94Sdarrenm #if defined(W_ARRAY) 458734b6a94Sdarrenm #define W(n) w[n] 459734b6a94Sdarrenm #else /* !defined(W_ARRAY) */ 460734b6a94Sdarrenm #define W(n) w_ ## n 461734b6a94Sdarrenm #endif /* !defined(W_ARRAY) */ 462734b6a94Sdarrenm 463734b6a94Sdarrenm 464734b6a94Sdarrenm #if defined(__sparc) 4657c478bd9Sstevel@tonic-gate 4667c478bd9Sstevel@tonic-gate /* 4677c478bd9Sstevel@tonic-gate * sparc register window optimization: 4687c478bd9Sstevel@tonic-gate * 4697c478bd9Sstevel@tonic-gate * `a', `b', `c', `d', and `e' are passed into SHA1Transform 4707c478bd9Sstevel@tonic-gate * explicitly since it increases the number of registers available to 4717c478bd9Sstevel@tonic-gate * the compiler. under this scheme, these variables can be held in 4727c478bd9Sstevel@tonic-gate * %i0 - %i4, which leaves more local and out registers available. 
4737c478bd9Sstevel@tonic-gate * 4747c478bd9Sstevel@tonic-gate * purpose: sha1 transformation -- updates the digest based on `block' 4757c478bd9Sstevel@tonic-gate * input: uint32_t : bytes 1 - 4 of the digest 4767c478bd9Sstevel@tonic-gate * uint32_t : bytes 5 - 8 of the digest 4777c478bd9Sstevel@tonic-gate * uint32_t : bytes 9 - 12 of the digest 4787c478bd9Sstevel@tonic-gate * uint32_t : bytes 12 - 16 of the digest 4797c478bd9Sstevel@tonic-gate * uint32_t : bytes 16 - 20 of the digest 4807c478bd9Sstevel@tonic-gate * SHA1_CTX * : the context to update 4817c478bd9Sstevel@tonic-gate * uint8_t [64]: the block to use to update the digest 4827c478bd9Sstevel@tonic-gate * output: void 4837c478bd9Sstevel@tonic-gate */ 4847c478bd9Sstevel@tonic-gate 4857c478bd9Sstevel@tonic-gate void 4867c478bd9Sstevel@tonic-gate SHA1Transform(uint32_t a, uint32_t b, uint32_t c, uint32_t d, uint32_t e, 4877c478bd9Sstevel@tonic-gate SHA1_CTX *ctx, const uint8_t blk[64]) 4887c478bd9Sstevel@tonic-gate { 4897c478bd9Sstevel@tonic-gate /* 4907c478bd9Sstevel@tonic-gate * sparc optimization: 4917c478bd9Sstevel@tonic-gate * 4927c478bd9Sstevel@tonic-gate * while it is somewhat counter-intuitive, on sparc, it is 4937c478bd9Sstevel@tonic-gate * more efficient to place all the constants used in this 4947c478bd9Sstevel@tonic-gate * function in an array and load the values out of the array 4957c478bd9Sstevel@tonic-gate * than to manually load the constants. this is because 4967c478bd9Sstevel@tonic-gate * setting a register to a 32-bit value takes two ops in most 4977c478bd9Sstevel@tonic-gate * cases: a `sethi' and an `or', but loading a 32-bit value 4987c478bd9Sstevel@tonic-gate * from memory only takes one `ld' (or `lduw' on v9). while 4997c478bd9Sstevel@tonic-gate * this increases memory usage, the compiler can find enough 5007c478bd9Sstevel@tonic-gate * other things to do while waiting to keep the pipeline does 5017c478bd9Sstevel@tonic-gate * not stall. 
additionally, it is likely that many of these 5027c478bd9Sstevel@tonic-gate * constants are cached so that later accesses do not even go 5037c478bd9Sstevel@tonic-gate * out to the bus. 5047c478bd9Sstevel@tonic-gate * 5057c478bd9Sstevel@tonic-gate * this array is declared `static' to keep the compiler from 5067c478bd9Sstevel@tonic-gate * having to bcopy() this array onto the stack frame of 5077c478bd9Sstevel@tonic-gate * SHA1Transform() each time it is called -- which is 5087c478bd9Sstevel@tonic-gate * unacceptably expensive. 5097c478bd9Sstevel@tonic-gate * 5107c478bd9Sstevel@tonic-gate * the `const' is to ensure that callers are good citizens and 5117c478bd9Sstevel@tonic-gate * do not try to munge the array. since these routines are 5127c478bd9Sstevel@tonic-gate * going to be called from inside multithreaded kernelland, 5137c478bd9Sstevel@tonic-gate * this is a good safety check. -- `sha1_consts' will end up in 5147c478bd9Sstevel@tonic-gate * .rodata. 5157c478bd9Sstevel@tonic-gate * 5167c478bd9Sstevel@tonic-gate * unfortunately, loading from an array in this manner hurts 5177c478bd9Sstevel@tonic-gate * performance under intel. so, there is a macro, 5187c478bd9Sstevel@tonic-gate * SHA1_CONST(), used in SHA1Transform(), that either expands to 5197c478bd9Sstevel@tonic-gate * a reference to this array, or to the actual constant, 5207c478bd9Sstevel@tonic-gate * depending on what platform this code is compiled for. 5217c478bd9Sstevel@tonic-gate */ 5227c478bd9Sstevel@tonic-gate 5237c478bd9Sstevel@tonic-gate static const uint32_t sha1_consts[] = { 5247c478bd9Sstevel@tonic-gate SHA1_CONST_0, SHA1_CONST_1, SHA1_CONST_2, SHA1_CONST_3, 5257c478bd9Sstevel@tonic-gate }; 5267c478bd9Sstevel@tonic-gate 5277c478bd9Sstevel@tonic-gate /* 5287c478bd9Sstevel@tonic-gate * general optimization: 5297c478bd9Sstevel@tonic-gate * 5307c478bd9Sstevel@tonic-gate * use individual integers instead of using an array. 
this is a 5317c478bd9Sstevel@tonic-gate * win, although the amount it wins by seems to vary quite a bit. 5327c478bd9Sstevel@tonic-gate */ 5337c478bd9Sstevel@tonic-gate 5347c478bd9Sstevel@tonic-gate uint32_t w_0, w_1, w_2, w_3, w_4, w_5, w_6, w_7; 5357c478bd9Sstevel@tonic-gate uint32_t w_8, w_9, w_10, w_11, w_12, w_13, w_14, w_15; 5367c478bd9Sstevel@tonic-gate 5377c478bd9Sstevel@tonic-gate /* 5387c478bd9Sstevel@tonic-gate * sparc optimization: 5397c478bd9Sstevel@tonic-gate * 5407c478bd9Sstevel@tonic-gate * if `block' is already aligned on a 4-byte boundary, use 5417c478bd9Sstevel@tonic-gate * LOAD_BIG_32() directly. otherwise, bcopy() into a 5427c478bd9Sstevel@tonic-gate * buffer that *is* aligned on a 4-byte boundary and then do 5437c478bd9Sstevel@tonic-gate * the LOAD_BIG_32() on that buffer. benchmarks have shown 5447c478bd9Sstevel@tonic-gate * that using the bcopy() is better than loading the bytes 5457c478bd9Sstevel@tonic-gate * individually and doing the endian-swap by hand. 5467c478bd9Sstevel@tonic-gate * 5477c478bd9Sstevel@tonic-gate * even though it's quite tempting to assign to do: 5487c478bd9Sstevel@tonic-gate * 5497c478bd9Sstevel@tonic-gate * blk = bcopy(ctx->buf_un.buf32, blk, sizeof (ctx->buf_un.buf32)); 5507c478bd9Sstevel@tonic-gate * 5517c478bd9Sstevel@tonic-gate * and only have one set of LOAD_BIG_32()'s, the compiler 5527c478bd9Sstevel@tonic-gate * *does not* like that, so please resist the urge. 5537c478bd9Sstevel@tonic-gate */ 5547c478bd9Sstevel@tonic-gate 5557c478bd9Sstevel@tonic-gate if ((uintptr_t)blk & 0x3) { /* not 4-byte aligned? 
*/ 5567c478bd9Sstevel@tonic-gate bcopy(blk, ctx->buf_un.buf32, sizeof (ctx->buf_un.buf32)); 5577c478bd9Sstevel@tonic-gate w_15 = LOAD_BIG_32(ctx->buf_un.buf32 + 15); 5587c478bd9Sstevel@tonic-gate w_14 = LOAD_BIG_32(ctx->buf_un.buf32 + 14); 5597c478bd9Sstevel@tonic-gate w_13 = LOAD_BIG_32(ctx->buf_un.buf32 + 13); 5607c478bd9Sstevel@tonic-gate w_12 = LOAD_BIG_32(ctx->buf_un.buf32 + 12); 5617c478bd9Sstevel@tonic-gate w_11 = LOAD_BIG_32(ctx->buf_un.buf32 + 11); 5627c478bd9Sstevel@tonic-gate w_10 = LOAD_BIG_32(ctx->buf_un.buf32 + 10); 5637c478bd9Sstevel@tonic-gate w_9 = LOAD_BIG_32(ctx->buf_un.buf32 + 9); 5647c478bd9Sstevel@tonic-gate w_8 = LOAD_BIG_32(ctx->buf_un.buf32 + 8); 5657c478bd9Sstevel@tonic-gate w_7 = LOAD_BIG_32(ctx->buf_un.buf32 + 7); 5667c478bd9Sstevel@tonic-gate w_6 = LOAD_BIG_32(ctx->buf_un.buf32 + 6); 5677c478bd9Sstevel@tonic-gate w_5 = LOAD_BIG_32(ctx->buf_un.buf32 + 5); 5687c478bd9Sstevel@tonic-gate w_4 = LOAD_BIG_32(ctx->buf_un.buf32 + 4); 5697c478bd9Sstevel@tonic-gate w_3 = LOAD_BIG_32(ctx->buf_un.buf32 + 3); 5707c478bd9Sstevel@tonic-gate w_2 = LOAD_BIG_32(ctx->buf_un.buf32 + 2); 5717c478bd9Sstevel@tonic-gate w_1 = LOAD_BIG_32(ctx->buf_un.buf32 + 1); 5727c478bd9Sstevel@tonic-gate w_0 = LOAD_BIG_32(ctx->buf_un.buf32 + 0); 5737c478bd9Sstevel@tonic-gate } else { 5747c478bd9Sstevel@tonic-gate /*LINTED*/ 5757c478bd9Sstevel@tonic-gate w_15 = LOAD_BIG_32(blk + 60); 5767c478bd9Sstevel@tonic-gate /*LINTED*/ 5777c478bd9Sstevel@tonic-gate w_14 = LOAD_BIG_32(blk + 56); 5787c478bd9Sstevel@tonic-gate /*LINTED*/ 5797c478bd9Sstevel@tonic-gate w_13 = LOAD_BIG_32(blk + 52); 5807c478bd9Sstevel@tonic-gate /*LINTED*/ 5817c478bd9Sstevel@tonic-gate w_12 = LOAD_BIG_32(blk + 48); 5827c478bd9Sstevel@tonic-gate /*LINTED*/ 5837c478bd9Sstevel@tonic-gate w_11 = LOAD_BIG_32(blk + 44); 5847c478bd9Sstevel@tonic-gate /*LINTED*/ 5857c478bd9Sstevel@tonic-gate w_10 = LOAD_BIG_32(blk + 40); 5867c478bd9Sstevel@tonic-gate /*LINTED*/ 5877c478bd9Sstevel@tonic-gate w_9 = LOAD_BIG_32(blk + 
36); 5887c478bd9Sstevel@tonic-gate /*LINTED*/ 5897c478bd9Sstevel@tonic-gate w_8 = LOAD_BIG_32(blk + 32); 5907c478bd9Sstevel@tonic-gate /*LINTED*/ 5917c478bd9Sstevel@tonic-gate w_7 = LOAD_BIG_32(blk + 28); 5927c478bd9Sstevel@tonic-gate /*LINTED*/ 5937c478bd9Sstevel@tonic-gate w_6 = LOAD_BIG_32(blk + 24); 5947c478bd9Sstevel@tonic-gate /*LINTED*/ 5957c478bd9Sstevel@tonic-gate w_5 = LOAD_BIG_32(blk + 20); 5967c478bd9Sstevel@tonic-gate /*LINTED*/ 5977c478bd9Sstevel@tonic-gate w_4 = LOAD_BIG_32(blk + 16); 5987c478bd9Sstevel@tonic-gate /*LINTED*/ 5997c478bd9Sstevel@tonic-gate w_3 = LOAD_BIG_32(blk + 12); 6007c478bd9Sstevel@tonic-gate /*LINTED*/ 6017c478bd9Sstevel@tonic-gate w_2 = LOAD_BIG_32(blk + 8); 6027c478bd9Sstevel@tonic-gate /*LINTED*/ 6037c478bd9Sstevel@tonic-gate w_1 = LOAD_BIG_32(blk + 4); 6047c478bd9Sstevel@tonic-gate /*LINTED*/ 6057c478bd9Sstevel@tonic-gate w_0 = LOAD_BIG_32(blk + 0); 6067c478bd9Sstevel@tonic-gate } 607734b6a94Sdarrenm #else /* !defined(__sparc) */ 608734b6a94Sdarrenm 609734b6a94Sdarrenm void 610734b6a94Sdarrenm SHA1Transform(SHA1_CTX *ctx, const uint8_t blk[64]) 611734b6a94Sdarrenm { 612734b6a94Sdarrenm sha1word a = ctx->state[0]; 613734b6a94Sdarrenm sha1word b = ctx->state[1]; 614734b6a94Sdarrenm sha1word c = ctx->state[2]; 615734b6a94Sdarrenm sha1word d = ctx->state[3]; 616734b6a94Sdarrenm sha1word e = ctx->state[4]; 617734b6a94Sdarrenm 618734b6a94Sdarrenm #if defined(W_ARRAY) 619734b6a94Sdarrenm sha1word w[16]; 620734b6a94Sdarrenm #else /* !defined(W_ARRAY) */ 621734b6a94Sdarrenm sha1word w_0, w_1, w_2, w_3, w_4, w_5, w_6, w_7; 622734b6a94Sdarrenm sha1word w_8, w_9, w_10, w_11, w_12, w_13, w_14, w_15; 623734b6a94Sdarrenm #endif /* !defined(W_ARRAY) */ 624734b6a94Sdarrenm 625734b6a94Sdarrenm W(0) = LOAD_BIG_32(blk + 0); 626734b6a94Sdarrenm W(1) = LOAD_BIG_32(blk + 4); 627734b6a94Sdarrenm W(2) = LOAD_BIG_32(blk + 8); 628734b6a94Sdarrenm W(3) = LOAD_BIG_32(blk + 12); 629734b6a94Sdarrenm W(4) = LOAD_BIG_32(blk + 16); 630734b6a94Sdarrenm W(5) = 
LOAD_BIG_32(blk + 20); 631734b6a94Sdarrenm W(6) = LOAD_BIG_32(blk + 24); 632734b6a94Sdarrenm W(7) = LOAD_BIG_32(blk + 28); 633734b6a94Sdarrenm W(8) = LOAD_BIG_32(blk + 32); 634734b6a94Sdarrenm W(9) = LOAD_BIG_32(blk + 36); 635734b6a94Sdarrenm W(10) = LOAD_BIG_32(blk + 40); 636734b6a94Sdarrenm W(11) = LOAD_BIG_32(blk + 44); 637734b6a94Sdarrenm W(12) = LOAD_BIG_32(blk + 48); 638734b6a94Sdarrenm W(13) = LOAD_BIG_32(blk + 52); 639734b6a94Sdarrenm W(14) = LOAD_BIG_32(blk + 56); 640734b6a94Sdarrenm W(15) = LOAD_BIG_32(blk + 60); 641734b6a94Sdarrenm 642734b6a94Sdarrenm #endif /* !defined(__sparc) */ 643734b6a94Sdarrenm 6447c478bd9Sstevel@tonic-gate /* 6457c478bd9Sstevel@tonic-gate * general optimization: 6467c478bd9Sstevel@tonic-gate * 6477c478bd9Sstevel@tonic-gate * even though this approach is described in the standard as 6487c478bd9Sstevel@tonic-gate * being slower algorithmically, it is 30-40% faster than the 6497c478bd9Sstevel@tonic-gate * "faster" version under SPARC, because this version has more 6507c478bd9Sstevel@tonic-gate * of the constraints specified at compile-time and uses fewer 6517c478bd9Sstevel@tonic-gate * variables (and therefore has better register utilization) 6527c478bd9Sstevel@tonic-gate * than its "speedier" brother. (i've tried both, trust me) 6537c478bd9Sstevel@tonic-gate * 6547c478bd9Sstevel@tonic-gate * for either method given in the spec, there is an "assignment" 6557c478bd9Sstevel@tonic-gate * phase where the following takes place: 6567c478bd9Sstevel@tonic-gate * 6577c478bd9Sstevel@tonic-gate * tmp = (main_computation); 6587c478bd9Sstevel@tonic-gate * e = d; d = c; c = rotate_left(b, 30); b = a; a = tmp; 6597c478bd9Sstevel@tonic-gate * 6607c478bd9Sstevel@tonic-gate * we can make the algorithm go faster by not doing this work, 6617c478bd9Sstevel@tonic-gate * but just pretending that `d' is now `e', etc. this works 6627c478bd9Sstevel@tonic-gate * really well and obviates the need for a temporary variable. 
6637c478bd9Sstevel@tonic-gate * however, we still explictly perform the rotate action, 6647c478bd9Sstevel@tonic-gate * since it is cheaper on SPARC to do it once than to have to 6657c478bd9Sstevel@tonic-gate * do it over and over again. 6667c478bd9Sstevel@tonic-gate */ 6677c478bd9Sstevel@tonic-gate 6687c478bd9Sstevel@tonic-gate /* round 1 */ 669734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + F(b, c, d) + e + W(0) + SHA1_CONST(0); /* 0 */ 6707c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 6717c478bd9Sstevel@tonic-gate 672734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + F(a, b, c) + d + W(1) + SHA1_CONST(0); /* 1 */ 6737c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 6747c478bd9Sstevel@tonic-gate 675734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + F(e, a, b) + c + W(2) + SHA1_CONST(0); /* 2 */ 6767c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 6777c478bd9Sstevel@tonic-gate 678734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + F(d, e, a) + b + W(3) + SHA1_CONST(0); /* 3 */ 6797c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 6807c478bd9Sstevel@tonic-gate 681734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + F(c, d, e) + a + W(4) + SHA1_CONST(0); /* 4 */ 6827c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 6837c478bd9Sstevel@tonic-gate 684734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + F(b, c, d) + e + W(5) + SHA1_CONST(0); /* 5 */ 6857c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 6867c478bd9Sstevel@tonic-gate 687734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + F(a, b, c) + d + W(6) + SHA1_CONST(0); /* 6 */ 6887c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 6897c478bd9Sstevel@tonic-gate 690734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + F(e, a, b) + c + W(7) + SHA1_CONST(0); /* 7 */ 6917c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 6927c478bd9Sstevel@tonic-gate 693734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + F(d, e, a) + b + W(8) + SHA1_CONST(0); /* 8 */ 6947c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 6957c478bd9Sstevel@tonic-gate 696734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + F(c, d, e) + a + W(9) + 
SHA1_CONST(0); /* 9 */ 6977c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 6987c478bd9Sstevel@tonic-gate 699734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + F(b, c, d) + e + W(10) + SHA1_CONST(0); /* 10 */ 7007c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 7017c478bd9Sstevel@tonic-gate 702734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + F(a, b, c) + d + W(11) + SHA1_CONST(0); /* 11 */ 7037c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 7047c478bd9Sstevel@tonic-gate 705734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + F(e, a, b) + c + W(12) + SHA1_CONST(0); /* 12 */ 7067c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7077c478bd9Sstevel@tonic-gate 708734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + F(d, e, a) + b + W(13) + SHA1_CONST(0); /* 13 */ 7097c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7107c478bd9Sstevel@tonic-gate 711734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + F(c, d, e) + a + W(14) + SHA1_CONST(0); /* 14 */ 7127c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 7137c478bd9Sstevel@tonic-gate 714734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + F(b, c, d) + e + W(15) + SHA1_CONST(0); /* 15 */ 7157c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 7167c478bd9Sstevel@tonic-gate 717734b6a94Sdarrenm W(0) = ROTATE_LEFT((W(13) ^ W(8) ^ W(2) ^ W(0)), 1); /* 16 */ 718734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + F(a, b, c) + d + W(0) + SHA1_CONST(0); 7197c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 7207c478bd9Sstevel@tonic-gate 721734b6a94Sdarrenm W(1) = ROTATE_LEFT((W(14) ^ W(9) ^ W(3) ^ W(1)), 1); /* 17 */ 722734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + F(e, a, b) + c + W(1) + SHA1_CONST(0); 7237c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7247c478bd9Sstevel@tonic-gate 725734b6a94Sdarrenm W(2) = ROTATE_LEFT((W(15) ^ W(10) ^ W(4) ^ W(2)), 1); /* 18 */ 726734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + F(d, e, a) + b + W(2) + SHA1_CONST(0); 7277c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7287c478bd9Sstevel@tonic-gate 729734b6a94Sdarrenm W(3) = ROTATE_LEFT((W(0) ^ W(11) ^ W(5) ^ W(3)), 1); /* 19 */ 
730734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + F(c, d, e) + a + W(3) + SHA1_CONST(0); 7317c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 7327c478bd9Sstevel@tonic-gate 7337c478bd9Sstevel@tonic-gate /* round 2 */ 734734b6a94Sdarrenm W(4) = ROTATE_LEFT((W(1) ^ W(12) ^ W(6) ^ W(4)), 1); /* 20 */ 735734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(4) + SHA1_CONST(1); 7367c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 7377c478bd9Sstevel@tonic-gate 738734b6a94Sdarrenm W(5) = ROTATE_LEFT((W(2) ^ W(13) ^ W(7) ^ W(5)), 1); /* 21 */ 739734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(5) + SHA1_CONST(1); 7407c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 7417c478bd9Sstevel@tonic-gate 742734b6a94Sdarrenm W(6) = ROTATE_LEFT((W(3) ^ W(14) ^ W(8) ^ W(6)), 1); /* 22 */ 743734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(6) + SHA1_CONST(1); 7447c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7457c478bd9Sstevel@tonic-gate 746734b6a94Sdarrenm W(7) = ROTATE_LEFT((W(4) ^ W(15) ^ W(9) ^ W(7)), 1); /* 23 */ 747734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(7) + SHA1_CONST(1); 7487c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7497c478bd9Sstevel@tonic-gate 750734b6a94Sdarrenm W(8) = ROTATE_LEFT((W(5) ^ W(0) ^ W(10) ^ W(8)), 1); /* 24 */ 751734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(8) + SHA1_CONST(1); 7527c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 7537c478bd9Sstevel@tonic-gate 754734b6a94Sdarrenm W(9) = ROTATE_LEFT((W(6) ^ W(1) ^ W(11) ^ W(9)), 1); /* 25 */ 755734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(9) + SHA1_CONST(1); 7567c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 7577c478bd9Sstevel@tonic-gate 758734b6a94Sdarrenm W(10) = ROTATE_LEFT((W(7) ^ W(2) ^ W(12) ^ W(10)), 1); /* 26 */ 759734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(10) + SHA1_CONST(1); 7607c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 7617c478bd9Sstevel@tonic-gate 762734b6a94Sdarrenm W(11) = 
ROTATE_LEFT((W(8) ^ W(3) ^ W(13) ^ W(11)), 1); /* 27 */ 763734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(11) + SHA1_CONST(1); 7647c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7657c478bd9Sstevel@tonic-gate 766734b6a94Sdarrenm W(12) = ROTATE_LEFT((W(9) ^ W(4) ^ W(14) ^ W(12)), 1); /* 28 */ 767734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(12) + SHA1_CONST(1); 7687c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7697c478bd9Sstevel@tonic-gate 770734b6a94Sdarrenm W(13) = ROTATE_LEFT((W(10) ^ W(5) ^ W(15) ^ W(13)), 1); /* 29 */ 771734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(13) + SHA1_CONST(1); 7727c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 7737c478bd9Sstevel@tonic-gate 774734b6a94Sdarrenm W(14) = ROTATE_LEFT((W(11) ^ W(6) ^ W(0) ^ W(14)), 1); /* 30 */ 775734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(14) + SHA1_CONST(1); 7767c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 7777c478bd9Sstevel@tonic-gate 778734b6a94Sdarrenm W(15) = ROTATE_LEFT((W(12) ^ W(7) ^ W(1) ^ W(15)), 1); /* 31 */ 779734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(15) + SHA1_CONST(1); 7807c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 7817c478bd9Sstevel@tonic-gate 782734b6a94Sdarrenm W(0) = ROTATE_LEFT((W(13) ^ W(8) ^ W(2) ^ W(0)), 1); /* 32 */ 783734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(0) + SHA1_CONST(1); 7847c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 7857c478bd9Sstevel@tonic-gate 786734b6a94Sdarrenm W(1) = ROTATE_LEFT((W(14) ^ W(9) ^ W(3) ^ W(1)), 1); /* 33 */ 787734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(1) + SHA1_CONST(1); 7887c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 7897c478bd9Sstevel@tonic-gate 790734b6a94Sdarrenm W(2) = ROTATE_LEFT((W(15) ^ W(10) ^ W(4) ^ W(2)), 1); /* 34 */ 791734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(2) + SHA1_CONST(1); 7927c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 7937c478bd9Sstevel@tonic-gate 
794734b6a94Sdarrenm W(3) = ROTATE_LEFT((W(0) ^ W(11) ^ W(5) ^ W(3)), 1); /* 35 */ 795734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(3) + SHA1_CONST(1); 7967c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 7977c478bd9Sstevel@tonic-gate 798734b6a94Sdarrenm W(4) = ROTATE_LEFT((W(1) ^ W(12) ^ W(6) ^ W(4)), 1); /* 36 */ 799734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(4) + SHA1_CONST(1); 8007c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 8017c478bd9Sstevel@tonic-gate 802734b6a94Sdarrenm W(5) = ROTATE_LEFT((W(2) ^ W(13) ^ W(7) ^ W(5)), 1); /* 37 */ 803734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(5) + SHA1_CONST(1); 8047c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 8057c478bd9Sstevel@tonic-gate 806734b6a94Sdarrenm W(6) = ROTATE_LEFT((W(3) ^ W(14) ^ W(8) ^ W(6)), 1); /* 38 */ 807734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(6) + SHA1_CONST(1); 8087c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 8097c478bd9Sstevel@tonic-gate 810734b6a94Sdarrenm W(7) = ROTATE_LEFT((W(4) ^ W(15) ^ W(9) ^ W(7)), 1); /* 39 */ 811734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(7) + SHA1_CONST(1); 8127c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 8137c478bd9Sstevel@tonic-gate 8147c478bd9Sstevel@tonic-gate /* round 3 */ 815734b6a94Sdarrenm W(8) = ROTATE_LEFT((W(5) ^ W(0) ^ W(10) ^ W(8)), 1); /* 40 */ 816734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + H(b, c, d) + e + W(8) + SHA1_CONST(2); 8177c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 8187c478bd9Sstevel@tonic-gate 819734b6a94Sdarrenm W(9) = ROTATE_LEFT((W(6) ^ W(1) ^ W(11) ^ W(9)), 1); /* 41 */ 820734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + H(a, b, c) + d + W(9) + SHA1_CONST(2); 8217c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 8227c478bd9Sstevel@tonic-gate 823734b6a94Sdarrenm W(10) = ROTATE_LEFT((W(7) ^ W(2) ^ W(12) ^ W(10)), 1); /* 42 */ 824734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + H(e, a, b) + c + W(10) + SHA1_CONST(2); 8257c478bd9Sstevel@tonic-gate e = 
ROTATE_LEFT(e, 30); 8267c478bd9Sstevel@tonic-gate 827734b6a94Sdarrenm W(11) = ROTATE_LEFT((W(8) ^ W(3) ^ W(13) ^ W(11)), 1); /* 43 */ 828734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + H(d, e, a) + b + W(11) + SHA1_CONST(2); 8297c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 8307c478bd9Sstevel@tonic-gate 831734b6a94Sdarrenm W(12) = ROTATE_LEFT((W(9) ^ W(4) ^ W(14) ^ W(12)), 1); /* 44 */ 832734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + H(c, d, e) + a + W(12) + SHA1_CONST(2); 8337c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 8347c478bd9Sstevel@tonic-gate 835734b6a94Sdarrenm W(13) = ROTATE_LEFT((W(10) ^ W(5) ^ W(15) ^ W(13)), 1); /* 45 */ 836734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + H(b, c, d) + e + W(13) + SHA1_CONST(2); 8377c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 8387c478bd9Sstevel@tonic-gate 839734b6a94Sdarrenm W(14) = ROTATE_LEFT((W(11) ^ W(6) ^ W(0) ^ W(14)), 1); /* 46 */ 840734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + H(a, b, c) + d + W(14) + SHA1_CONST(2); 8417c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 8427c478bd9Sstevel@tonic-gate 843734b6a94Sdarrenm W(15) = ROTATE_LEFT((W(12) ^ W(7) ^ W(1) ^ W(15)), 1); /* 47 */ 844734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + H(e, a, b) + c + W(15) + SHA1_CONST(2); 8457c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 8467c478bd9Sstevel@tonic-gate 847734b6a94Sdarrenm W(0) = ROTATE_LEFT((W(13) ^ W(8) ^ W(2) ^ W(0)), 1); /* 48 */ 848734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + H(d, e, a) + b + W(0) + SHA1_CONST(2); 8497c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 8507c478bd9Sstevel@tonic-gate 851734b6a94Sdarrenm W(1) = ROTATE_LEFT((W(14) ^ W(9) ^ W(3) ^ W(1)), 1); /* 49 */ 852734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + H(c, d, e) + a + W(1) + SHA1_CONST(2); 8537c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 8547c478bd9Sstevel@tonic-gate 855734b6a94Sdarrenm W(2) = ROTATE_LEFT((W(15) ^ W(10) ^ W(4) ^ W(2)), 1); /* 50 */ 856734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + H(b, c, d) + e + W(2) + SHA1_CONST(2); 
8577c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 8587c478bd9Sstevel@tonic-gate 859734b6a94Sdarrenm W(3) = ROTATE_LEFT((W(0) ^ W(11) ^ W(5) ^ W(3)), 1); /* 51 */ 860734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + H(a, b, c) + d + W(3) + SHA1_CONST(2); 8617c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 8627c478bd9Sstevel@tonic-gate 863734b6a94Sdarrenm W(4) = ROTATE_LEFT((W(1) ^ W(12) ^ W(6) ^ W(4)), 1); /* 52 */ 864734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + H(e, a, b) + c + W(4) + SHA1_CONST(2); 8657c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 8667c478bd9Sstevel@tonic-gate 867734b6a94Sdarrenm W(5) = ROTATE_LEFT((W(2) ^ W(13) ^ W(7) ^ W(5)), 1); /* 53 */ 868734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + H(d, e, a) + b + W(5) + SHA1_CONST(2); 8697c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 8707c478bd9Sstevel@tonic-gate 871734b6a94Sdarrenm W(6) = ROTATE_LEFT((W(3) ^ W(14) ^ W(8) ^ W(6)), 1); /* 54 */ 872734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + H(c, d, e) + a + W(6) + SHA1_CONST(2); 8737c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 8747c478bd9Sstevel@tonic-gate 875734b6a94Sdarrenm W(7) = ROTATE_LEFT((W(4) ^ W(15) ^ W(9) ^ W(7)), 1); /* 55 */ 876734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + H(b, c, d) + e + W(7) + SHA1_CONST(2); 8777c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 8787c478bd9Sstevel@tonic-gate 879734b6a94Sdarrenm W(8) = ROTATE_LEFT((W(5) ^ W(0) ^ W(10) ^ W(8)), 1); /* 56 */ 880734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + H(a, b, c) + d + W(8) + SHA1_CONST(2); 8817c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 8827c478bd9Sstevel@tonic-gate 883734b6a94Sdarrenm W(9) = ROTATE_LEFT((W(6) ^ W(1) ^ W(11) ^ W(9)), 1); /* 57 */ 884734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + H(e, a, b) + c + W(9) + SHA1_CONST(2); 8857c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 8867c478bd9Sstevel@tonic-gate 887734b6a94Sdarrenm W(10) = ROTATE_LEFT((W(7) ^ W(2) ^ W(12) ^ W(10)), 1); /* 58 */ 888734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + H(d, e, a) + b + W(10) + SHA1_CONST(2); 
8897c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 8907c478bd9Sstevel@tonic-gate 891734b6a94Sdarrenm W(11) = ROTATE_LEFT((W(8) ^ W(3) ^ W(13) ^ W(11)), 1); /* 59 */ 892734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + H(c, d, e) + a + W(11) + SHA1_CONST(2); 8937c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 8947c478bd9Sstevel@tonic-gate 8957c478bd9Sstevel@tonic-gate /* round 4 */ 896734b6a94Sdarrenm W(12) = ROTATE_LEFT((W(9) ^ W(4) ^ W(14) ^ W(12)), 1); /* 60 */ 897734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(12) + SHA1_CONST(3); 8987c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 8997c478bd9Sstevel@tonic-gate 900734b6a94Sdarrenm W(13) = ROTATE_LEFT((W(10) ^ W(5) ^ W(15) ^ W(13)), 1); /* 61 */ 901734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(13) + SHA1_CONST(3); 9027c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 9037c478bd9Sstevel@tonic-gate 904734b6a94Sdarrenm W(14) = ROTATE_LEFT((W(11) ^ W(6) ^ W(0) ^ W(14)), 1); /* 62 */ 905734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(14) + SHA1_CONST(3); 9067c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 9077c478bd9Sstevel@tonic-gate 908734b6a94Sdarrenm W(15) = ROTATE_LEFT((W(12) ^ W(7) ^ W(1) ^ W(15)), 1); /* 63 */ 909734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(15) + SHA1_CONST(3); 9107c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 9117c478bd9Sstevel@tonic-gate 912734b6a94Sdarrenm W(0) = ROTATE_LEFT((W(13) ^ W(8) ^ W(2) ^ W(0)), 1); /* 64 */ 913734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(0) + SHA1_CONST(3); 9147c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 9157c478bd9Sstevel@tonic-gate 916734b6a94Sdarrenm W(1) = ROTATE_LEFT((W(14) ^ W(9) ^ W(3) ^ W(1)), 1); /* 65 */ 917734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(1) + SHA1_CONST(3); 9187c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 9197c478bd9Sstevel@tonic-gate 920734b6a94Sdarrenm W(2) = ROTATE_LEFT((W(15) ^ W(10) ^ W(4) ^ W(2)), 1); /* 66 */ 921734b6a94Sdarrenm d = 
ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(2) + SHA1_CONST(3); 9227c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 9237c478bd9Sstevel@tonic-gate 924734b6a94Sdarrenm W(3) = ROTATE_LEFT((W(0) ^ W(11) ^ W(5) ^ W(3)), 1); /* 67 */ 925734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(3) + SHA1_CONST(3); 9267c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 9277c478bd9Sstevel@tonic-gate 928734b6a94Sdarrenm W(4) = ROTATE_LEFT((W(1) ^ W(12) ^ W(6) ^ W(4)), 1); /* 68 */ 929734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(4) + SHA1_CONST(3); 9307c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 9317c478bd9Sstevel@tonic-gate 932734b6a94Sdarrenm W(5) = ROTATE_LEFT((W(2) ^ W(13) ^ W(7) ^ W(5)), 1); /* 69 */ 933734b6a94Sdarrenm a = ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(5) + SHA1_CONST(3); 9347c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 9357c478bd9Sstevel@tonic-gate 936734b6a94Sdarrenm W(6) = ROTATE_LEFT((W(3) ^ W(14) ^ W(8) ^ W(6)), 1); /* 70 */ 937734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(6) + SHA1_CONST(3); 9387c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 9397c478bd9Sstevel@tonic-gate 940734b6a94Sdarrenm W(7) = ROTATE_LEFT((W(4) ^ W(15) ^ W(9) ^ W(7)), 1); /* 71 */ 941734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(7) + SHA1_CONST(3); 9427c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 9437c478bd9Sstevel@tonic-gate 944734b6a94Sdarrenm W(8) = ROTATE_LEFT((W(5) ^ W(0) ^ W(10) ^ W(8)), 1); /* 72 */ 945734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(8) + SHA1_CONST(3); 9467c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 9477c478bd9Sstevel@tonic-gate 948734b6a94Sdarrenm W(9) = ROTATE_LEFT((W(6) ^ W(1) ^ W(11) ^ W(9)), 1); /* 73 */ 949734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(9) + SHA1_CONST(3); 9507c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 9517c478bd9Sstevel@tonic-gate 952734b6a94Sdarrenm W(10) = ROTATE_LEFT((W(7) ^ W(2) ^ W(12) ^ W(10)), 1); /* 74 */ 953734b6a94Sdarrenm a = 
ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(10) + SHA1_CONST(3); 9547c478bd9Sstevel@tonic-gate c = ROTATE_LEFT(c, 30); 9557c478bd9Sstevel@tonic-gate 956734b6a94Sdarrenm W(11) = ROTATE_LEFT((W(8) ^ W(3) ^ W(13) ^ W(11)), 1); /* 75 */ 957734b6a94Sdarrenm e = ROTATE_LEFT(a, 5) + G(b, c, d) + e + W(11) + SHA1_CONST(3); 9587c478bd9Sstevel@tonic-gate b = ROTATE_LEFT(b, 30); 9597c478bd9Sstevel@tonic-gate 960734b6a94Sdarrenm W(12) = ROTATE_LEFT((W(9) ^ W(4) ^ W(14) ^ W(12)), 1); /* 76 */ 961734b6a94Sdarrenm d = ROTATE_LEFT(e, 5) + G(a, b, c) + d + W(12) + SHA1_CONST(3); 9627c478bd9Sstevel@tonic-gate a = ROTATE_LEFT(a, 30); 9637c478bd9Sstevel@tonic-gate 964734b6a94Sdarrenm W(13) = ROTATE_LEFT((W(10) ^ W(5) ^ W(15) ^ W(13)), 1); /* 77 */ 965734b6a94Sdarrenm c = ROTATE_LEFT(d, 5) + G(e, a, b) + c + W(13) + SHA1_CONST(3); 9667c478bd9Sstevel@tonic-gate e = ROTATE_LEFT(e, 30); 9677c478bd9Sstevel@tonic-gate 968734b6a94Sdarrenm W(14) = ROTATE_LEFT((W(11) ^ W(6) ^ W(0) ^ W(14)), 1); /* 78 */ 969734b6a94Sdarrenm b = ROTATE_LEFT(c, 5) + G(d, e, a) + b + W(14) + SHA1_CONST(3); 9707c478bd9Sstevel@tonic-gate d = ROTATE_LEFT(d, 30); 9717c478bd9Sstevel@tonic-gate 972734b6a94Sdarrenm W(15) = ROTATE_LEFT((W(12) ^ W(7) ^ W(1) ^ W(15)), 1); /* 79 */ 9737c478bd9Sstevel@tonic-gate 974734b6a94Sdarrenm ctx->state[0] += ROTATE_LEFT(b, 5) + G(c, d, e) + a + W(15) + 9757c478bd9Sstevel@tonic-gate SHA1_CONST(3); 9767c478bd9Sstevel@tonic-gate ctx->state[1] += b; 9777c478bd9Sstevel@tonic-gate ctx->state[2] += ROTATE_LEFT(c, 30); 9787c478bd9Sstevel@tonic-gate ctx->state[3] += d; 9797c478bd9Sstevel@tonic-gate ctx->state[4] += e; 9807c478bd9Sstevel@tonic-gate 9817c478bd9Sstevel@tonic-gate /* zeroize sensitive information */ 982734b6a94Sdarrenm W(0) = W(1) = W(2) = W(3) = W(4) = W(5) = W(6) = W(7) = W(8) = 0; 983734b6a94Sdarrenm W(9) = W(10) = W(11) = W(12) = W(13) = W(14) = W(15) = 0; 9847c478bd9Sstevel@tonic-gate } 9857c478bd9Sstevel@tonic-gate 9867c478bd9Sstevel@tonic-gate /* 9877c478bd9Sstevel@tonic-gate * 
/*
 * Encode()
 *
 * purpose: to serialize a list of 32-bit numbers, held in host byte order,
 *          into a big endian (most significant byte first) byte stream
 *   input: uint8_t *	: place to store the converted big endian numbers
 *          uint32_t *	: place to get numbers to convert from
 *          size_t	: the length of the input in bytes; only whole
 *			  32-bit words are converted, so when the length
 *			  is not a multiple of 4 the trailing partial
 *			  word is neither read nor written
 *  output: void
 */

static void
Encode(uint8_t *_RESTRICT_KYWD output, const uint32_t *_RESTRICT_KYWD input,
    size_t len)
{
	/*
	 * Walk whole words rather than raw bytes.  Bounding the loop by the
	 * byte count alone would, for a length that is not a multiple of
	 * sizeof (uint32_t), store up to three bytes past output + len and
	 * load one word past the end of input.
	 */
	const size_t	nwords = len / sizeof (uint32_t);
	size_t		i, j;

#if	defined(__sparc)
	if (IS_P2ALIGNED(output, sizeof (uint32_t))) {
		/*
		 * Aligned destination: store each word directly instead of
		 * splitting it into four single-byte stores.
		 */
		for (i = 0, j = 0; i < nwords; i++, j += 4) {
			/* LINTED: pointer alignment */
			*((uint32_t *)(output + j)) = input[i];
		}
	} else {
#endif	/* little endian -- will work on big endian, but slowly */
		/* portable path: emit each word most significant byte first */
		for (i = 0, j = 0; i < nwords; i++, j += 4) {
			output[j]	= (input[i] >> 24) & 0xff;
			output[j + 1]	= (input[i] >> 16) & 0xff;
			output[j + 2]	= (input[i] >>  8) & 0xff;
			output[j + 3]	= input[i] & 0xff;
		}
#if	defined(__sparc)
	}
#endif
}